diff --git a/.github/workflows/black.yml b/.github/workflows/black.yml new file mode 100644 index 000000000..96aaea347 --- /dev/null +++ b/.github/workflows/black.yml @@ -0,0 +1,24 @@ +name: Black Code Formatter + +on: [push, pull_request] + +jobs: + black: + runs-on: ubuntu-latest + + steps: + - name: Check out code + uses: actions/checkout@v4 + + - name: Set up Python + uses: actions/setup-python@v2 + with: + python-version: "3.11" + + - name: Install Black + run: | + python -m pip install --upgrade pip + pip install black + + - name: Check Black Formatting + run: black --check . diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index c42657ae2..c02c060dd 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -1,4 +1,4 @@ -name: Py 3.7 3.8, 3.9 | Windows Mac Linux +name: Py 3.8, 3.9, 3.10, 3.11 | Windows Mac Linux on: push: @@ -9,153 +9,364 @@ on: branches: - master - develop - jobs: + set-os: + runs-on: ubuntu-latest + outputs: + matrix_os: ${{ steps.set-matrix.outputs.matrix_os }} + steps: + - id: set-matrix + run: | + if [[ "${{ github.event_name }}" == "pull_request" && "${{ github.base_ref }}" == "develop" ]]; then + echo "matrix_os=[ \"ubuntu-latest\"]" >> $GITHUB_OUTPUT + else + echo "matrix_os=[\"windows-latest\", \"ubuntu-latest\", \"macos-latest\"]" >> $GITHUB_OUTPUT + fi + + check-changes: + runs-on: ubuntu-latest + outputs: + wave_io_hindcast_changed: ${{ steps.changes.outputs.wave_io_hindcast }} + should-run-hindcast: ${{ steps.hindcast-logic.outputs.should-run-hindcast }} + steps: + - name: Checkout code + uses: actions/checkout@v4 + + - name: Check for changes in wave/io/hindcast + id: changes + uses: dorny/paths-filter@v3 + with: + filters: | + wave_io_hindcast: + - 'mhkit/wave/io/hindcast/**' + - 'mhkit/tests/wave/io/hindcast/**' + + - id: hindcast-logic + run: | + if [[ "${{ github.event.pull_request.base.ref }}" == "master" || "${{ steps.changes.outputs.wave_io_hindcast }}" == "true" ]]; then + echo 
"should-run-hindcast=true" >> "$GITHUB_OUTPUT" + else + echo "should-run-hindcast=false" >> "$GITHUB_OUTPUT" + fi + + prepare-nonhindcast-cache: + runs-on: ubuntu-latest + env: + PYTHON_VER: 3.9 + steps: + - name: Checkout code + uses: actions/checkout@v4 + + - name: Setup Miniconda + uses: conda-incubator/setup-miniconda@v3 + with: + miniconda-version: 'latest' + auto-update-conda: true + python-version: ${{ env.PYTHON_VER }} + activate-environment: TESTconda + use-only-tar-bz2: true + + - name: Setup Conda environment + shell: bash -l {0} + run: | + conda install numpy cython pip hdf5 libnetcdf cftime netcdf4 --strict-channel-priority + pip install -e . --force-reinstall + + - name: Install dependencies + shell: bash -l {0} + run: | + python -m pip install --upgrade pip wheel + pip install coverage pytest coveralls . + + - name: Prepare non-hindcast API data + shell: bash -l {0} + run: | + pytest mhkit/tests/river/test_io_usgs.py + pytest mhkit/tests/tidal/test_io.py + pytest mhkit/tests/wave/io/test_cdip.py + + - name: Upload data as artifact + uses: actions/upload-artifact@v4 + with: + name: data + path: ~/.cache/mhkit + + prepare-wave-hindcast-cache: + needs: [check-changes] + runs-on: ubuntu-latest + env: + PYTHON_VER: 3.9 + if: (needs.check-changes.outputs.should-run-hindcast == 'true') + steps: + - name: Checkout code + uses: actions/checkout@v4 + + - name: Setup Miniconda + uses: conda-incubator/setup-miniconda@v3 + with: + miniconda-version: 'latest' + auto-update-conda: true + activate-environment: TEST + python-version: ${{ env.PYTHON_VER }} + use-only-tar-bz2: true + + - name: Setup Conda environment + shell: bash -l {0} + run: | + conda install numpy cython pip pytest hdf5 libnetcdf cftime netcdf4 coverage --strict-channel-priority + pip install -e . --force-reinstall + + - name: Install dependencies + shell: bash -l {0} + run: | + python -m pip install --upgrade pip wheel + pip install coverage pytest coveralls . 
+ + - name: Prepare Wave Hindcast data + shell: bash -l {0} + run: | + pytest mhkit/tests/wave/io/hindcast/test_hindcast.py + + - name: Upload Wave Hindcast data as artifact + uses: actions/upload-artifact@v4 + with: + name: wave-hindcast-data + path: ~/.cache/mhkit + + prepare-wind-hindcast-cache: + needs: [check-changes, prepare-wave-hindcast-cache] + runs-on: ubuntu-latest + env: + PYTHON_VER: 3.9 + if: (needs.check-changes.outputs.should-run-hindcast == 'true') + steps: + - name: Checkout code + uses: actions/checkout@v4 + + - name: Setup Miniconda + uses: conda-incubator/setup-miniconda@v3 + with: + miniconda-version: 'latest' + auto-update-conda: true + activate-environment: TEST + python-version: ${{ env.PYTHON_VER }} + use-only-tar-bz2: true + + - name: Setup Conda environment + shell: bash -l {0} + run: | + conda install numpy cython pip pytest hdf5 libnetcdf cftime netcdf4 coverage --strict-channel-priority + pip install -e . --no-deps --force-reinstall + + - name: Install dependencies + shell: bash -l {0} + run: | + python -m pip install --upgrade pip wheel + pip install coverage pytest coveralls . 
+ + - name: Prepare Wind Hindcast data + shell: bash -l {0} + run: | + pytest mhkit/tests/wave/io/hindcast/test_wind_toolkit.py + + - name: Upload Wind Hindcast data as artifact + uses: actions/upload-artifact@v4 + with: + name: wind-hindcast-data + path: ~/.cache/mhkit + conda-build: name: conda-${{ matrix.os }}/${{ matrix.python-version }} + needs: [set-os, prepare-nonhindcast-cache] runs-on: ${{ matrix.os }} strategy: fail-fast: false matrix: - os: ["windows-latest", "ubuntu-latest", "macos-latest"] - python-version: [3.7, 3.8, 3.9] + os: ${{fromJson(needs.set-os.outputs.matrix_os)}} + python-version: ['3.8', '3.9', '3.10', '3.11'] + env: + PYTHON_VER: ${{ matrix.python-version }} steps: - - uses: actions/checkout@v2 + - uses: actions/checkout@v4 - - name: Setup Conda - uses: s-weigand/setup-conda@v1 + - name: Setup Miniconda + uses: conda-incubator/setup-miniconda@v3 with: - activate-conda: false - conda-channels: conda-forge + miniconda-version: 'latest' + auto-update-conda: true + environment-file: environment.yml + activate-environment: TEST + python-version: ${{ matrix.python-version }} + use-only-tar-bz2: false - - name: Python ${{ matrix.python-version }} + - name: Create and setup Conda environment shell: bash -l {0} run: | - conda create --name TEST python=${{ matrix.python-version }} numpy cython pip pytest hdf5 libnetcdf cftime netcdf4 --strict-channel-priority - source activate TEST - export PATH="${CONDA_PREFIX}/bin:${CONDA_PREFIX}/Library/bin:$PATH" # so setup.py finds nc-config - pip install -e . --no-deps --force-reinstall + conda install -c conda-forge pytest coverage=7.5.0 coveralls --strict-channel-priority + pip install -e . --force-reinstall - - name: Tests - shell: bash -l {0} - run: | - source activate TEST - python -m pip install --upgrade pip wheel - pip install coverage - pip install pytest - pip install coveralls - pip install . 
+ - name: Download data from artifact + uses: actions/download-artifact@v4 + with: + name: data + path: ~/.cache/mhkit - - name: Run pytest + - name: Run pytest & generate coverage report shell: bash -l {0} run: | - source activate TEST coverage run --rcfile=.github/workflows/.coveragerc --source=./mhkit/ -m pytest -c .github/workflows/pytest.ini + coverage lcov - name: Upload coverage data to coveralls.io - shell: bash -l {0} - run: | - source activate TEST - coveralls --service=github - env: - GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }} - COVERALLS_FLAG_NAME: ${{ matrix.python-version }} - COVERALLS_PARALLEL: true + uses: coverallsapp/github-action@master + with: + github-token: ${{ secrets.GITHUB_TOKEN }} + flag-name: ${{ matrix.python-version }} + parallel: true + path-to-lcov: ./coverage.lcov pip-build: name: pip-${{ matrix.os }}/${{ matrix.python-version }} + needs: [set-os, prepare-nonhindcast-cache] runs-on: ${{ matrix.os }} strategy: fail-fast: false matrix: - os: ["windows-latest", "ubuntu-latest", "macos-latest"] - python-version: [3.8, 3.9] + os: ${{fromJson(needs.set-os.outputs.matrix_os)}} + python-version: ['3.8', '3.9', '3.10', '3.11'] steps: - - uses: conda-incubator/setup-miniconda@v2 + - uses: conda-incubator/setup-miniconda@v3 - name: Set up Python ${{ matrix.python-version }} - uses: actions/setup-python@v2 + uses: actions/setup-python@v5 with: python-version: ${{ matrix.python-version }} + - name: Install HDF5 (macOS with Python 3.8) + if: startsWith(runner.os, 'macOS') && matrix.python-version == '3.8' + run: brew install hdf5 + + - name: Install NetCDF (macOS with Python 3.8) + if: startsWith(runner.os, 'macOS') && matrix.python-version == '3.8' + run: brew install netcdf + + - name: Set environment variables (macOS with Python 3.8) + if: startsWith(runner.os, 'macOS') && matrix.python-version == '3.8' + run: | + echo "HDF5_DIR=$(brew --prefix hdf5)" >> $GITHUB_ENV + echo "NETCDF4_DIR=$(brew --prefix netcdf)" >> $GITHUB_ENV + echo 
"PKG_CONFIG_PATH=$(brew --prefix hdf5)/lib/pkgconfig:$(brew --prefix netcdf)/lib/pkgconfig:$PKG_CONFIG_PATH" >> $GITHUB_ENV + - name: Set up Git repository - uses: actions/checkout@v2 + uses: actions/checkout@v4 + + - name: Download data from artifact + uses: actions/download-artifact@v4 + with: + name: data + path: ~/.cache/mhkit - name: Update and install packages + shell: bash -l {0} run: | python -m pip install --upgrade pip wheel - pip install coverage - pip install pytest - pip install coveralls - pip install . + pip install coverage pytest coveralls . - - name: Run pytest + - name: Run pytest & generate coverage report + shell: bash -l {0} run: | - coverage run --rcfile=.github/workflows/.coveragerc --source=./mhkit/ -m pytest -c .github/workflows/pytest.ini + coverage run --rcfile=.github/workflows/.coveragerc --source=./mhkit/ -m pytest -c .github/workflows/pytest.ini + coverage lcov - name: Upload coverage data to coveralls.io - run: coveralls --service=github - env: - GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }} - COVERALLS_FLAG_NAME: ${{ matrix.python-version }} - COVERALLS_PARALLEL: true + uses: coverallsapp/github-action@master + with: + github-token: ${{ secrets.GITHUB_TOKEN }} + flag-name: ${{ matrix.python-version }} + parallel: true + path-to-lcov: ./coverage.lcov hindcast-calls: name: hindcast-${{ matrix.os }}/${{ matrix.python-version }} + needs: + [ + check-changes, + prepare-wave-hindcast-cache, + prepare-wind-hindcast-cache, + set-os, + ] + if: (needs.check-changes.outputs.should-run-hindcast == 'true') + runs-on: ${{ matrix.os }} strategy: max-parallel: 1 fail-fast: false matrix: - os: ["windows-latest", "macos-latest"] - python-version: [3.9] + os: ${{fromJson(needs.set-os.outputs.matrix_os)}} + python-version: ['3.8', '3.9', '3.10', '3.11'] steps: - - uses: actions/checkout@v2 + - uses: actions/checkout@v4 - - name: Setup Conda - uses: s-weigand/setup-conda@v1 + - name: Setup Miniconda + uses: conda-incubator/setup-miniconda@v3 with: - 
activate-conda: false - conda-channels: conda-forge + miniconda-version: 'latest' + auto-update-conda: true + environment-file: environment.yml + activate-environment: TEST + python-version: ${{ matrix.python-version }} + use-only-tar-bz2: false - - name: Python ${{ matrix.python-version }} + - name: Setup Conda environment shell: bash -l {0} run: | - conda create --name TEST python=${{ matrix.python-version }} numpy cython pip pytest hdf5 libnetcdf cftime netcdf4 coverage --strict-channel-priority - source activate TEST - export PATH="${CONDA_PREFIX}/bin:${CONDA_PREFIX}/Library/bin:$PATH" # so setup.py finds nc-config - pip install -e . --no-deps --force-reinstall + conda install -c conda-forge pytest coverage=7.5.0 coveralls --strict-channel-priority + pip install -e . --force-reinstall - - name: Install MHKiT - shell: bash -l {0} + - name: Download Wave Hindcast data from artifact + uses: actions/download-artifact@v4 + with: + name: wave-hindcast-data + path: ~/.cache/mhkit/wave-hindcast + + - name: Download Wind Hindcast data from artifact + uses: actions/download-artifact@v4 + with: + name: wind-hindcast-data + path: ~/.cache/mhkit/wind-hindcast + + - name: Consolidate hindcast data run: | - source activate TEST - python -m pip install --upgrade pip wheel - pip install coveralls - pip install . 
+ mkdir -p ~/.cache/mhkit/hindcast + mv ~/.cache/mhkit/wave-hindcast/hindcast/* ~/.cache/mhkit/hindcast/ + mv ~/.cache/mhkit/wind-hindcast/hindcast/* ~/.cache/mhkit/hindcast/ + shell: bash - - name: Run pytest + - name: Install MHKiT and run pytest shell: bash -l {0} run: | - source activate TEST - coverage run --rcfile=.github/workflows/.coveragehindcastrc -m pytest -c .github/workflows/pytest-hindcast.ini + coverage run --rcfile=.github/workflows/.coveragehindcastrc -m pytest -c .github/workflows/pytest-hindcast.ini + coverage lcov - name: Upload coverage data to coveralls.io - shell: bash -l {0} - run: | - source activate TEST - coveralls --service=github - env: - GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }} - COVERALLS_FLAG_NAME: ${{ matrix.python-version }} - COVERALLS_PARALLEL: true + uses: coverallsapp/github-action@master + with: + github-token: ${{ secrets.GITHUB_TOKEN }} + flag-name: ${{ matrix.python-version }} + parallel: true + path-to-lcov: ./coverage.lcov coveralls: name: Indicate completion to coveralls.io needs: [conda-build, pip-build, hindcast-calls] + if: | + always() && + needs.conda-build.result == 'success' && + needs.pip-build.result == 'success' && + (needs.hindcast-calls.result == 'success' || needs.hindcast-calls.result == 'skipped') runs-on: ubuntu-latest container: python:3-slim steps: diff --git a/.github/workflows/pylint.yml b/.github/workflows/pylint.yml new file mode 100644 index 000000000..08458f95d --- /dev/null +++ b/.github/workflows/pylint.yml @@ -0,0 +1,30 @@ +name: Pylint Loads + +on: [push, pull_request] + +jobs: + formatting-and-linting: + runs-on: ubuntu-latest + + steps: + - name: Check out code + uses: actions/checkout@v4 + + - name: Set up Python + uses: actions/setup-python@v2 + with: + python-version: '3.11' + + - name: Install dependencies + run: | + python -m pip install --upgrade pip wheel + pip install pylint + pip install . 
+ + - name: Run Pylint on mhkit/loads/ + run: | + pylint mhkit/loads/ + + - name: Run Pylint on mhkit/power/ + run: | + pylint mhkit/power/ diff --git a/.hscfg b/.hscfg index f6f00424b..f9aa99caa 100644 --- a/.hscfg +++ b/.hscfg @@ -1,4 +1,4 @@ hs_endpoint = https://developer.nrel.gov/api/hsds hs_username = hs_password = -hs_api_key = 3K3JQbjZmWctY0xmIfSYvYgtIcM3CN0cb1Y2w9bf +hs_api_key = jODGciIBnejrYd9GXxgXjbbAjMDLBMWQer05P98N diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml new file mode 100644 index 000000000..b0037417e --- /dev/null +++ b/.pre-commit-config.yaml @@ -0,0 +1,8 @@ +# To run Black formating every time you commit: +# pip install pre-commit +# pre-commit install +repos: + - repo: https://github.com/psf/black + rev: stable + hooks: + - id: black diff --git a/.pypirc b/.pypirc deleted file mode 100644 index be070c7e6..000000000 --- a/.pypirc +++ /dev/null @@ -1,7 +0,0 @@ -[distutils] -index-servers=pypi - -[pypi] -repository = https://upload.pypi.org/legacy/ -username = -password = \ No newline at end of file diff --git a/README.md b/README.md index d4d0833cf..15e9483a7 100644 --- a/README.md +++ b/README.md @@ -1,5 +1,4 @@ -![](figures/logo.png) MHKiT-Python -===================================== +# ![](logo.png) MHKiT-Python

@@ -16,37 +15,41 @@

-MHKiT-Python is a Python package designed for marine renewable energy applications to assist in -data processing and visualization. The software package include functionality for: +MHKiT-Python is a Python package designed for marine renewable energy applications to assist in +data processing and visualization. The software package includes functionality for: -* Data processing -* Data visualization -* Data quality control -* Resource assessment -* Device performance -* Device loads +- Data processing +- Data visualization +- Data quality control +- Resource assessment +- Device performance +- Device loads + +## Documentation -Documentation ------------------- MHKiT-Python documentation includes overview information, installation instructions, API documentation, and examples. See the [MHKiT documentation](https://mhkit-software.github.io/MHKiT) for more information. -Installation ------------------------- -MHKiT-Python requires Python (3.7, 3.8, or 3.9) along with several Python -package dependencies. MHKiT-Python can be installed from PyPI using the command ``pip install mhkit``. +## Installation + +MHKiT-Python requires Python (3.8, 3.9, 3.10, or 3.11) along with several Python +package dependencies. MHKiT-Python can be installed from PyPI using the command: + +`pip install mhkit` + See [installation instructions](https://mhkit-software.github.io/MHKiT/installation.html) for more information. -Copyright and license ------------------------- -MHKiT-Python is copyright through the National Renewable Energy Laboratory, -Pacific Northwest National Laboratory, and Sandia National Laboratories. +## Copyright and license + +MHKiT-Python is copyright through the National Renewable Energy Laboratory, +Pacific Northwest National Laboratory, and Sandia National Laboratories. The software is distributed under the Revised BSD License. See [copyright and license](LICENSE.md) for more information. 
-Issues ------------------------- +## Issues + The GitHub platform has the Issues feature that is used to track ideas, feedback, tasks, and/or bugs. To submit an Issue, follow the steps below. More information about GitHub Issues can be found [here](https://docs.github.com/en/issues/tracking-your-work-with-issues/about-issues) + 1. Navigate to the [MHKiT-Python main page](https://github.com/MHKiT-Software/MHKiT-Python) 2. 2.Under the repository name (upper left), click **Issues**. 3. Click **New Issue**. @@ -54,9 +57,10 @@ The GitHub platform has the Issues feature that is used to track ideas, feedback 5. Provide a **Title** and **description** for the issue. Be sure the title is relevant to the issue and that the description is clear and provided with sufficient detail. 6. When you're finished, click **Submit new issue**. The developers will follow-up once the issue is addressed. -Creating a fork ------------------------- +## Creating a fork + The GitHub platform has the Fork feature that facilitates code modification and contributions. A fork is a new repository that shares code and visibility settings with the original upstream repository. To fork MHKiT-Python, follow the steps below. More information about GitHub Forks can be found [here](https://docs.github.com/en/get-started/quickstart/fork-a-repo) + 1. Navigate to the [MHKiT-Python main page](https://github.com/MHKiT-Software/MHKiT-Python) 2. Under the repository name (upper left), click **Fork**. 3. Select an owner for the forked repository. @@ -65,25 +69,38 @@ The GitHub platform has the Fork feature that facilitates code modification and 6. Choose whether to copy only the default branch or all branches to the new fork. You will only need copy the default branch to contribute to MHKiT-Python. 7. When you're finished, click **Create fork**. You will now have a fork of the MHKiT-Python repository. 
-Creating a branch ------------------------- +## Creating a branch + The GitHub platform has the branch feature that facilitates code contributions and collaboration amongst developers. A branch isolates development work without affecting other branches in the repository. Each repository has one default branch, and can have multiple other branches. To create a branch of your forked MHKiT-Python repository, follow the steps below. More information about GitHub branches can be found [here](https://docs.github.com/en/pull-requests/collaborating-with-pull-requests/proposing-changes-to-your-work-with-pull-requests/about-branches) + 1. Navigate to your fork of MHKiT-Python (see instructions above) 2. Above the list of files, click **Branches**. -3. Click **New Branch**. +3. Click **New Branch**. 4. Enter a name for the branch. Be sure to select **MHKiT-Software/MHKiT-Python:master** as the source. 5. Click **Create branch**. You will now have a branch on your fork of MHKiT-Python that you can use to work with the code base. -Creating a pull request ------------------------- +## Creating a pull request + The GitHub platform has the pull request feature that allows you to propose changes to a repository such as MHKiT-Python. The pull request will allow the repository administrators to evaluate the pull request. To create a pull request for MHKiT-Python repository, follow the steps below. More information about GitHub pull requests can be found [here](https://docs.github.com/en/pull-requests/collaborating-with-pull-requests/proposing-changes-to-your-work-with-pull-requests/creating-a-pull-request) + 1. Navigate to the [MHKiT-Python main page](https://github.com/MHKiT-Software/MHKiT-Python) 2. Above the list of files, click **Pull request**. -3. On the compare page, click **Compare accross forks**. -4. In the "base branch" drop-down menu, select the branch of the upstream repository you'd like to merge changes into. +3. On the compare page, click **Compare across forks**. 
+4. In the "base branch" drop-down menu, select the branch of the upstream repository you'd like to merge changes into. 5. In the "head fork" drop-down menu, select your fork, then use the "compare branch" drop-down menu to select the branch you made your changes in. 6. Type a title and description for your pull request. 7. If you want to allow anyone with push access to the upstream repository to make changes to your pull request, select **Allow edits from maintainers**. 8. To create a pull request that is ready for review, click **Create Pull Request**. To create a draft pull request, use the drop-down and select **Create Draft Pull Request**, then click **Draft Pull Request**. More information about draft pull requests can be found [here](https://docs.github.com/en/pull-requests/collaborating-with-pull-requests/proposing-changes-to-your-work-with-pull-requests/about-pull-requests#draft-pull-requests) 9. MHKiT-Python adminstrators will review your pull request and contact you if needed. +## Code Formatting in MHKiT + +MHKiT adheres to the "black" code formatting standard to maintain a consistent and readable code style. Developers contributing to MHKiT have several options to ensure their code meets this standard: + +1. **Manual Formatting with Black**: Install the 'black' formatter and run it manually from the terminal to format your code. This can be done by executing a command like `black [file or directory]`. + +2. **IDE Extension**: If you are using an Integrated Development Environment (IDE) like Visual Studio Code (VS Code), you can install the 'black' formatter as an extension. This allows for automatic formatting of code within the IDE. + +3. **Pre-Commit Hook**: Enable the pre-commit hook in your development environment. This automatically formats your code with 'black' each time you make a commit, ensuring that all committed code conforms to the formatting standard. 
+ +For detailed instructions on installing and using 'black', please refer to the [Black Documentation](https://black.readthedocs.io/en/stable/). This resource provides comprehensive guidance on installation, usage, and configuration of the formatter. diff --git a/ci/install_python.ps1 b/ci/install_python.ps1 deleted file mode 100644 index b41eea5e5..000000000 --- a/ci/install_python.ps1 +++ /dev/null @@ -1,93 +0,0 @@ -# Sample script to install Python and pip under Windows -# Authors: Olivier Grisel, Jonathan Helmus and Kyle Kastner -# License: CC0 1.0 Universal: http://creativecommons.org/publicdomain/zero/1.0/ - -$MINICONDA_URL = "http://repo.continuum.io/miniconda/" -$BASE_URL = "https://www.python.org/ftp/python/" - - -function DownloadMiniconda ($python_version, $platform_suffix) { - $webclient = New-Object System.Net.WebClient - if ($python_version -eq "3.4") { - $filename = "Miniconda3-3.7.3-Windows-" + $platform_suffix + ".exe" - } else { - $filename = "Miniconda-3.7.3-Windows-" + $platform_suffix + ".exe" - } - $url = $MINICONDA_URL + $filename - - $basedir = $pwd.Path + "\" - $filepath = $basedir + $filename - if (Test-Path $filename) { - Write-Host "Reusing" $filepath - return $filepath - } - - # Download and retry up to 3 times in case of network transient errors. 
- Write-Host "Downloading" $filename "from" $url - $retry_attempts = 2 - for($i=0; $i -lt $retry_attempts; $i++){ - try { - $webclient.DownloadFile($url, $filepath) - break - } - Catch [Exception]{ - Start-Sleep 1 - } - } - if (Test-Path $filepath) { - Write-Host "File saved at" $filepath - } else { - # Retry once to get the error message if any at the last try - $webclient.DownloadFile($url, $filepath) - } - return $filepath -} - - -function InstallMiniconda ($python_version, $architecture, $python_home) { - Write-Host "Installing Python" $python_version "for" $architecture "bit architecture to" $python_home - if (Test-Path $python_home) { - Write-Host $python_home "already exists, skipping." - return $false - } - if ($architecture -eq "32") { - $platform_suffix = "x86" - } else { - $platform_suffix = "x86_64" - } - $filepath = DownloadMiniconda $python_version $platform_suffix - Write-Host "Installing" $filepath "to" $python_home - $install_log = $python_home + ".log" - $args = "/S /D=$python_home" - Write-Host $filepath $args - Start-Process -FilePath $filepath -ArgumentList $args -Wait -Passthru - if (Test-Path $python_home) { - Write-Host "Python $python_version ($architecture) installation complete" - } else { - Write-Host "Failed to install Python in $python_home" - Get-Content -Path $install_log - Exit 1 - } -} - - -function InstallMinicondaPip ($python_home) { - $pip_path = $python_home + "\Scripts\pip.exe" - $conda_path = $python_home + "\Scripts\conda.exe" - if (-not(Test-Path $pip_path)) { - Write-Host "Installing pip..." - $args = "install --yes pip" - Write-Host $conda_path $args - Start-Process -FilePath "$conda_path" -ArgumentList $args -Wait -Passthru - } else { - Write-Host "pip already installed." 
- } -} - - -function main () { - InstallMiniconda $env:PYTHON_VERSION $env:PYTHON_ARCH $env:PYTHON - InstallMinicondaPip $env:PYTHON -} - -main \ No newline at end of file diff --git a/ci/requirements-py36.yml b/ci/requirements-py36.yml deleted file mode 100644 index 9f58e5202..000000000 --- a/ci/requirements-py36.yml +++ /dev/null @@ -1,15 +0,0 @@ -name: test_env -channels: - - defaults - - conda-forge -dependencies: - - python=3.6 - - pandas - - numpy - - scipy - - matplotlib - - requests - - nose - - NREL-rex - - pip: - - coveralls diff --git a/ci/requirements-py37.yml b/ci/requirements-py37.yml deleted file mode 100644 index 28efef533..000000000 --- a/ci/requirements-py37.yml +++ /dev/null @@ -1,15 +0,0 @@ -name: test_env -channels: - - defaults - - conda-forge -dependencies: - - python=3.7 - - pandas - - numpy - - scipy - - matplotlib - - requests - - nose - - NREL-rex - - pip: - - coveralls diff --git a/environment.yml b/environment.yml new file mode 100644 index 000000000..92b603f09 --- /dev/null +++ b/environment.yml @@ -0,0 +1,25 @@ +name: myenv +channels: + - conda-forge + - defaults +dependencies: + - python>=3.8 + - pandas>=1.0.0 + - numpy>=1.21.0 + - scipy + - matplotlib + - requests + - lxml + - scikit-learn + - statsmodels + - bottleneck + - beautifulsoup4 + - xarray + - h5py>=3.6.0 + - netcdf4>=1.5.8 + - pip: + - pecos>=0.3.0 + - fatpack + - NREL-rex>=0.2.63 + - h5pyd>=0.7.0 + - six>=1.13.0 diff --git a/examples/ADCP_Delft3D_TRTS_example.ipynb b/examples/ADCP_Delft3D_TRTS_example.ipynb index 142ebc068..4b3655ce6 100644 --- a/examples/ADCP_Delft3D_TRTS_example.ipynb +++ b/examples/ADCP_Delft3D_TRTS_example.ipynb @@ -30,13 +30,14 @@ "import matplotlib\n", "import scipy.io\n", "import netCDF4\n", - "import math \n", + "import math\n", "import utm\n", + "\n", "# MHKiT Imports\n", "from mhkit.dolfyn.rotate import api as ap\n", "from mhkit.dolfyn.adp import api\n", "from mhkit import dolfyn as dlfn\n", - "from mhkit.river.io import d3d \n", + "from 
mhkit.river.io import d3d\n", "from mhkit import river" ] }, @@ -705,10 +706,14 @@ ], "source": [ "# Read in the two transect passes\n", - "transect_1_raw = api.read('data/river/ADCP_transect/tanana_transects_08_10_10_0_002_10-08-10_142214.PD0') \n", - "transect_2_raw = api.read('data/river/ADCP_transect/tanana_transects_08_10_10_0_003_10-08-10_143335.PD0')\n", + "transect_1_raw = api.read(\n", + " \"data/river/ADCP_transect/tanana_transects_08_10_10_0_002_10-08-10_142214.PD0\"\n", + ")\n", + "transect_2_raw = api.read(\n", + " \"data/river/ADCP_transect/tanana_transects_08_10_10_0_003_10-08-10_143335.PD0\"\n", + ")\n", "# Create one dataset from the two passes\n", - "transect_1_2= xr.merge([transect_1_raw, transect_2_raw])\n", + "transect_1_2 = xr.merge([transect_1_raw, transect_2_raw])\n", "# Print the xarray data\n", "transect_1_2" ] @@ -731,15 +736,11 @@ "outputs": [], "source": [ "# Convert Coordiantes to UTM using utm module\n", - "utm_x_y = utm.from_latlon(\n", - " transect_1_2.latitude_gps, \n", - " transect_1_2.longitude_gps, \n", - " 6,'W'\n", - " ) \n", - "\n", - "# Create a DataFrame from the points \n", - "gps = [[x, y] for x, y in zip(utm_x_y[0], utm_x_y[1])] \n", - "gps_points = pd.DataFrame(np.array(gps), columns= ['utm_x','utm_y'])" + "utm_x_y = utm.from_latlon(transect_1_2.latitude_gps, transect_1_2.longitude_gps, 6, \"W\")\n", + "\n", + "# Create a DataFrame from the points\n", + "gps = [[x, y] for x, y in zip(utm_x_y[0], utm_x_y[1])]\n", + "gps_points = pd.DataFrame(np.array(gps), columns=[\"utm_x\", \"utm_y\"])" ] }, { @@ -760,7 +761,7 @@ "source": [ "# Nenana Alaska is 15.7 deg East\n", "angle = 15.7\n", - "ap.set_declination(transect_1_2, angle, inplace=True) " + "ap.set_declination(transect_1_2, angle, inplace=True)" ] }, { @@ -780,8 +781,8 @@ "metadata": {}, "outputs": [], "source": [ - "# Rotate to 'earth' coordinate system \n", - "api.rotate2(transect_1_2, 'earth', inplace=True)" + "# Rotate to 'earth' coordinate system\n", + 
"api.rotate2(transect_1_2, \"earth\", inplace=True)" ] }, { @@ -831,48 +832,55 @@ } ], "source": [ - "\n", "# Linear regression using first order polyfit\n", - "a,b = np.polyfit(gps_points.utm_x, gps_points.utm_y,1)\n", + "a, b = np.polyfit(gps_points.utm_x, gps_points.utm_y, 1)\n", "\n", "# Generate a DataFrame of points from the linear regression\n", - "ideal= [ [x, y] for x, y in zip(gps_points.utm_x, a*gps_points.utm_x+b)] \n", - "ideal_points = pd.DataFrame(np.array(ideal), columns= ['utm_x','utm_y'])\n", + "ideal = [[x, y] for x, y in zip(gps_points.utm_x, a * gps_points.utm_x + b)]\n", + "ideal_points = pd.DataFrame(np.array(ideal), columns=[\"utm_x\", \"utm_y\"])\n", "\n", "# Repeat UTM corrdinates to match the ADCP points matrix (dir, range, time)\n", "utm_x_points = np.tile(gps_points.utm_x, np.size(transect_1_2.range))\n", - "utm_y_points = np.tile(a*gps_points.utm_x+b, np.size(transect_1_2.range))\n", - "depth_points = np.repeat( transect_1_2.range, np.size(gps_points.utm_x))\n", + "utm_y_points = np.tile(a * gps_points.utm_x + b, np.size(transect_1_2.range))\n", + "depth_points = np.repeat(transect_1_2.range, np.size(gps_points.utm_x))\n", "\n", - "ADCP_ideal_points={\n", - " 'utm_x': utm_x_points, \n", - " 'utm_y': utm_y_points, \n", - " 'waterdepth': depth_points\n", - " }\n", - "ADCP_ideal_points=pd.DataFrame(ADCP_ideal_points)\n", + "ADCP_ideal_points = {\n", + " \"utm_x\": utm_x_points,\n", + " \"utm_y\": utm_y_points,\n", + " \"waterdepth\": depth_points,\n", + "}\n", + "ADCP_ideal_points = pd.DataFrame(ADCP_ideal_points)\n", "\n", "# Initialize the figure\n", - "figure(figsize=(8,6))\n", + "figure(figsize=(8, 6))\n", "fig, ax = plt.subplots()\n", "\n", "# Get data from the original transect in UTM for comparison\n", - "transect_1 = utm.from_latlon(transect_1_raw.latitude_gps, transect_1_raw.longitude_gps, 6, 'W') \n", - "transect_2 = utm.from_latlon(transect_2_raw.latitude_gps, transect_2_raw.longitude_gps, 6, 'W') \n", + "transect_1 = 
utm.from_latlon(\n", + " transect_1_raw.latitude_gps, transect_1_raw.longitude_gps, 6, \"W\"\n", + ")\n", + "transect_2 = utm.from_latlon(\n", + " transect_2_raw.latitude_gps, transect_2_raw.longitude_gps, 6, \"W\"\n", + ")\n", "\n", "# Plot the original transect data for comparison\n", - "plt.plot(transect_1[0],transect_1[1], 'b', label= 'GPS Transect 1' )\n", - "plt.plot(transect_2[0],transect_2[1], 'r--', label= 'GPS Transect 2')\n", + "plt.plot(transect_1[0], transect_1[1], \"b\", label=\"GPS Transect 1\")\n", + "plt.plot(transect_2[0], transect_2[1], \"r--\", label=\"GPS Transect 2\")\n", "\n", "# Plot the Idealized Transect\n", - "plt.plot(ADCP_ideal_points.utm_x, ADCP_ideal_points.utm_y, 'k-.', label='Ideal Transect')\n", - "plt.ticklabel_format(style= 'scientific',useOffset=False)\n", - "ax.get_xaxis().set_major_formatter(matplotlib.ticker.FuncFormatter(lambda x, p: format(int(x), ',')))\n", + "plt.plot(\n", + " ADCP_ideal_points.utm_x, ADCP_ideal_points.utm_y, \"k-.\", label=\"Ideal Transect\"\n", + ")\n", + "plt.ticklabel_format(style=\"scientific\", useOffset=False)\n", + "ax.get_xaxis().set_major_formatter(\n", + " matplotlib.ticker.FuncFormatter(lambda x, p: format(int(x), \",\"))\n", + ")\n", "plt.xticks(rotation=45)\n", "\n", "# Plot Settings\n", "plt.legend()\n", - "plt.xlabel('$UTM_x (m)$')\n", - "plt.ylabel('$UTM_y (m)$')" + "plt.xlabel(\"$UTM_x (m)$\")\n", + "plt.ylabel(\"$UTM_y (m)$\")" ] }, { @@ -893,7 +901,7 @@ "outputs": [], "source": [ "# Adjust the range offset, included here for reference\n", - "offset=0\n", + "offset = 0\n", "api.clean.set_range_offset(transect_1_2, offset)" ] }, @@ -937,11 +945,11 @@ ], "source": [ "# Apply the correlation filter\n", - "min_correlation=40\n", + "min_correlation = 40\n", "transect_1_2 = api.clean.correlation_filter(transect_1_2, thresh=min_correlation)\n", "\n", "# Plot the results the (data is displayed upside-down)\n", - "transect_1_2.corr.sel(beam=1).plot() " + "transect_1_2.corr.sel(beam=1).plot()" ] 
}, { @@ -969,23 +977,25 @@ ], "source": [ "# Filtering out depth sounder values above the river surface\n", - "depth_sounder = transect_1_2.where(transect_1_2.dist_bt > 0 )\n", + "depth_sounder = transect_1_2.where(transect_1_2.dist_bt > 0)\n", "\n", "# Of the 4 values beams get the shallowest depth value at each location\n", "bottom = np.min(depth_sounder.dist_bt, axis=0)\n", "\n", - "# River bottom for ideal transect \n", - "bottom_avg = interp.griddata(gps_points, bottom, ideal_points, method='linear')\n", + "# River bottom for ideal transect\n", + "bottom_avg = interp.griddata(gps_points, bottom, ideal_points, method=\"linear\")\n", "\n", "# Create a matrix of depths\n", - "bottom_filter = d3d.create_points(x=bottom_avg, y=transect_1_2.range.to_numpy(), waterdepth=1)\n", + "bottom_filter = d3d.create_points(\n", + " x=bottom_avg, y=transect_1_2.range.to_numpy(), waterdepth=1\n", + ")\n", "\n", - "# Creating a mask matrix with ones in the area of the river cross section and nan's outside \n", + "# Creating a mask matrix with ones in the area of the river cross section and nan's outside\n", "river_bottom_filter = []\n", - "for index, row in bottom_filter.iterrows():\n", - " if row['x'] > row['y']: \n", - " filter = 1 \n", - " else: \n", + "for index, row in bottom_filter.iterrows():\n", + " if row[\"x\"] > row[\"y\"]:\n", + " filter = 1\n", + " else:\n", " filter = float(\"nan\")\n", " river_bottom_filter = np.append(river_bottom_filter, filter)" ] @@ -1177,33 +1187,26 @@ ], "source": [ "# Tiling the GPS data for each depth bin\n", - "gps_utm_x = np.tile(\n", - " gps_points.utm_x, \n", - " np.size(transect_1_2.range)\n", - " )\n", - "gps_utm_y = np.tile(\n", - " gps_points.utm_y, \n", - " np.size(transect_1_2.range)\n", - " )\n", + "gps_utm_x = np.tile(gps_points.utm_x, np.size(transect_1_2.range))\n", + "gps_utm_y = np.tile(gps_points.utm_y, np.size(transect_1_2.range))\n", "\n", "# Repeating the depth bins for each GPS point\n", - "depth = np.repeat( \n", - " 
transect_1_2.range, \n", - " np.size(gps_points.utm_x)\n", - " )\n", + "depth = np.repeat(transect_1_2.range, np.size(gps_points.utm_x))\n", "\n", "# Create Dataframe from the calculated points\n", - "ADCP_points = pd.DataFrame({\n", - " 'utm_x': gps_utm_x, \n", - " 'utm_y': gps_utm_y, \n", - " 'waterdepth': depth\n", - " })\n", - "\n", - "# Raveling the veocity data to correspond with 'ADCP_points' and filtering out velocity data bellow the river bottom \n", - "ADCP_points['east_velocity']= np.ravel(transect_1_2.vel[0, :,:]) * river_bottom_filter\n", - "ADCP_points['north_velocity']= np.ravel(transect_1_2.vel[1, :,:]) * river_bottom_filter\n", - "ADCP_points['vertical_velocity']= np.ravel(transect_1_2.vel[2, :,:])* river_bottom_filter\n", - "ADCP_points= ADCP_points.dropna()\n", + "ADCP_points = pd.DataFrame(\n", + " {\"utm_x\": gps_utm_x, \"utm_y\": gps_utm_y, \"waterdepth\": depth}\n", + ")\n", + "\n", + "# Raveling the veocity data to correspond with 'ADCP_points' and filtering out velocity data bellow the river bottom\n", + "ADCP_points[\"east_velocity\"] = np.ravel(transect_1_2.vel[0, :, :]) * river_bottom_filter\n", + "ADCP_points[\"north_velocity\"] = (\n", + " np.ravel(transect_1_2.vel[1, :, :]) * river_bottom_filter\n", + ")\n", + "ADCP_points[\"vertical_velocity\"] = (\n", + " np.ravel(transect_1_2.vel[2, :, :]) * river_bottom_filter\n", + ")\n", + "ADCP_points = ADCP_points.dropna()\n", "\n", "# Show points\n", "ADCP_points" @@ -1226,29 +1229,33 @@ "metadata": {}, "outputs": [], "source": [ - "# Project velocity onto ideal tansect \n", - "ADCP_ideal= pd.DataFrame()\n", - "ADCP_ideal['east_velocity'] = interp.griddata(\n", - " ADCP_points[['utm_x','utm_y','waterdepth']],\n", - " ADCP_points['east_velocity'],\n", - " ADCP_ideal_points[['utm_x','utm_y','waterdepth']],\n", - " method='linear'\n", - " )\n", - "ADCP_ideal['north_velocity'] = interp.griddata(\n", - " ADCP_points[['utm_x','utm_y','waterdepth']],\n", - " ADCP_points['north_velocity'],\n", - " 
ADCP_ideal_points[['utm_x','utm_y','waterdepth']],\n", - " method='linear'\n", - " )\n", - "ADCP_ideal['vertical_velocity'] = interp.griddata(\n", - " ADCP_points[['utm_x','utm_y','waterdepth']],\n", - " ADCP_points['vertical_velocity'],\n", - " ADCP_ideal_points[['utm_x','utm_y','waterdepth']],\n", - " method='linear'\n", - " )\n", + "# Project velocity onto ideal tansect\n", + "ADCP_ideal = pd.DataFrame()\n", + "ADCP_ideal[\"east_velocity\"] = interp.griddata(\n", + " ADCP_points[[\"utm_x\", \"utm_y\", \"waterdepth\"]],\n", + " ADCP_points[\"east_velocity\"],\n", + " ADCP_ideal_points[[\"utm_x\", \"utm_y\", \"waterdepth\"]],\n", + " method=\"linear\",\n", + ")\n", + "ADCP_ideal[\"north_velocity\"] = interp.griddata(\n", + " ADCP_points[[\"utm_x\", \"utm_y\", \"waterdepth\"]],\n", + " ADCP_points[\"north_velocity\"],\n", + " ADCP_ideal_points[[\"utm_x\", \"utm_y\", \"waterdepth\"]],\n", + " method=\"linear\",\n", + ")\n", + "ADCP_ideal[\"vertical_velocity\"] = interp.griddata(\n", + " ADCP_points[[\"utm_x\", \"utm_y\", \"waterdepth\"]],\n", + " ADCP_points[\"vertical_velocity\"],\n", + " ADCP_ideal_points[[\"utm_x\", \"utm_y\", \"waterdepth\"]],\n", + " method=\"linear\",\n", + ")\n", "\n", "# Calculate the magnitude of the velocity components\n", - "ADCP_ideal['magnitude']= np.sqrt(ADCP_ideal.east_velocity**2+ADCP_ideal.north_velocity**2+ADCP_ideal.vertical_velocity**2)" + "ADCP_ideal[\"magnitude\"] = np.sqrt(\n", + " ADCP_ideal.east_velocity**2\n", + " + ADCP_ideal.north_velocity**2\n", + " + ADCP_ideal.vertical_velocity**2\n", + ")" ] }, { @@ -1298,29 +1305,31 @@ ], "source": [ "# Set the contour color bar bounds\n", - "min_plot=0\n", - "max_plot=3\n", + "min_plot = 0\n", + "max_plot = 3\n", "\n", - "# The Contour of velocity magnitude from the ADCP transect data \n", - "fig,ax = plt.subplots(figsize=(10,4.4))\n", + "# The Contour of velocity magnitude from the ADCP transect data\n", + "fig, ax = plt.subplots(figsize=(10, 4.4))\n", "\n", "contour_plot = 
plt.tripcolor(\n", - " ADCP_ideal_points.utm_x, \n", - " -ADCP_ideal_points.waterdepth, \n", - " ADCP_ideal.magnitude*river_bottom_filter,\n", + " ADCP_ideal_points.utm_x,\n", + " -ADCP_ideal_points.waterdepth,\n", + " ADCP_ideal.magnitude * river_bottom_filter,\n", " vmin=min_plot,\n", - " vmax=max_plot\n", + " vmax=max_plot,\n", ")\n", "\n", - "plt.xlabel('$UTM_x (m)$')\n", - "plt.ylabel('Water Depth (m)')\n", - "cbar= plt.colorbar(contour_plot)\n", - "cbar.set_label('velocity [m/s]')\n", - "plt.ylim([-8.5,-1])\n", - "plt.xlim([400950,401090])\n", - "plt.plot(ideal_points.utm_x,-bottom_avg,'k', label= 'river bottom')\n", - "plt.legend(loc= 7)\n", - "ax.get_xaxis().set_major_formatter(matplotlib.ticker.FuncFormatter(lambda x, p: format(int(x), ',')))\n", + "plt.xlabel(\"$UTM_x (m)$\")\n", + "plt.ylabel(\"Water Depth (m)\")\n", + "cbar = plt.colorbar(contour_plot)\n", + "cbar.set_label(\"velocity [m/s]\")\n", + "plt.ylim([-8.5, -1])\n", + "plt.xlim([400950, 401090])\n", + "plt.plot(ideal_points.utm_x, -bottom_avg, \"k\", label=\"river bottom\")\n", + "plt.legend(loc=7)\n", + "ax.get_xaxis().set_major_formatter(\n", + " matplotlib.ticker.FuncFormatter(lambda x, p: format(int(x), \",\"))\n", + ")\n", "plt.xticks(rotation=45)" ] }, @@ -1363,38 +1372,39 @@ ], "source": [ "# Interpolate points by getting min & max first\n", - "start_utmx = min(ADCP_ideal_points.utm_x)\n", + "start_utmx = min(ADCP_ideal_points.utm_x)\n", "start_utmy = min(ADCP_ideal_points.utm_y)\n", "\n", "end_utmx = max(ADCP_ideal_points.utm_x)\n", "end_utmy = min(ADCP_ideal_points.utm_y)\n", "\n", "# Using N points for x calculate the y values on an ideal transect from the linear regression used earlier\n", - "N=10\n", + "N = 10\n", "utm_x_ideal_downsampeled = np.linspace(start_utmx, end_utmx, N)\n", - "utm_y_ideal_downsampeled = (a*utm_x_ideal_downsampeled) + b\n", - "\n", + "utm_y_ideal_downsampeled = (a * utm_x_ideal_downsampeled) + b\n", "\n", "\n", "# Plot the Idealized Transect for 
comparison\n", "plt.plot(\n", - " ADCP_ideal_points.utm_x, \n", - " ADCP_ideal_points.utm_y, \n", - " '.', ms=1, label='Ideal Transect'\n", - " )\n", + " ADCP_ideal_points.utm_x, ADCP_ideal_points.utm_y, \".\", ms=1, label=\"Ideal Transect\"\n", + ")\n", "\n", "# Plot the downsampled transect\n", "plt.plot(\n", - " utm_x_ideal_downsampeled, \n", - " utm_y_ideal_downsampeled, \n", - " 'ro', label='Down Sampled Ideal Transect')\n", + " utm_x_ideal_downsampeled,\n", + " utm_y_ideal_downsampeled,\n", + " \"ro\",\n", + " label=\"Down Sampled Ideal Transect\",\n", + ")\n", "\n", "\n", "# Plot settings\n", - "ax.get_xaxis().set_major_formatter(matplotlib.ticker.FuncFormatter(lambda x, p: format(int(x), ',')))\n", + "ax.get_xaxis().set_major_formatter(\n", + " matplotlib.ticker.FuncFormatter(lambda x, p: format(int(x), \",\"))\n", + ")\n", "plt.xticks(rotation=45)\n", - "plt.xlabel('$UTM_x$')\n", - "plt.ylabel('$UTM_y$')\n", + "plt.xlabel(\"$UTM_x$\")\n", + "plt.ylabel(\"$UTM_y$\")\n", "plt.legend()" ] }, @@ -1435,52 +1445,46 @@ ], "source": [ "# Create an idealized depth N layers deep\n", - "N_layers=12\n", + "N_layers = 12\n", "downsampled_depth = np.linspace(\n", - " transect_1_2.range.min(), \n", - " np.nanmax(bottom_avg), \n", - " N_layers\n", - " )\n", + " transect_1_2.range.min(), np.nanmax(bottom_avg), N_layers\n", + ")\n", "\n", - "# Repeat this over the N points of the DownSampled Ideal Transect above \n", - "depth_ideal_points_downsampled = np.repeat(\n", - " downsampled_depth,\n", - " N\n", - " )\n", + "# Repeat this over the N points of the DownSampled Ideal Transect above\n", + "depth_ideal_points_downsampled = np.repeat(downsampled_depth, N)\n", "\n", "# Tile the x, y over the N of layers to add to a DataFrame\n", - "utm_x_ideal_points_downsampled= np.tile(\n", - " utm_x_ideal_downsampeled, \n", - " N_layers\n", - " )\n", - "utm_y_ideal_points_downsampled= np.tile(\n", - " utm_y_ideal_downsampeled, \n", - " N_layers\n", - " )\n", + 
"utm_x_ideal_points_downsampled = np.tile(utm_x_ideal_downsampeled, N_layers)\n", + "utm_y_ideal_points_downsampled = np.tile(utm_y_ideal_downsampeled, N_layers)\n", "\n", "# Create a Dataframe of our idealized x,y,depth points\n", - "ADCP_ideal_points_downsamples=pd.DataFrame({\n", - " 'utm_x': utm_x_ideal_points_downsampled, \n", - " 'utm_y': utm_y_ideal_points_downsampled,\n", - " 'waterdepth': depth_ideal_points_downsampled\n", - " })\n", + "ADCP_ideal_points_downsamples = pd.DataFrame(\n", + " {\n", + " \"utm_x\": utm_x_ideal_points_downsampled,\n", + " \"utm_y\": utm_y_ideal_points_downsampled,\n", + " \"waterdepth\": depth_ideal_points_downsampled,\n", + " }\n", + ")\n", "\n", "# Plot the Down sampled data points at the x locations\n", - "fig,ax = plt.subplots(figsize=(10,4.4))\n", - "plt.plot(ADCP_ideal_points_downsamples.utm_x, \n", - " ADCP_ideal_points_downsamples.waterdepth * -1, \n", - " 'ro', \n", - " )\n", + "fig, ax = plt.subplots(figsize=(10, 4.4))\n", + "plt.plot(\n", + " ADCP_ideal_points_downsamples.utm_x,\n", + " ADCP_ideal_points_downsamples.waterdepth * -1,\n", + " \"ro\",\n", + ")\n", "\n", "# Plot the ADCP river bed\n", - "plt.plot(ideal_points.utm_x,-bottom_avg,'k', label= 'river bottom')\n", + "plt.plot(ideal_points.utm_x, -bottom_avg, \"k\", label=\"river bottom\")\n", "\n", "# Plot settings\n", - "ax.get_xaxis().set_major_formatter(matplotlib.ticker.FuncFormatter(lambda x, p: format(int(x), ',')))\n", + "ax.get_xaxis().set_major_formatter(\n", + " matplotlib.ticker.FuncFormatter(lambda x, p: format(int(x), \",\"))\n", + ")\n", "plt.xticks(rotation=45)\n", - "plt.title('DownSampled Ideal Transect Depth')\n", - "plt.xlabel('$UTM_x [m]$')\n", - "plt.ylabel('$ Depth [m]$')" + "plt.title(\"DownSampled Ideal Transect Depth\")\n", + "plt.xlabel(\"$UTM_x [m]$\")\n", + "plt.ylabel(\"$ Depth [m]$\")" ] }, { @@ -1632,27 +1636,31 @@ } ], "source": [ - "# Project velocity onto ideal tansect \n", - "ADCP_ideal_downsamples= pd.DataFrame()\n", - 
"ADCP_ideal_downsamples['east_velocity']= interp.griddata(\n", - " ADCP_points[['utm_x','utm_y','waterdepth']],\n", - " ADCP_points['east_velocity'],\n", - " ADCP_ideal_points_downsamples[['utm_x','utm_y','waterdepth']],\n", - " method='linear'\n", - " )\n", - "ADCP_ideal_downsamples['north_velocity']= interp.griddata(\n", - " ADCP_points[['utm_x','utm_y','waterdepth']],\n", - " ADCP_points['north_velocity'],\n", - " ADCP_ideal_points_downsamples[['utm_x','utm_y','waterdepth']],\n", - " method='linear'\n", + "# Project velocity onto ideal tansect\n", + "ADCP_ideal_downsamples = pd.DataFrame()\n", + "ADCP_ideal_downsamples[\"east_velocity\"] = interp.griddata(\n", + " ADCP_points[[\"utm_x\", \"utm_y\", \"waterdepth\"]],\n", + " ADCP_points[\"east_velocity\"],\n", + " ADCP_ideal_points_downsamples[[\"utm_x\", \"utm_y\", \"waterdepth\"]],\n", + " method=\"linear\",\n", + ")\n", + "ADCP_ideal_downsamples[\"north_velocity\"] = interp.griddata(\n", + " ADCP_points[[\"utm_x\", \"utm_y\", \"waterdepth\"]],\n", + " ADCP_points[\"north_velocity\"],\n", + " ADCP_ideal_points_downsamples[[\"utm_x\", \"utm_y\", \"waterdepth\"]],\n", + " method=\"linear\",\n", + ")\n", + "ADCP_ideal_downsamples[\"vertical_velocity\"] = interp.griddata(\n", + " ADCP_points[[\"utm_x\", \"utm_y\", \"waterdepth\"]],\n", + " ADCP_points[\"vertical_velocity\"],\n", + " ADCP_ideal_points_downsamples[[\"utm_x\", \"utm_y\", \"waterdepth\"]],\n", + " method=\"linear\",\n", + ")\n", + "ADCP_ideal_downsamples[\"magnitude\"] = np.sqrt(\n", + " ADCP_ideal_downsamples.east_velocity**2\n", + " + ADCP_ideal_downsamples.north_velocity**2\n", + " + ADCP_ideal_downsamples.vertical_velocity**2\n", ")\n", - "ADCP_ideal_downsamples['vertical_velocity']= interp.griddata(\n", - " ADCP_points[['utm_x','utm_y','waterdepth']],\n", - " ADCP_points['vertical_velocity'],\n", - " ADCP_ideal_points_downsamples[['utm_x','utm_y','waterdepth']],\n", - " method='linear'\n", - " )\n", - "ADCP_ideal_downsamples['magnitude']= 
np.sqrt(ADCP_ideal_downsamples.east_velocity**2+ADCP_ideal_downsamples.north_velocity**2+ADCP_ideal_downsamples.vertical_velocity**2)\n", "ADCP_ideal_downsamples" ] }, @@ -1682,23 +1690,31 @@ ], "source": [ "# Create a DataFrame of downsampled points\n", - "ideal_downsampeled= [ [x, y] for x, y in zip(utm_x_ideal_downsampeled, utm_y_ideal_downsampeled)] \n", - "ideal_points_downsampled = pd.DataFrame(np.array(ideal_downsampeled), columns= ['utm_x','utm_y'])\n", + "ideal_downsampeled = [\n", + " [x, y] for x, y in zip(utm_x_ideal_downsampeled, utm_y_ideal_downsampeled)\n", + "]\n", + "ideal_points_downsampled = pd.DataFrame(\n", + " np.array(ideal_downsampeled), columns=[\"utm_x\", \"utm_y\"]\n", + ")\n", "\n", - "# River bottom for downsampled ideal transect \n", - "bottom_avg_downsampled= interp.griddata(gps_points, bottom, ideal_points_downsampled, method='linear')\n", + "# River bottom for downsampled ideal transect\n", + "bottom_avg_downsampled = interp.griddata(\n", + " gps_points, bottom, ideal_points_downsampled, method=\"linear\"\n", + ")\n", "\n", "# Create a matrix of depths\n", - "bottom_filter_downsampled = d3d.create_points(x=bottom_avg_downsampled, y=downsampled_depth, waterdepth=1)\n", - "\n", - "# Creating a mask matrix with ones in the area of the river cross section and nan's outside \n", - "river_bottom_filter_downsampled= []\n", - "for index, row in bottom_filter_downsampled.iterrows():\n", - " if row['x'] > row['y']: \n", - " filter= 1 \n", - " else: \n", - " filter= float(\"nan\")\n", - " river_bottom_filter_downsampled= np.append(river_bottom_filter_downsampled, filter)" + "bottom_filter_downsampled = d3d.create_points(\n", + " x=bottom_avg_downsampled, y=downsampled_depth, waterdepth=1\n", + ")\n", + "\n", + "# Creating a mask matrix with ones in the area of the river cross section and nan's outside\n", + "river_bottom_filter_downsampled = []\n", + "for index, row in bottom_filter_downsampled.iterrows():\n", + " if row[\"x\"] > 
row[\"y\"]:\n", + " filter = 1\n", + " else:\n", + " filter = float(\"nan\")\n", + " river_bottom_filter_downsampled = np.append(river_bottom_filter_downsampled, filter)" ] }, { @@ -1747,28 +1763,30 @@ } ], "source": [ - "# Plotting \n", - "fig,ax = plt.subplots(figsize=(10,4.4))\n", + "# Plotting\n", + "fig, ax = plt.subplots(figsize=(10, 4.4))\n", "contour_plot = plt.tripcolor(\n", - " ADCP_ideal_points_downsamples.utm_x, \n", - " -ADCP_ideal_points_downsamples.waterdepth, \n", - " ADCP_ideal_downsamples.magnitude*river_bottom_filter_downsampled,\n", + " ADCP_ideal_points_downsamples.utm_x,\n", + " -ADCP_ideal_points_downsamples.waterdepth,\n", + " ADCP_ideal_downsamples.magnitude * river_bottom_filter_downsampled,\n", " vmin=min_plot,\n", - " vmax=max_plot\n", - " )\n", + " vmax=max_plot,\n", + ")\n", "\n", "# Plot river bottom for comparison\n", - "plt.plot(ideal_points.utm_x,-bottom_avg,'k', label= 'river bottom')\n", + "plt.plot(ideal_points.utm_x, -bottom_avg, \"k\", label=\"river bottom\")\n", "\n", "# Plot Settings\n", - "plt.xlabel('$UTM_x$ (m)')\n", - "plt.ylabel('Water Depth (m)')\n", - "cbar= plt.colorbar(contour_plot)\n", - "cbar.set_label('Velocity [m/s]')\n", - "plt.ylim([-8.5,-1])\n", - "plt.xlim([400950,401090])\n", - "plt.legend(loc= 7)\n", - "ax.get_xaxis().set_major_formatter(matplotlib.ticker.FuncFormatter(lambda x, p: format(int(x), ',')))\n", + "plt.xlabel(\"$UTM_x$ (m)\")\n", + "plt.ylabel(\"Water Depth (m)\")\n", + "cbar = plt.colorbar(contour_plot)\n", + "cbar.set_label(\"Velocity [m/s]\")\n", + "plt.ylim([-8.5, -1])\n", + "plt.xlim([400950, 401090])\n", + "plt.legend(loc=7)\n", + "ax.get_xaxis().set_major_formatter(\n", + " matplotlib.ticker.FuncFormatter(lambda x, p: format(int(x), \",\"))\n", + ")\n", "plt.xticks(rotation=45)" ] }, @@ -1842,33 +1860,33 @@ "# Use the requests method to obtain 1 day of instantneous gage height data\n", "water_level_USGS_data = river.io.usgs.request_usgs_data(\n", " station=\"15515500\",\n", - " 
parameter='00065',\n", - " start_date='2010-08-10',\n", - " end_date='2010-08-10',\n", - " data_type='Instantaneous'\n", - " )\n", + " parameter=\"00065\",\n", + " start_date=\"2010-08-10\",\n", + " end_date=\"2010-08-10\",\n", + " data_type=\"Instantaneous\",\n", + ")\n", "\n", "# Plot data\n", "water_level_USGS_data.plot()\n", "\n", "# Plot Settings\n", - "plt.xlabel('Time')\n", - "plt.ylabel('Gage Height (feet)')\n", + "plt.xlabel(\"Time\")\n", + "plt.ylabel(\"Gage Height (feet)\")\n", "\n", "# Use the requests method to obtain 1 day of instantneous discharge data\n", "discharge_USGS_data = river.io.usgs.request_usgs_data(\n", " station=\"15515500\",\n", - " parameter='00060',\n", - " start_date='2010-08-10',\n", - " end_date='2010-08-10',\n", - " data_type='Instantaneous'\n", - " )\n", + " parameter=\"00060\",\n", + " start_date=\"2010-08-10\",\n", + " end_date=\"2010-08-10\",\n", + " data_type=\"Instantaneous\",\n", + ")\n", "\n", "# Print data\n", "discharge_USGS_data.plot()\n", "# Plot Settings\n", - "plt.xlabel('Time')\n", - "plt.ylabel('Dischage ($f^3/s$)')" + "plt.xlabel(\"Time\")\n", + "plt.ylabel(\"Dischage ($f^3/s$)\")" ] }, { @@ -1888,10 +1906,12 @@ "outputs": [], "source": [ "# Import the simulated data\n", - "d3d_data = netCDF4.Dataset('data/river/ADCP_transect/tanana81010_final_map.nc')\n", + "d3d_data = netCDF4.Dataset(\"data/river/ADCP_transect/tanana81010_final_map.nc\")\n", "\n", "# Get the ADCP sample points\n", - "ADCP_ideal_points_downsamples_xy = ADCP_ideal_points_downsamples.rename(columns={\"utm_x\": \"x\", \"utm_y\": \"y\"})" + "ADCP_ideal_points_downsamples_xy = ADCP_ideal_points_downsamples.rename(\n", + " columns={\"utm_x\": \"x\", \"utm_y\": \"y\"}\n", + ")" ] }, { @@ -1919,11 +1939,13 @@ ], "source": [ "# Interpolate the Delft3D simulated data onto the the sample points\n", - "variables= ['ucy', 'ucx', 'ucz']\n", - "D3D= d3d.variable_interpolation(d3d_data, variables, points= ADCP_ideal_points_downsamples_xy)\n", + "variables = 
[\"ucy\", \"ucx\", \"ucz\"]\n", + "D3D = d3d.variable_interpolation(\n", + " d3d_data, variables, points=ADCP_ideal_points_downsamples_xy\n", + ")\n", "\n", "# Calculate the magnitude of the velocity\n", - "D3D['magnitude'] = np.sqrt(D3D.ucy**2 + D3D.ucx**2 + D3D.ucz**2)" + "D3D[\"magnitude\"] = np.sqrt(D3D.ucy**2 + D3D.ucx**2 + D3D.ucz**2)" ] }, { @@ -1972,29 +1994,31 @@ ], "source": [ "# Plot Delft3D interpolated Data\n", - "fig,ax = plt.subplots(figsize=(10,4.4))\n", + "fig, ax = plt.subplots(figsize=(10, 4.4))\n", "contour_plot = plt.tripcolor(\n", - " D3D.x, \n", - " -D3D.waterdepth, \n", - " D3D.magnitude*river_bottom_filter_downsampled,\n", + " D3D.x,\n", + " -D3D.waterdepth,\n", + " D3D.magnitude * river_bottom_filter_downsampled,\n", " vmin=min_plot,\n", " vmax=max_plot,\n", - " #shading='gouraud'\n", - " alpha=1\n", + " # shading='gouraud'\n", + " alpha=1,\n", ")\n", "\n", "# Plot the river bottom calculated frol ADCP for comparison\n", - "plt.plot(ideal_points.utm_x,-bottom_avg,'k', label= 'river bottom')\n", + "plt.plot(ideal_points.utm_x, -bottom_avg, \"k\", label=\"river bottom\")\n", "\n", "# Figure settings\n", - "plt.xlabel('$UTM_x (m)$')\n", - "plt.ylabel('Water Depth (m)')\n", - "cbar= plt.colorbar(contour_plot)\n", - "cbar.set_label('velocity [m/s]')\n", - "plt.ylim([-8.5,-1])\n", - "plt.xlim([400960,401090])\n", - "plt.legend(loc= 7)\n", - "ax.get_xaxis().set_major_formatter(matplotlib.ticker.FuncFormatter(lambda x, p: format(int(x), ',')))\n", + "plt.xlabel(\"$UTM_x (m)$\")\n", + "plt.ylabel(\"Water Depth (m)\")\n", + "cbar = plt.colorbar(contour_plot)\n", + "cbar.set_label(\"velocity [m/s]\")\n", + "plt.ylim([-8.5, -1])\n", + "plt.xlim([400960, 401090])\n", + "plt.legend(loc=7)\n", + "ax.get_xaxis().set_major_formatter(\n", + " matplotlib.ticker.FuncFormatter(lambda x, p: format(int(x), \",\"))\n", + ")\n", "plt.xticks(rotation=45)" ] }, @@ -2021,7 +2045,10 @@ "outputs": [], "source": [ "# L1\n", - "L1_Magnitude= 
abs(ADCP_ideal_downsamples.magnitude-D3D.magnitude)/ADCP_ideal_downsamples.magnitude" + "L1_Magnitude = (\n", + " abs(ADCP_ideal_downsamples.magnitude - D3D.magnitude)\n", + " / ADCP_ideal_downsamples.magnitude\n", + ")" ] }, { @@ -2039,15 +2066,17 @@ "metadata": {}, "outputs": [], "source": [ - "river_bottom_edge_filter_downsampled= []\n", - "for i in L1_Magnitude:\n", - " if 1 > i: \n", - " filter= 1 \n", - " else: \n", - " filter= float(\"nan\")\n", - " river_bottom_edge_filter_downsampled= np.append(river_bottom_edge_filter_downsampled, filter)\n", - " \n", - "error_filter = river_bottom_edge_filter_downsampled*river_bottom_filter_downsampled" + "river_bottom_edge_filter_downsampled = []\n", + "for i in L1_Magnitude:\n", + " if 1 > i:\n", + " filter = 1\n", + " else:\n", + " filter = float(\"nan\")\n", + " river_bottom_edge_filter_downsampled = np.append(\n", + " river_bottom_edge_filter_downsampled, filter\n", + " )\n", + "\n", + "error_filter = river_bottom_edge_filter_downsampled * river_bottom_filter_downsampled" ] }, { @@ -2079,7 +2108,7 @@ ], "source": [ "# Calculate and priont the Mean Absolute Error\n", - "MAE= np.sum(L1_Magnitude*error_filter)/len(L1_Magnitude[L1_Magnitude< 1000 ])\n", + "MAE = np.sum(L1_Magnitude * error_filter) / len(L1_Magnitude[L1_Magnitude < 1000])\n", "MAE" ] }, @@ -2121,33 +2150,35 @@ ], "source": [ "# Set the min and max error values\n", - "max_plot_error=1\n", - "min_plot_error=0\n", + "max_plot_error = 1\n", + "min_plot_error = 0\n", "\n", "# Plotting the L1 error\n", - "fig,ax = plt.subplots(figsize=(10,4.4))\n", + "fig, ax = plt.subplots(figsize=(10, 4.4))\n", "contour_plot_L1 = plt.tripcolor(\n", - " D3D.x, \n", - " -D3D.waterdepth, \n", - " L1_Magnitude*error_filter,\n", + " D3D.x,\n", + " -D3D.waterdepth,\n", + " L1_Magnitude * error_filter,\n", " vmin=min_plot_error,\n", - " vmax=max_plot_error\n", - " )\n", + " vmax=max_plot_error,\n", + ")\n", "\n", "# Plot the river bottom for comparison\n", - 
"plt.plot(ideal_points.utm_x,-bottom_avg,'k', label= 'river bottom')\n", + "plt.plot(ideal_points.utm_x, -bottom_avg, \"k\", label=\"river bottom\")\n", "\n", "# Plot settings\n", - "plt.xlim([400960,401090])\n", - "plt.ylim([-8.5,-1])\n", - "plt.xlabel('UTM x (m)')\n", - "plt.ylabel('Water Depth (m)')\n", - "cbar= plt.colorbar(contour_plot_L1)\n", - "cbar.set_label('$L_1$ Velocity Error')\n", - "plt.legend(loc= 7)\n", - "\n", - "ax.get_xaxis().set_major_formatter(matplotlib.ticker.FuncFormatter(lambda x, p: format(int(x), ',')))\n", - "plt.xticks(rotation=45)\n" + "plt.xlim([400960, 401090])\n", + "plt.ylim([-8.5, -1])\n", + "plt.xlabel(\"UTM x (m)\")\n", + "plt.ylabel(\"Water Depth (m)\")\n", + "cbar = plt.colorbar(contour_plot_L1)\n", + "cbar.set_label(\"$L_1$ Velocity Error\")\n", + "plt.legend(loc=7)\n", + "\n", + "ax.get_xaxis().set_major_formatter(\n", + " matplotlib.ticker.FuncFormatter(lambda x, p: format(int(x), \",\"))\n", + ")\n", + "plt.xticks(rotation=45)" ] }, { @@ -2169,8 +2200,11 @@ "metadata": {}, "outputs": [], "source": [ - "# L2 \n", - "L2_Magnitude= ((ADCP_ideal_downsamples.magnitude-D3D.magnitude)/ADCP_ideal_downsamples.magnitude)**2" + "# L2\n", + "L2_Magnitude = (\n", + " (ADCP_ideal_downsamples.magnitude - D3D.magnitude)\n", + " / ADCP_ideal_downsamples.magnitude\n", + ") ** 2" ] }, { @@ -2202,7 +2236,7 @@ } ], "source": [ - "MSE=np.sum(L2_Magnitude*error_filter)/np.size(L2_Magnitude[L2_Magnitude< 1000])\n", + "MSE = np.sum(L2_Magnitude * error_filter) / np.size(L2_Magnitude[L2_Magnitude < 1000])\n", "MSE" ] }, @@ -2244,29 +2278,31 @@ ], "source": [ "# Create a contour plot of the error\n", - "# Plotting \n", - "fig,ax = plt.subplots(figsize=(10,4.4))\n", + "# Plotting\n", + "fig, ax = plt.subplots(figsize=(10, 4.4))\n", "contour_plot_L2 = plt.tripcolor(\n", - " D3D.x, \n", - " -D3D.waterdepth, \n", - " L2_Magnitude*error_filter,\n", + " D3D.x,\n", + " -D3D.waterdepth,\n", + " L2_Magnitude * error_filter,\n", " vmin=min_plot_error,\n", - " 
vmax=max_plot_error\n", + " vmax=max_plot_error,\n", ")\n", "\n", "# Plot the river bottom for comparison\n", - "plt.plot(ideal_points.utm_x,-bottom_avg,'k', label= 'river bottom')\n", + "plt.plot(ideal_points.utm_x, -bottom_avg, \"k\", label=\"river bottom\")\n", "\n", "# Plot settings\n", - "plt.xlim([400960,401090])\n", - "plt.ylim([-8.5,-1])\n", - "plt.xlabel('UTM x (m)')\n", - "plt.ylabel('Water Depth (m)')\n", - "cbar= plt.colorbar(contour_plot_L1)\n", - "cbar.set_label('$L_2$ Velocity Error')\n", - "plt.legend(loc= 7)\n", - "\n", - "ax.get_xaxis().set_major_formatter(matplotlib.ticker.FuncFormatter(lambda x, p: format(int(x), ',')))\n", + "plt.xlim([400960, 401090])\n", + "plt.ylim([-8.5, -1])\n", + "plt.xlabel(\"UTM x (m)\")\n", + "plt.ylabel(\"Water Depth (m)\")\n", + "cbar = plt.colorbar(contour_plot_L1)\n", + "cbar.set_label(\"$L_2$ Velocity Error\")\n", + "plt.legend(loc=7)\n", + "\n", + "ax.get_xaxis().set_major_formatter(\n", + " matplotlib.ticker.FuncFormatter(lambda x, p: format(int(x), \",\"))\n", + ")\n", "plt.xticks(rotation=45)" ] }, @@ -2301,7 +2337,7 @@ ], "source": [ "# L inf\n", - "L_inf=np.nanmax(L1_Magnitude*error_filter)\n", + "L_inf = np.nanmax(L1_Magnitude * error_filter)\n", "L_inf" ] }, diff --git a/examples/Delft3D_example.ipynb b/examples/Delft3D_example.ipynb index a87de112b..1c76ca080 100644 --- a/examples/Delft3D_example.ipynb +++ b/examples/Delft3D_example.ipynb @@ -22,14 +22,15 @@ "outputs": [], "source": [ "from os.path import abspath, dirname, join, normpath, relpath\n", - "from mhkit.river.io import d3d \n", + "from mhkit.river.io import d3d\n", "from math import isclose\n", "import scipy.interpolate as interp\n", "import matplotlib.pyplot as plt\n", "import numpy as np\n", "import pandas as pd\n", "import netCDF4\n", - "plt.rcParams.update({'font.size': 15}) # Set font size of plots title and labels " + "\n", + "plt.rcParams.update({\"font.size\": 15}) # Set font size of plots title and labels" ] }, { @@ -111,16 +112,16 @@ 
], "source": [ "# Downloading Data\n", - "datadir = normpath(join(relpath(join('data', 'river', 'd3d'))))\n", - "filename= 'turbineTest_map.nc'\n", - "d3d_data = netCDF4.Dataset(join(datadir,filename)) \n", + "datadir = normpath(join(relpath(join(\"data\", \"river\", \"d3d\"))))\n", + "filename = \"turbineTest_map.nc\"\n", + "d3d_data = netCDF4.Dataset(join(datadir, filename))\n", "\n", "# Printing variable and description\n", "for var in d3d_data.variables.keys():\n", - " try: \n", + " try:\n", " d3d_data[var].long_name\n", " except:\n", - " print(f'\"{var}\"') \n", + " print(f'\"{var}\"')\n", " else:\n", " print(f'\"{var}\": {d3d_data[var].long_name}')" ] @@ -150,7 +151,7 @@ } ], "source": [ - "time= d3d.get_all_time(d3d_data)\n", + "time = d3d.get_all_time(d3d_data)\n", "print(time)" ] }, @@ -186,7 +187,7 @@ ], "source": [ "seconds_run = 62\n", - "time_index=d3d._convert_time(d3d_data,seconds_run=seconds_run)\n", + "time_index = d3d._convert_time(d3d_data, seconds_run=seconds_run)\n", "print(time_index)" ] }, @@ -229,14 +230,14 @@ } ], "source": [ - "# Getting variable data \n", - "variable= 'ucx' \n", - "var_data_df= d3d.get_all_data_points(d3d_data, variable, time_index=4)\n", + "# Getting variable data\n", + "variable = \"ucx\"\n", + "var_data_df = d3d.get_all_data_points(d3d_data, variable, time_index=4)\n", "print(var_data_df)\n", "\n", - "# Setting plot limits \n", - "max_plot_vel= 1.25\n", - "min_plot_vel=0.5" + "# Setting plot limits\n", + "max_plot_vel = 1.25\n", + "min_plot_vel = 0.5" ] }, { @@ -331,21 +332,21 @@ ], "source": [ "# Use rectangular grid min and max to find flume centerline\n", - "xmin=var_data_df.x.max()\n", - "xmax=var_data_df.x.min()\n", + "xmin = var_data_df.x.max()\n", + "xmax = var_data_df.x.min()\n", "\n", - "ymin=var_data_df.y.max()\n", - "ymax=var_data_df.y.min()\n", + "ymin = var_data_df.y.max()\n", + "ymax = var_data_df.y.min()\n", "\n", - "waterdepth_min=var_data_df.waterdepth.max()\n", - 
"waterdepth_max=var_data_df.waterdepth.min()\n", + "waterdepth_min = var_data_df.waterdepth.max()\n", + "waterdepth_max = var_data_df.waterdepth.min()\n", "\n", - "# Creating one array and 2 points \n", + "# Creating one array and 2 points\n", "x = np.linspace(xmin, xmax)\n", - "y = np.mean([ymin,ymax])\n", - "waterdepth = np.mean([waterdepth_min,waterdepth_max])\n", + "y = np.mean([ymin, ymax])\n", + "waterdepth = np.mean([waterdepth_min, waterdepth_max])\n", "\n", - "# Creating an array of points \n", + "# Creating an array of points\n", "cline_points = d3d.create_points(x, y, waterdepth)\n", "cline_points.head()" ] @@ -390,19 +391,19 @@ "source": [ "# Interpolate raw data onto the centerline\n", "cline_variable = interp.griddata(\n", - " var_data_df[['x','y','waterdepth']], \n", + " var_data_df[[\"x\", \"y\", \"waterdepth\"]],\n", " var_data_df[variable],\n", - " cline_points[['x','y','waterdepth']]\n", - ") \n", + " cline_points[[\"x\", \"y\", \"waterdepth\"]],\n", + ")\n", "\n", "# Plotting\n", - "plt.figure(figsize=(12,5))\n", + "plt.figure(figsize=(12, 5))\n", "plt.plot(x, cline_variable)\n", "\n", "plt.grid()\n", - "plt.xlabel('x (m)')\n", - "plt.ylabel('$u_x$ [m/s]' )\n", - "plt.title(f'Centerline Velocity at: {var_data_df.time[1]} s')" + "plt.xlabel(\"x (m)\")\n", + "plt.ylabel(\"$u_x$ [m/s]\")\n", + "plt.title(f\"Centerline Velocity at: {var_data_df.time[1]} s\")" ] }, { @@ -451,23 +452,23 @@ "layer = 2\n", "layer_data = d3d.get_layer_data(d3d_data, variable, layer)\n", "\n", - "# Plotting \n", - "plt.figure(figsize=(12,4))\n", + "# Plotting\n", + "plt.figure(figsize=(12, 4))\n", "contour_plot = plt.tricontourf(\n", " layer_data.x,\n", - " layer_data.y, \n", - " layer_data.v, \n", + " layer_data.y,\n", + " layer_data.v,\n", " vmin=min_plot_vel,\n", " vmax=max_plot_vel,\n", - " levels=np.linspace(min_plot_vel,max_plot_vel,10)\n", + " levels=np.linspace(min_plot_vel, max_plot_vel, 10),\n", ")\n", - " \n", + "\n", "cbar = plt.colorbar(contour_plot)\n", - 
"cbar.set_label('$u_x$ [m/s]')\n", - " \n", - "plt.xlabel('x [m]')\n", - "plt.ylabel('y [m]')\n", - "plt.title(f'Velocity on Layer {layer} at Time: {layer_data.time[1]} s')" + "cbar.set_label(\"$u_x$ [m/s]\")\n", + "\n", + "plt.xlabel(\"x [m]\")\n", + "plt.ylabel(\"y [m]\")\n", + "plt.title(f\"Velocity on Layer {layer} at Time: {layer_data.time[1]} s\")" ] }, { @@ -617,9 +618,9 @@ "# Create x-y plane at z level midpoint\n", "x2 = np.linspace(xmin, xmax, num=100)\n", "y_contour = np.linspace(ymin, ymax, num=40)\n", - "z2 = np.mean([waterdepth_min,waterdepth_max])\n", + "z2 = np.mean([waterdepth_min, waterdepth_max])\n", "\n", - "contour_points = d3d.create_points(x2, y_contour, z2) \n", + "contour_points = d3d.create_points(x2, y_contour, z2)\n", "contour_points" ] }, @@ -639,9 +640,9 @@ "outputs": [], "source": [ "contour_variable = interp.griddata(\n", - " var_data_df[['x','y','waterdepth']],\n", + " var_data_df[[\"x\", \"y\", \"waterdepth\"]],\n", " var_data_df[variable],\n", - " contour_points[['x','y','waterdepth']]\n", + " contour_points[[\"x\", \"y\", \"waterdepth\"]],\n", ")" ] }, @@ -673,23 +674,23 @@ } ], "source": [ - "# Plotting \n", - "plt.figure(figsize=(12,4))\n", + "# Plotting\n", + "plt.figure(figsize=(12, 4))\n", "contour_plot = plt.tricontourf(\n", " contour_points.x,\n", " contour_points.y,\n", " contour_variable,\n", " vmin=min_plot_vel,\n", " vmax=max_plot_vel,\n", - " levels=np.linspace(min_plot_vel,max_plot_vel,10)\n", + " levels=np.linspace(min_plot_vel, max_plot_vel, 10),\n", ")\n", "\n", - "plt.xlabel('x (m)')\n", - "plt.ylabel('y (m)')\n", - "plt.title(f'Velocity on x-y Plane')\n", + "plt.xlabel(\"x (m)\")\n", + "plt.ylabel(\"y (m)\")\n", + "plt.title(f\"Velocity on x-y Plane\")\n", "\n", - "cbar= plt.colorbar(contour_plot)\n", - "cbar.set_label(f'$u_x$ [m/s]')" + "cbar = plt.colorbar(contour_plot)\n", + "cbar.set_label(f\"$u_x$ [m/s]\")" ] }, { @@ -925,33 +926,29 @@ } ], "source": [ - "# Calculating turbulent intensity \n", - 
"TI=d3d.turbulent_intensity(\n", - " d3d_data,\n", - " points=contour_points,\n", - " intermediate_values=True\n", - ") \n", + "# Calculating turbulent intensity\n", + "TI = d3d.turbulent_intensity(d3d_data, points=contour_points, intermediate_values=True)\n", "\n", - "# Creating new plot limits \n", - "max_plot_TI=27\n", - "min_plot_TI=0\n", + "# Creating new plot limits\n", + "max_plot_TI = 27\n", + "min_plot_TI = 0\n", "\n", - "# Plotting \n", - "plt.figure(figsize=(12,4))\n", + "# Plotting\n", + "plt.figure(figsize=(12, 4))\n", "contour_plot = plt.tricontourf(\n", - " TI.x, \n", - " TI.y, \n", + " TI.x,\n", + " TI.y,\n", " TI.turbulent_intensity,\n", - " vmin=min_plot_TI, \n", + " vmin=min_plot_TI,\n", " vmax=max_plot_TI,\n", - " levels=np.linspace(min_plot_TI,max_plot_TI,10)\n", + " levels=np.linspace(min_plot_TI, max_plot_TI, 10),\n", ")\n", "\n", - "plt.xlabel('x (m)')\n", - "plt.ylabel('y (m)')\n", - "plt.title('Turbulent Intensity')\n", - "cbar= plt.colorbar(contour_plot)\n", - "cbar.set_label('Turbulent Intensity [%]')\n", + "plt.xlabel(\"x (m)\")\n", + "plt.ylabel(\"y (m)\")\n", + "plt.title(\"Turbulent Intensity\")\n", + "cbar = plt.colorbar(contour_plot)\n", + "cbar.set_label(\"Turbulent Intensity [%]\")\n", "\n", "TI" ] @@ -1183,37 +1180,39 @@ } ], "source": [ - "variables= ['turkin1', 'ucx', 'ucy', 'ucz']\n", + "variables = [\"turkin1\", \"ucx\", \"ucy\", \"ucz\"]\n", "\n", - "Var= d3d.variable_interpolation(d3d_data, variables, points='faces', edges = 'nearest')\n", + "Var = d3d.variable_interpolation(d3d_data, variables, points=\"faces\", edges=\"nearest\")\n", "\n", "# Replacing negative numbers close to zero with zero\n", - "neg_index=np.where(Var['turkin1']<0)# Finding negative numbers\n", + "neg_index = np.where(Var[\"turkin1\"] < 0) # Finding negative numbers\n", "\n", - "# Determining if negative number are close to zero \n", - "zero_bool= np.isclose(\n", - " Var['turkin1'][Var['turkin1']<0].array, \n", - " 
np.zeros(len(Var['turkin1'][Var['turkin1']<0].array)),\n", - " atol=1.0e-4\n", + "# Determining if negative number are close to zero\n", + "zero_bool = np.isclose(\n", + " Var[\"turkin1\"][Var[\"turkin1\"] < 0].array,\n", + " np.zeros(len(Var[\"turkin1\"][Var[\"turkin1\"] < 0].array)),\n", + " atol=1.0e-4,\n", ")\n", "\n", - "# Identifying the location of negative values close to zero \n", - "zero_ind= neg_index[0][zero_bool] \n", + "# Identifying the location of negative values close to zero\n", + "zero_ind = neg_index[0][zero_bool]\n", "\n", "# Identifying the location of negative number that are not close to zero\n", - "non_zero_ind= neg_index[0][~zero_bool]\n", + "non_zero_ind = neg_index[0][~zero_bool]\n", "\n", - "# Replacing negative number close to zero with zero \n", - "Var.loc[zero_ind,'turkin1']=np.zeros(len(zero_ind)) \n", + "# Replacing negative number close to zero with zero\n", + "Var.loc[zero_ind, \"turkin1\"] = np.zeros(len(zero_ind))\n", "\n", - "# Replacing negative numbers not close to zero with nan \n", - "Var.loc[non_zero_ind,'turkin1']=[np.nan]*len(non_zero_ind)\n", + "# Replacing negative numbers not close to zero with nan\n", + "Var.loc[non_zero_ind, \"turkin1\"] = [np.nan] * len(non_zero_ind)\n", "\n", - "# Calculating the root mean squared velocity \n", - "Var['u_mag']=d3d.unorm(np.array(Var['ucx']),np.array(Var['ucy']), np.array(Var['ucz']))\n", + "# Calculating the root mean squared velocity\n", + "Var[\"u_mag\"] = d3d.unorm(\n", + " np.array(Var[\"ucx\"]), np.array(Var[\"ucy\"]), np.array(Var[\"ucz\"])\n", + ")\n", "\n", - "# Calculating turbulent intensity as a percent \n", - "Var['turbulent_intensity']= (np.sqrt(2/3*Var['turkin1'])/Var['u_mag'])*100 \n", + "# Calculating turbulent intensity as a percent\n", + "Var[\"turbulent_intensity\"] = (np.sqrt(2 / 3 * Var[\"turkin1\"]) / Var[\"u_mag\"]) * 100\n", "\n", "Var" ] @@ -1258,43 +1257,47 @@ } ], "source": [ - "turbine_x_loc= 6 \n", - "turbine_diameter= 0.7\n", - "N=1\n", - "x_sample = 
turbine_x_loc+N*turbine_diameter\n", + "turbine_x_loc = 6\n", + "turbine_diameter = 0.7\n", + "N = 1\n", + "x_sample = turbine_x_loc + N * turbine_diameter\n", "y_samples = np.linspace(ymin, ymax, num=40)\n", - "waterdepth_samples = np.linspace(waterdepth_min,waterdepth_max, num=256)\n", + "waterdepth_samples = np.linspace(waterdepth_min, waterdepth_max, num=256)\n", "\n", - "variables= ['turkin1', 'ucx', 'ucy', 'ucz']\n", - "sample_points = d3d.create_points(x_sample, y_samples, waterdepth_samples) \n", + "variables = [\"turkin1\", \"ucx\", \"ucy\", \"ucz\"]\n", + "sample_points = d3d.create_points(x_sample, y_samples, waterdepth_samples)\n", "\n", - "Var_sample= d3d.variable_interpolation(d3d_data, variables, points= sample_points, edges = 'nearest')\n", + "Var_sample = d3d.variable_interpolation(\n", + " d3d_data, variables, points=sample_points, edges=\"nearest\"\n", + ")\n", "\n", - "#root mean squared calculation \n", - "Var_sample['u_mag']=d3d.unorm(\n", - " np.array(Var_sample['ucx']),\n", - " np.array(Var_sample['ucy']), \n", - " np.array(Var_sample['ucz'])\n", - ") \n", + "# root mean squared calculation\n", + "Var_sample[\"u_mag\"] = d3d.unorm(\n", + " np.array(Var_sample[\"ucx\"]),\n", + " np.array(Var_sample[\"ucy\"]),\n", + " np.array(Var_sample[\"ucz\"]),\n", + ")\n", "# turbulent intesity calculation\n", - "Var_sample['turbulent_intensity']= np.sqrt(2/3*Var_sample['turkin1'])/Var_sample['u_mag']*100 \n", + "Var_sample[\"turbulent_intensity\"] = (\n", + " np.sqrt(2 / 3 * Var_sample[\"turkin1\"]) / Var_sample[\"u_mag\"] * 100\n", + ")\n", "\n", - "# Plotting \n", - "plt.figure(figsize=(10,4.4))\n", + "# Plotting\n", + "plt.figure(figsize=(10, 4.4))\n", "contour_plot = plt.tricontourf(\n", - " Var_sample.y, \n", - " Var_sample.waterdepth, \n", + " Var_sample.y,\n", + " Var_sample.waterdepth,\n", " Var_sample.turbulent_intensity,\n", - " vmin=min_plot_TI, \n", + " vmin=min_plot_TI,\n", " vmax=max_plot_TI,\n", - " 
levels=np.linspace(min_plot_TI,max_plot_TI,10)\n", + " levels=np.linspace(min_plot_TI, max_plot_TI, 10),\n", ")\n", "\n", - "plt.xlabel('y (m)')\n", - "plt.ylabel('z (m)')\n", - "plt.title('Turbulent Intensity')\n", - "cbar= plt.colorbar(contour_plot)\n", - "cbar.set_label('Turbulent Intensity [%]')" + "plt.xlabel(\"y (m)\")\n", + "plt.ylabel(\"z (m)\")\n", + "plt.title(\"Turbulent Intensity\")\n", + "cbar = plt.colorbar(contour_plot)\n", + "cbar.set_label(\"Turbulent Intensity [%]\")" ] }, { diff --git a/examples/PacWave_resource_characterization_example.ipynb b/examples/PacWave_resource_characterization_example.ipynb index 80594fba1..0b4248f7a 100644 --- a/examples/PacWave_resource_characterization_example.ipynb +++ b/examples/PacWave_resource_characterization_example.ipynb @@ -24,7 +24,7 @@ "from sklearn.mixture import GaussianMixture\n", "from mhkit.wave.io import ndbc\n", "import matplotlib.pyplot as plt\n", - "from matplotlib import colors \n", + "from matplotlib import colors\n", "from scipy import stats\n", "import pandas as pd\n", "import numpy as np\n", @@ -32,12 +32,15 @@ "import os\n", "\n", "import matplotlib.pylab as pylab\n", - "params = {'legend.fontsize': 'x-large',\n", - " 'figure.figsize': (15, 5),\n", - " 'axes.labelsize': 'x-large',\n", - " 'axes.titlesize':'x-large',\n", - " 'xtick.labelsize':'x-large',\n", - " 'ytick.labelsize':'x-large'}\n", + "\n", + "params = {\n", + " \"legend.fontsize\": \"x-large\",\n", + " \"figure.figsize\": (15, 5),\n", + " \"axes.labelsize\": \"x-large\",\n", + " \"axes.titlesize\": \"x-large\",\n", + " \"xtick.labelsize\": \"x-large\",\n", + " \"ytick.labelsize\": \"x-large\",\n", + "}\n", "pylab.rcParams.update(params)" ] }, @@ -207,15 +210,30 @@ } ], "source": [ - "m = folium.Map(location=[44.613600975457715, -123.74317583354498], zoom_start=9, tiles=\"Stamen Terrain\", control_scale = True)\n", + "m = folium.Map(\n", + " location=[44.613600975457715, -123.74317583354498],\n", + " zoom_start=9,\n", + " 
tiles=\"Stamen Terrain\",\n", + " control_scale=True,\n", + ")\n", "\n", "tooltip = \"NDBC 46050\"\n", - "folium.Marker([44.669, -124.546], popup=\" Water depth: 160 m\", tooltip=tooltip).add_to(m)\n", + "folium.Marker(\n", + " [44.669, -124.546], popup=\" Water depth: 160 m\", tooltip=tooltip\n", + ").add_to(m)\n", "\n", "tooltip = \"PACWAVE North\"\n", - "folium.Marker([44.69, -124.13472222222222], tooltip=tooltip, icon=folium.Icon(color='green',icon=\"th-large\")).add_to(m)\n", + "folium.Marker(\n", + " [44.69, -124.13472222222222],\n", + " tooltip=tooltip,\n", + " icon=folium.Icon(color=\"green\", icon=\"th-large\"),\n", + ").add_to(m)\n", "tooltip = \"PACWAVE South\"\n", - "folium.Marker([44.58444444444444, -124.2125], tooltip=tooltip, icon=folium.Icon(color='red', icon=\"th\")).add_to(m)\n", + "folium.Marker(\n", + " [44.58444444444444, -124.2125],\n", + " tooltip=tooltip,\n", + " icon=folium.Icon(color=\"red\", icon=\"th\"),\n", + ").add_to(m)\n", "\n", "m.save(\"index.png\")\n", "\n", @@ -259,7 +277,7 @@ ], "source": [ "# Get buoy metadata\n", - "buoy_number = '46050' \n", + "buoy_number = \"46050\"\n", "buoy_metadata = ndbc.get_buoy_metadata(buoy_number)\n", "print(\"Buoy Metadata:\")\n", "for key, value in buoy_metadata.items():\n", @@ -631,17 +649,17 @@ ], "source": [ "# Spectral wave density for buoy 46050\n", - "parameter = 'swden'\n", + "parameter = \"swden\"\n", "\n", "\n", "# Request list of available files\n", - "ndbc_available_data= ndbc.available_data(parameter, buoy_number)\n", + "ndbc_available_data = ndbc.available_data(parameter, buoy_number)\n", "\n", "# Pass file names to NDBC and request the data\n", - "filenames = ndbc_available_data['filename']\n", + "filenames = ndbc_available_data[\"filename\"]\n", "ndbc_requested_data = ndbc.request_data(parameter, filenames)\n", "\n", - "ndbc_requested_data['2020']" + "ndbc_requested_data[\"2020\"]" ] }, { @@ -1048,13 +1066,13 @@ } ], "source": [ - "ndbc_data={}\n", + "ndbc_data = {}\n", "# Create a 
Datetime Index and remove NOAA date columns for each year\n", "for year in ndbc_requested_data:\n", " year_data = ndbc_requested_data[year]\n", " ndbc_data[year] = ndbc.to_datetime_index(parameter, year_data)\n", - " \n", - "ndbc_data['2020']" + "\n", + "ndbc_data[\"2020\"]" ] }, { @@ -1073,11 +1091,11 @@ "outputs": [], "source": [ "# Intialize empty lists to store the results from each year\n", - "Hm0_list=[]\n", - "Te_list=[]\n", - "J_list=[]\n", - "Tp_list=[]\n", - "Tz_list=[]\n", + "Hm0_list = []\n", + "Te_list = []\n", + "J_list = []\n", + "Tp_list = []\n", + "Tz_list = []\n", "\n", "# Iterate over each year and save the result in the initalized dictionary\n", "for year in ndbc_data:\n", @@ -1085,26 +1103,26 @@ " year_data = data_raw[data_raw != 999.0].dropna()\n", " Hm0_list.append(resource.significant_wave_height(year_data.T))\n", " Te_list.append(resource.energy_period(year_data.T))\n", - " J_list.append(resource.energy_flux(year_data.T, h=399.))\n", + " J_list.append(resource.energy_flux(year_data.T, h=399.0))\n", " Tp_list.append(resource.peak_period(year_data.T))\n", " Tz_list.append(resource.average_zero_crossing_period(year_data.T))\n", - " \n", + "\n", "# Concatenate list of Series into a single DataFrame\n", - "Te = pd.concat(Te_list ,axis=0)\n", - "Tp = pd.concat(Tp_list ,axis=0)\n", - "Hm0 = pd.concat(Hm0_list ,axis=0)\n", - "J = pd.concat(J_list ,axis=0)\n", - "Tz = pd.concat(Tz_list ,axis=0)\n", - "data = pd.concat([Hm0, Te, Tp, J, Tz],axis=1)\n", + "Te = pd.concat(Te_list, axis=0)\n", + "Tp = pd.concat(Tp_list, axis=0)\n", + "Hm0 = pd.concat(Hm0_list, axis=0)\n", + "J = pd.concat(J_list, axis=0)\n", + "Tz = pd.concat(Tz_list, axis=0)\n", + "data = pd.concat([Hm0, Te, Tp, J, Tz], axis=1)\n", "\n", "# Calculate wave steepness\n", - "data['Sm'] = data.Hm0 / (9.81/(2*np.pi) * data.Tz**2)\n", + "data[\"Sm\"] = data.Hm0 / (9.81 / (2 * np.pi) * data.Tz**2)\n", "\n", "# Drop any NaNs created from the calculation of Hm0 or Te\n", 
"data.dropna(inplace=True)\n", "# Sort the DateTime index\n", "data.sort_index(inplace=True)\n", - "#data" + "# data" ] }, { @@ -1140,20 +1158,22 @@ "# Start by cleaning the data of outliers\n", "data_clean = data[data.Hm0 < 20]\n", "sigma = data_clean.J.std()\n", - "data_clean = data_clean[data_clean.J > (data_clean.J.mean() - 0.9* sigma)]\n", + "data_clean = data_clean[data_clean.J > (data_clean.J.mean() - 0.9 * sigma)]\n", "\n", - "# Organizing the cleaned data \n", - "Hm0=data_clean.Hm0\n", - "Te=data_clean.Te\n", - "J=data_clean.J\n", + "# Organizing the cleaned data\n", + "Hm0 = data_clean.Hm0\n", + "Te = data_clean.Te\n", + "J = data_clean.J\n", "\n", - "# Setting the bins for the resource frequency and power distribution \n", + "# Setting the bins for the resource frequency and power distribution\n", "Hm0_bin_size = 0.5\n", - "Hm0_edges = np.arange(0,15+Hm0_bin_size,Hm0_bin_size)\n", + "Hm0_edges = np.arange(0, 15 + Hm0_bin_size, Hm0_bin_size)\n", "Te_bin_size = 1\n", - "Te_edges = np.arange(0, 20+Te_bin_size,Te_bin_size)\n", + "Te_edges = np.arange(0, 20 + Te_bin_size, Te_bin_size)\n", "\n", - "fig = mhkit.wave.graphics.plot_avg_annual_energy_matrix(Hm0, Te, J, Hm0_edges=Hm0_edges, Te_edges=Te_edges)" + "fig = mhkit.wave.graphics.plot_avg_annual_energy_matrix(\n", + " Hm0, Te, J, Hm0_edges=Hm0_edges, Te_edges=Te_edges\n", + ")" ] }, { @@ -1212,43 +1232,45 @@ } ], "source": [ - "months=data_clean.index.month\n", - "data_group=data_clean.groupby(months)\n", + "months = data_clean.index.month\n", + "data_group = data_clean.groupby(months)\n", "\n", "QoIs = data_clean.keys()\n", - "fig, axs = plt.subplots(len(QoIs),1, figsize=(8, 12), sharex=True)\n", - "#shade between 25% and 75%\n", + "fig, axs = plt.subplots(len(QoIs), 1, figsize=(8, 12), sharex=True)\n", + "# shade between 25% and 75%\n", "QoIs = data_clean.keys()\n", "for i in range(len(QoIs)):\n", " QoI = QoIs[i]\n", - " axs[i].plot(data_group.median()[QoI], marker='.')\n", + " 
axs[i].plot(data_group.median()[QoI], marker=\".\")\n", "\n", - " axs[i].fill_between(months.unique(),\n", - " data_group.describe()[QoI, '25%'],\n", - " data_group.describe()[QoI, '75%'],\n", - " alpha=0.2)\n", + " axs[i].fill_between(\n", + " months.unique(),\n", + " data_group.describe()[QoI, \"25%\"],\n", + " data_group.describe()[QoI, \"75%\"],\n", + " alpha=0.2,\n", + " )\n", " axs[i].grid()\n", " mx = data_group.median()[QoI].max()\n", - " mx_month= data_group.median()[QoI].argmax()+1\n", + " mx_month = data_group.median()[QoI].argmax() + 1\n", " mn = data_group.median()[QoI].min()\n", - " mn_month= data_group.median()[QoI].argmin()+1\n", - " print('--------------------------------------------')\n", - " print(f'{QoI} max:{np.round(mx,4)}, month: {mx_month}')\n", - " print(f'{QoI} min:{np.round(mn,4)}, month: {mn_month}')\n", + " mn_month = data_group.median()[QoI].argmin() + 1\n", + " print(\"--------------------------------------------\")\n", + " print(f\"{QoI} max:{np.round(mx,4)}, month: {mx_month}\")\n", + " print(f\"{QoI} min:{np.round(mn,4)}, month: {mn_month}\")\n", "\n", - "plt.setp(axs[5], xlabel='Month')\n", + "plt.setp(axs[5], xlabel=\"Month\")\n", "\n", - "plt.setp(axs[0], ylabel=f'{QoIs[0]} [m]')\n", - "plt.setp(axs[1], ylabel=f'{QoIs[1]} [s]')\n", - "plt.setp(axs[2], ylabel=f'{QoIs[2]} [s]')\n", - "plt.setp(axs[3], ylabel=f'{QoIs[3]} [kW/M]')\n", - "plt.setp(axs[4], ylabel=f'{QoIs[4]} [s]')\n", - "plt.setp(axs[5], ylabel=f'{QoIs[5]} [ ]')\n", + "plt.setp(axs[0], ylabel=f\"{QoIs[0]} [m]\")\n", + "plt.setp(axs[1], ylabel=f\"{QoIs[1]} [s]\")\n", + "plt.setp(axs[2], ylabel=f\"{QoIs[2]} [s]\")\n", + "plt.setp(axs[3], ylabel=f\"{QoIs[3]} [kW/M]\")\n", + "plt.setp(axs[4], ylabel=f\"{QoIs[4]} [s]\")\n", + "plt.setp(axs[5], ylabel=f\"{QoIs[5]} [ ]\")\n", "\n", "\n", "plt.tight_layout()\n", "\n", - "plt.savefig('40650QoIs.png')" + "plt.savefig(\"40650QoIs.png\")" ] }, { @@ -1290,7 +1312,7 @@ ], "source": [ "ax = 
graphics.monthly_cumulative_distribution(data_clean.J)\n", - "plt.xlim([1000, 1E6])" + "plt.xlim([1000, 1e6])" ] }, { @@ -1325,49 +1347,49 @@ } ], "source": [ - "# Delta time of sea-states \n", - "dt = (data_clean.index[2]-data_clean.index[1]).seconds \n", + "# Delta time of sea-states\n", + "dt = (data_clean.index[2] - data_clean.index[1]).seconds\n", "\n", "# Return period (years) of interest\n", - "period = 100 \n", + "period = 100\n", "copulas100 = contours.environmental_contours(\n", - " data.Hm0, \n", - " data.Te, \n", + " data.Hm0,\n", + " data.Te,\n", " dt,\n", " period,\n", - " method='PCA',\n", + " method=\"PCA\",\n", ")\n", "\n", "period = 50\n", "copulas50 = contours.environmental_contours(\n", - " data.Hm0, \n", - " data.Te, \n", - " dt, \n", - " period, \n", - " method='PCA', \n", + " data.Hm0,\n", + " data.Te,\n", + " dt,\n", + " period,\n", + " method=\"PCA\",\n", ")\n", "\n", "\n", "Te_data = np.array(data_clean.Te)\n", "Hm0_data = np.array(data_clean.Hm0)\n", "\n", - "Hm0_contours = [copulas50['PCA_x1'], copulas100['PCA_x1']]\n", - "Te_contours = [copulas50['PCA_x2'], copulas100['PCA_x2']]\n", + "Hm0_contours = [copulas50[\"PCA_x1\"], copulas100[\"PCA_x1\"]]\n", + "Te_contours = [copulas50[\"PCA_x2\"], copulas100[\"PCA_x2\"]]\n", "\n", - "fig, ax = plt.subplots(figsize=(9,4))\n", + "fig, ax = plt.subplots(figsize=(9, 4))\n", "ax = graphics.plot_environmental_contour(\n", - " Te_data, \n", - " Hm0_data, \n", - " Te_contours, \n", - " Hm0_contours , \n", - " data_label='NDBC 46050', \n", - " contour_label=['50 Year Contour','100 Year Contour'],\n", - " x_label = 'Energy Period, $Te$ [s]',\n", - " y_label = 'Sig. wave height, $Hm0$ [m]', \n", - " ax=ax\n", + " Te_data,\n", + " Hm0_data,\n", + " Te_contours,\n", + " Hm0_contours,\n", + " data_label=\"NDBC 46050\",\n", + " contour_label=[\"50 Year Contour\", \"100 Year Contour\"],\n", + " x_label=\"Energy Period, $Te$ [s]\",\n", + " y_label=\"Sig. 
wave height, $Hm0$ [m]\",\n", + " ax=ax,\n", ")\n", - "plt.legend(loc='upper left')\n", - "plt.tight_layout() " + "plt.legend(loc=\"upper left\")\n", + "plt.tight_layout()" ] }, { @@ -1390,10 +1412,14 @@ ], "source": [ "print(f\"50-year: Hm0 max {copulas50['PCA_x1'].max().round(1)}\")\n", - "print(f\"50-year: Te at Hm0 max {copulas50['PCA_x2'][copulas50['PCA_x1'].argmax()].round(1)}\")\n", + "print(\n", + " f\"50-year: Te at Hm0 max {copulas50['PCA_x2'][copulas50['PCA_x1'].argmax()].round(1)}\"\n", + ")\n", "print(\"\\n\")\n", "print(f\"100-year: Hm0 max {copulas100['PCA_x1'].max().round(1)}\")\n", - "print(f\"100-year: Te at Hm0 max { copulas100['PCA_x2'][copulas100['PCA_x1'].argmax()].round(1)}\")" + "print(\n", + " f\"100-year: Te at Hm0 max { copulas100['PCA_x2'][copulas100['PCA_x1'].argmax()].round(1)}\"\n", + ")" ] }, { @@ -1423,9 +1449,9 @@ } ], "source": [ - "nHours = (data_clean.index[1] - data_clean.index[0]).seconds/3600\n", + "nHours = (data_clean.index[1] - data_clean.index[0]).seconds / 3600\n", "Total = data_clean.J.sum() * nHours\n", - "print(f'{Total} (W*hr)/m')" + "print(f\"{Total} (W*hr)/m\")" ] }, { @@ -1451,11 +1477,12 @@ } ], "source": [ - "Jsum, xe, ye, bn = stats.binned_statistic_2d(data_clean.Hm0, data_clean.Te, data_clean.J,\n", - " statistic='sum')#,bins=[Te_bins, Hm0_bins])\n", + "Jsum, xe, ye, bn = stats.binned_statistic_2d(\n", + " data_clean.Hm0, data_clean.Te, data_clean.J, statistic=\"sum\"\n", + ") # ,bins=[Te_bins, Hm0_bins])\n", "\n", - "hist_result = np.round(Jsum.sum().sum()/Total,4)\n", - "print(f'{hist_result} = (2D Histogram J) / (1-year total J) ')" + "hist_result = np.round(Jsum.sum().sum() / Total, 4)\n", + "print(f\"{hist_result} = (2D Histogram J) / (1-year total J) \")" ] }, { @@ -1497,30 +1524,29 @@ ], "source": [ "# Compute Gaussian Mixture Model for each number of clusters\n", - "Ns= [4, 8, 16, 32, 64]\n", + "Ns = [4, 8, 16, 32, 64]\n", "X = np.vstack((data_clean.Te.values, data_clean.Hm0.values)).T\n", - "fig, axs 
= plt.subplots(len(Ns),1, figsize=(8, 24), sharex=True)\n", + "fig, axs = plt.subplots(len(Ns), 1, figsize=(8, 24), sharex=True)\n", "\n", - "results={}\n", + "results = {}\n", "for N in Ns:\n", " gmm = GaussianMixture(n_components=N).fit(X)\n", "\n", " # Save centers and weights\n", - " result = pd.DataFrame(gmm.means_, columns=['Te','Hm0'])\n", - " result['weights'] = gmm.weights_\n", + " result = pd.DataFrame(gmm.means_, columns=[\"Te\", \"Hm0\"])\n", + " result[\"weights\"] = gmm.weights_\n", "\n", - " result['Tp'] = result.Te / 0.858\n", + " result[\"Tp\"] = result.Te / 0.858\n", " results[N] = result\n", - " \n", - " \n", + "\n", " labels = gmm.predict(X)\n", - " \n", + "\n", " i = Ns.index(N)\n", " axs[i].scatter(data_clean.Te.values, data_clean.Hm0.values, c=labels, s=40)\n", - " axs[i].plot(result.Te, result.Hm0, 'm+')\n", - " axs[i].title.set_text(f'{N} Clusters')\n", - " plt.setp(axs[i], ylabel='Energy Period, $T_e$ [s]')\n", - "plt.setp(axs[len(Ns)-1], xlabel='Sig. wave height, $Hm0$ [m') " + " axs[i].plot(result.Te, result.Hm0, \"m+\")\n", + " axs[i].title.set_text(f\"{N} Clusters\")\n", + " plt.setp(axs[i], ylabel=\"Energy Period, $T_e$ [s]\")\n", + "plt.setp(axs[len(Ns) - 1], xlabel=\"Sig. 
wave height, $Hm0$ [m\")" ] }, { @@ -1555,26 +1581,26 @@ ], "source": [ "w = ndbc_data[year].columns.values\n", - "f = w / 2*np.pi\n", + "f = w / 2 * np.pi\n", "\n", "\n", "for N in results:\n", " result = results[N]\n", - " J=[]\n", + " J = []\n", " for i in range(len(result)):\n", " b = resource.jonswap_spectrum(f, result.Tp[i], result.Hm0[i])\n", - " J.extend([resource.energy_flux(b, h=399.).values[0][0]])\n", - " \n", - " result['J'] = J\n", + " J.extend([resource.energy_flux(b, h=399.0).values[0][0]])\n", + "\n", + " result[\"J\"] = J\n", " results[N] = result\n", "\n", - "ratios={}\n", + "ratios = {}\n", "for N in results:\n", - " J_hr = results[N].J*len(data_clean)\n", - " total_weighted_J= (J_hr * results[N].weights).sum()\n", + " J_hr = results[N].J * len(data_clean)\n", + " total_weighted_J = (J_hr * results[N].weights).sum()\n", " normalized_weighted_J = total_weighted_J / Total\n", " ratios[N] = np.round(normalized_weighted_J, 4)\n", - " \n", + "\n", "pd.Series(ratios)" ] }, diff --git a/examples/SWAN_example.ipynb b/examples/SWAN_example.ipynb index 974ca6cc0..d4eeb4620 100644 --- a/examples/SWAN_example.ipynb +++ b/examples/SWAN_example.ipynb @@ -20,7 +20,7 @@ "from os.path import join\n", "import pandas as pd\n", "\n", - "swan_data_folder = join('data','wave','swan')" + "swan_data_folder = join(\"data\", \"wave\", \"swan\")" ] }, { @@ -41,9 +41,9 @@ "metadata": {}, "outputs": [], "source": [ - "swan_table_file = join(swan_data_folder, 'SWANOUT.DAT')\n", - "swan_block_file = join(swan_data_folder, 'SWANOUTBlock.DAT')\n", - "swan_block_mat_file = join(swan_data_folder, 'SWANOUT.mat')" + "swan_table_file = join(swan_data_folder, \"SWANOUT.DAT\")\n", + "swan_block_file = join(swan_data_folder, \"SWANOUTBlock.DAT\")\n", + "swan_block_mat_file = join(swan_data_folder, \"SWANOUT.mat\")" ] }, { @@ -646,7 +646,7 @@ } ], "source": [ - "swan_block['Significant wave height']" + "swan_block[\"Significant wave height\"]" ] }, { @@ -1082,7 +1082,7 @@ } ], "source": 
[ - "swan_block_mat['Hsig']" + "swan_block_mat[\"Hsig\"]" ] }, { @@ -1323,10 +1323,9 @@ ], "source": [ "plt.figure()\n", - "plt.tricontourf(swan_table.Xp, swan_table.Yp, \n", - " swan_table.Hsig, levels=256)\n", + "plt.tricontourf(swan_table.Xp, swan_table.Yp, swan_table.Hsig, levels=256)\n", "cbar = plt.colorbar()\n", - "cbar.set_label('Significant wave height [m]')" + "cbar.set_label(\"Significant wave height [m]\")" ] }, { @@ -1349,11 +1348,15 @@ ], "source": [ "plt.figure()\n", - "plt.tricontourf(swan_block_mat_as_table.x, swan_block_mat_as_table.y, \n", - " swan_block_mat_as_table.Hsig,\n", - " levels=256, cmap='viridis')\n", + "plt.tricontourf(\n", + " swan_block_mat_as_table.x,\n", + " swan_block_mat_as_table.y,\n", + " swan_block_mat_as_table.Hsig,\n", + " levels=256,\n", + " cmap=\"viridis\",\n", + ")\n", "cbar = plt.colorbar()\n", - "cbar.set_label('Significant wave height [m]')" + "cbar.set_label(\"Significant wave height [m]\")" ] }, { @@ -1376,11 +1379,15 @@ ], "source": [ "plt.figure()\n", - "plt.tricontourf(swan_block_as_table.x, swan_block_as_table.y, \n", - " swan_block_as_table['Significant wave height'], \n", - " levels=256, cmap='viridis')\n", + "plt.tricontourf(\n", + " swan_block_as_table.x,\n", + " swan_block_as_table.y,\n", + " swan_block_as_table[\"Significant wave height\"],\n", + " levels=256,\n", + " cmap=\"viridis\",\n", + ")\n", "cbar = plt.colorbar()\n", - "cbar.set_label('Significant wave height [m]')" + "cbar.set_label(\"Significant wave height [m]\")" ] }, { @@ -1412,10 +1419,10 @@ ], "source": [ "plt.figure()\n", - "plt.imshow(swan_block_mat['Hsig'])\n", + "plt.imshow(swan_block_mat[\"Hsig\"])\n", "plt.gca().invert_yaxis()\n", "cbar = plt.colorbar()\n", - "cbar.set_label('Significant wave height [m]')" + "cbar.set_label(\"Significant wave height [m]\")" ] } ], diff --git a/examples/WPTO_hindcast_example.ipynb b/examples/WPTO_hindcast_example.ipynb index 9963a9ff0..1b6565797 100644 --- a/examples/WPTO_hindcast_example.ipynb +++ 
b/examples/WPTO_hindcast_example.ipynb @@ -101,7 +101,7 @@ } ], "source": [ - "lat_lon = [44.624076,-124.280097]\n", + "lat_lon = [44.624076, -124.280097]\n", "region = wave.io.hindcast.hindcast.region_selection(lat_lon)\n", "print(region)" ] @@ -121,12 +121,14 @@ "metadata": {}, "outputs": [], "source": [ - "data_type = '3-hour' # setting the data type to the 3-hour dataset\n", + "data_type = \"3-hour\" # setting the data type to the 3-hour dataset\n", "years = [1995]\n", - "lat_lon = (44.624076,-124.280097) \n", - "parameter = 'significant_wave_height' \n", + "lat_lon = (44.624076, -124.280097)\n", + "parameter = \"significant_wave_height\"\n", "\n", - "Hs, metadata= wave.io.hindcast.hindcast.request_wpto_point_data(data_type,parameter,lat_lon,years)" + "Hs, metadata = wave.io.hindcast.hindcast.request_wpto_point_data(\n", + " data_type, parameter, lat_lon, years\n", + ")" ] }, { @@ -378,11 +380,12 @@ } ], "source": [ - "parameter = 'energy_period'\n", - "lat_lon = ((44.624076,-124.280097),\n", - " (43.489171,-125.152137)) \n", + "parameter = \"energy_period\"\n", + "lat_lon = ((44.624076, -124.280097), (43.489171, -125.152137))\n", "\n", - "Te, metadata = wave.io.hindcast.hindcast.request_wpto_point_data(data_type, parameter, lat_lon, years)\n", + "Te, metadata = wave.io.hindcast.hindcast.request_wpto_point_data(\n", + " data_type, parameter, lat_lon, years\n", + ")\n", "\n", "# View Te from two locations\n", "Te.head()" @@ -582,11 +585,13 @@ } ], "source": [ - "years = [1995, 1996] \n", - "parameter = 'omni-directional_wave_power'\n", - "lat_lon = (44.624076,-124.280097) \n", + "years = [1995, 1996]\n", + "parameter = \"omni-directional_wave_power\"\n", + "lat_lon = (44.624076, -124.280097)\n", "\n", - "J, metadata= wave.io.hindcast.hindcast.request_wpto_point_data(data_type,parameter,lat_lon,years) \n", + "J, metadata = wave.io.hindcast.hindcast.request_wpto_point_data(\n", + " data_type, parameter, lat_lon, years\n", + ")\n", "\n", "J" ] @@ -670,12 +675,14 @@ 
"metadata": {}, "outputs": [], "source": [ - "data_type = '1-hour' # Setting the data_type to 1 hour data\n", - "years = [1995] \n", - "parameter = ['significant_wave_height','peak_period','mean_wave_direction']\n", - "lat_lon = (44.624076,-124.280097) \n", + "data_type = \"1-hour\" # Setting the data_type to 1 hour data\n", + "years = [1995]\n", + "parameter = [\"significant_wave_height\", \"peak_period\", \"mean_wave_direction\"]\n", + "lat_lon = (44.624076, -124.280097)\n", "\n", - "data, metadata= wave.io.hindcast.hindcast.request_wpto_point_data(data_type,parameter,lat_lon,years) " + "data, metadata = wave.io.hindcast.hindcast.request_wpto_point_data(\n", + " data_type, parameter, lat_lon, years\n", + ")" ] }, { @@ -801,34 +808,35 @@ "from numpy import histogramdd, array, arange, mean\n", "\n", "# Generate bins for Hm0, Te and Direction\n", - "Hm0_bins = arange(0, data.significant_wave_height_0.values.max() + 0.5, 0.5) \n", + "Hm0_bins = arange(0, data.significant_wave_height_0.values.max() + 0.5, 0.5)\n", "Te_bins = arange(0, data.peak_period_0.values.max() + 1, 1)\n", "Dir_bins = arange(0, data.mean_wave_direction_0.values.max() + 10, 10)\n", "\n", "# Combine data for better handling\n", - "jpd_3d = array([\n", - " data.significant_wave_height_0.values.flatten(),\n", - " data.peak_period_0.values.flatten(),\n", - " data.mean_wave_direction_0.values.flatten()\n", - " ]).T\n", + "jpd_3d = array(\n", + " [\n", + " data.significant_wave_height_0.values.flatten(),\n", + " data.peak_period_0.values.flatten(),\n", + " data.mean_wave_direction_0.values.flatten(),\n", + " ]\n", + ").T\n", "\n", "# Calculate the bin centers of the data\n", - "Hm0_center = array([\n", - " mean([Hm0_bins[i+1],Hm0_bins[i]]) \n", - " for i in range(Hm0_bins.shape[0]-1)\n", - " ])\n", - "Te_center = array([\n", - " mean([Te_bins[i+1],Te_bins[i]]) \n", - " for i in range(Te_bins.shape[0]-1)\n", - " ])\n", - "Dir_center = array([\n", - " mean([Dir_bins[i+1],Dir_bins[i]]) \n", - " for i in 
range(Dir_bins.shape[0]-1)\n", - " ])\n", + "Hm0_center = array(\n", + " [mean([Hm0_bins[i + 1], Hm0_bins[i]]) for i in range(Hm0_bins.shape[0] - 1)]\n", + ")\n", + "Te_center = array(\n", + " [mean([Te_bins[i + 1], Te_bins[i]]) for i in range(Te_bins.shape[0] - 1)]\n", + ")\n", + "Dir_center = array(\n", + " [mean([Dir_bins[i + 1], Dir_bins[i]]) for i in range(Dir_bins.shape[0] - 1)]\n", + ")\n", "\n", "\n", - "# Calculate the JPD for Hm0, Te, and Dir \n", - "probability, edges = histogramdd(jpd_3d,bins=[Hm0_bins,Te_bins,Dir_bins],density=True)" + "# Calculate the JPD for Hm0, Te, and Dir\n", + "probability, edges = histogramdd(\n", + " jpd_3d, bins=[Hm0_bins, Te_bins, Dir_bins], density=True\n", + ")" ] }, { @@ -1844,36 +1852,38 @@ "fig.subplots_adjust(right=0.8, bottom=0.25)\n", "\n", "d = 0\n", - "plot_jpd = probability[:,:,d]\n", + "plot_jpd = probability[:, :, d]\n", "\n", - "im = ax.imshow(plot_jpd, origin='lower', aspect='auto')\n", + "im = ax.imshow(plot_jpd, origin=\"lower\", aspect=\"auto\")\n", "\n", - "axcolor = 'lightgoldenrodyellow'\n", + "axcolor = \"lightgoldenrodyellow\"\n", "axDir = plt.axes([0.3, 0.075, 0.45, 0.03], facecolor=axcolor)\n", "\n", - "newD = Slider(axDir, 'Income Wave\\n Direction', 5, 355, valinit=d, valstep=10)\n", + "newD = Slider(axDir, \"Income Wave\\n Direction\", 5, 355, valinit=d, valstep=10)\n", + "\n", "\n", "def update(val):\n", - " d = int(newD.val/10)\n", - " im.set_data(probability[:,:,d])\n", + " d = int(newD.val / 10)\n", + " im.set_data(probability[:, :, d])\n", " fig.canvas.draw()\n", "\n", + "\n", "newD.on_changed(update)\n", "\n", "cax = fig.add_axes([0.82, 0.3, 0.03, 0.5])\n", - "cbar = fig.colorbar(im, cax=cax, orientation='vertical')\n", + "cbar = fig.colorbar(im, cax=cax, orientation=\"vertical\")\n", "\n", - "cbar.set_label('Probability Density (1/(sec*m*deg)', rotation=270, labelpad=15)\n", + "cbar.set_label(\"Probability Density (1/(sec*m*deg)\", rotation=270, labelpad=15)\n", "\n", - "ax.set_xlabel('Te 
(seconds)')\n", - "ax.set_ylabel('Hm0 (meters)')\n", + "ax.set_xlabel(\"Te (seconds)\")\n", + "ax.set_ylabel(\"Hm0 (meters)\")\n", "\n", "ax.set_xticks(arange(len(Te_center)))\n", "ax.set_yticks(arange(len(Hm0_center)))\n", - "ax.set_xticklabels(Te_center,rotation=45)\n", + "ax.set_xticklabels(Te_center, rotation=45)\n", "ax.set_yticklabels(Hm0_center)\n", "\n", - "fig.suptitle('Joint Probability Density\\n of Hm0 and Te per Direction')\n" + "fig.suptitle(\"Joint Probability Density\\n of Hm0 and Te per Direction\")" ] }, { @@ -1905,9 +1915,11 @@ } ], "source": [ - "year = '1993' # only one year can be passed at a time as a string\n", - "lat_lon=(43.489171,-125.152137)\n", - "dir_spectra,meta = wave.io.hindcast.hindcast.request_wpto_directional_spectrum(lat_lon,year)\n", + "year = \"1993\" # only one year can be passed at a time as a string\n", + "lat_lon = (43.489171, -125.152137)\n", + "dir_spectra, meta = wave.io.hindcast.hindcast.request_wpto_directional_spectrum(\n", + " lat_lon, year\n", + ")\n", "\n", "print(dir_spectra)" ] diff --git a/examples/adcp_example.ipynb b/examples/adcp_example.ipynb index 0c1c77d37..6c1cbdfff 100644 --- a/examples/adcp_example.ipynb +++ b/examples/adcp_example.ipynb @@ -1,4013 +1,4086 @@ { - "cells": [ - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "# Analyzing ADCP Data with MHKiT\n", - "\n", - "The following example illustrates a straightforward workflow for analyzing Acoustic Doppler Current Profiler (ADCP) data utilizing MHKiT. MHKiT has integrated the DOLfYN codebase as a module to facilitate ADCP and Acoustic Doppler Velocimetry (ADV) data processing.\n", - "\n", - "Here is a standard workflow for ADCP data analysis:\n", - "\n", - "1. **Import Data**\n", - "\n", - "2. **Review, QC, and Prepare the Raw Data**:\n", - " 1. Calculate or verify the correctness of depth bin locations\n", - " 2. Discard data recorded above the water surface or below the seafloor\n", - " 3. 
Assess the quality of velocity, beam amplitude, and/or beam correlation data\n", - " 4. Rotate Data Coordinate System\n", - "\n", - "3. **Data Averaging**: \n", - " - If not already executed within the instrument, average the data into time bins of a predetermined duration, typically between 5 and 10 minutes\n", - "\n", - "4. **Speed and Direction**\n", - "\n", - "5. **Plotting**\n", - "\n", - "6. **Saving and Loading DOLfYN datasets**\n", - "\n", - "7. **Turbulence Statistics**\n", - " 1. TI\n", - " 2. Power Spectral Densities\n", - " 3. TKE Dissipation Rate\n", - " 4. TKE Componenets\n", - " 5. ADCP Noise\n", - " 6. TKE Production\n", - " 7. TKE Balance \n", - "\n", - "\n", - "Begin your analysis by importing the requisite tools:" - ] - }, - { - "cell_type": "code", - "execution_count": 1, - "metadata": { - "scrolled": true - }, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "c:\\Users\\mcve343\\Anaconda3\\lib\\site-packages\\xarray\\backends\\cfgrib_.py:29: UserWarning: Failed to load cfgrib - most likely there is a problem accessing the ecCodes library. Try `import cfgrib` to get the full error message\n", - " warnings.warn(\n" - ] - } - ], - "source": [ - "from mhkit import dolfyn\n", - "from mhkit.dolfyn.adp import api" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "## 1. Importing Raw Instrument Data\n", - "\n", - "One of DOLfYN's key features is its ability to directly import raw data from an Acoustic Doppler Current Profiler (ADCP) right after it has been transferred. In this instance, we are using a Nortek Signature1000 ADCP, with the data stored in files with an '.ad2cp' extension. This specific dataset represents several hours of velocity data, captured at 1 Hz by an ADCP mounted on a bottom lander within a tidal inlet. 
The list of instruments compatible with DOLfYN can be found in the [MHKiT DOLfYN documentation](https://mhkit-software.github.io/MHKiT/mhkit-python/api.dolfyn.html).\n", - "\n", - "We'll start by importing the raw data file downloaded from the instrument. The `read` function processes the raw file and converts the information into an xarray Dataset. This Dataset includes several groups of variables:\n", - "\n", - "1. **Velocity**: Recorded in the coordinate system saved by the instrument (beam, XYZ, ENU)\n", - "2. **Beam Data**: Includes amplitude and correlation data\n", - "3. **Instrumental & Environmental Measurements**: Captures the instrument's bearing and environmental conditions\n", - "4. **Orientation Matrices**: Used by DOLfYN for rotating through different coordinate frames.\n" - ] - }, - { - "cell_type": "code", - "execution_count": 2, - "metadata": { - "scrolled": true - }, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Reading file data/dolfyn/Sig1000_tidal.ad2cp ...\n" - ] - } - ], - "source": [ - "ds = dolfyn.read('data/dolfyn/Sig1000_tidal.ad2cp')" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "There are two ways to see what's in a Dataset. The first is to simply type the dataset's name to see the standard xarray output. To access a particular variable in a dataset, use dict-style (`ds['vel']`) or attribute-style syntax (`ds.vel`). See the [xarray docs](http://xarray.pydata.org/en/stable/getting-started-guide/quick-overview.html) for more details on how to use the xarray format." - ] - }, - { - "cell_type": "code", - "execution_count": 3, - "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "
<xarray.Dataset>\n",
-              "Dimensions:              (time: 55000, dirIMU: 3, dir: 4, range: 28, beam: 4,\n",
-              "                          earth: 3, inst: 3, q: 4, time_b5: 55000,\n",
-              "                          range_b5: 28, x1: 4, x2: 4)\n",
-              "Coordinates:\n",
-              "  * time                 (time) datetime64[ns] 2020-08-15T00:20:00.500999927 ...\n",
-              "  * dirIMU               (dirIMU) <U1 'E' 'N' 'U'\n",
-              "  * dir                  (dir) <U2 'E' 'N' 'U1' 'U2'\n",
-              "  * range                (range) float64 0.6 1.1 1.6 2.1 ... 12.6 13.1 13.6 14.1\n",
-              "  * beam                 (beam) int32 1 2 3 4\n",
-              "  * earth                (earth) <U1 'E' 'N' 'U'\n",
-              "  * inst                 (inst) <U1 'X' 'Y' 'Z'\n",
-              "  * q                    (q) <U1 'w' 'x' 'y' 'z'\n",
-              "  * time_b5              (time_b5) datetime64[ns] 2020-08-15T00:20:00.4384999...\n",
-              "  * range_b5             (range_b5) float64 0.6 1.1 1.6 2.1 ... 13.1 13.6 14.1\n",
-              "  * x1                   (x1) int32 1 2 3 4\n",
-              "  * x2                   (x2) int32 1 2 3 4\n",
-              "Data variables: (12/38)\n",
-              "    c_sound              (time) float32 1.502e+03 1.502e+03 ... 1.498e+03\n",
-              "    temp                 (time) float32 14.55 14.55 14.55 ... 13.47 13.47 13.47\n",
-              "    pressure             (time) float32 9.713 9.718 9.718 ... 9.596 9.594 9.596\n",
-              "    mag                  (dirIMU, time) float32 72.5 72.7 72.6 ... -197.2 -195.7\n",
-              "    accel                (dirIMU, time) float32 -0.00479 -0.01437 ... 9.729\n",
-              "    batt                 (time) float32 16.6 16.6 16.6 16.6 ... 16.4 16.4 15.2\n",
-              "    ...                   ...\n",
-              "    telemetry_data       (time) uint8 0 0 0 0 0 0 0 0 0 0 ... 0 0 0 0 0 0 0 0 0\n",
-              "    boost_running        (time) uint8 0 0 0 0 0 0 0 0 1 0 ... 0 1 0 0 0 0 0 0 1\n",
-              "    heading              (time) float32 -12.52 -12.51 -12.51 ... -12.52 -12.5\n",
-              "    pitch                (time) float32 -0.065 -0.06 -0.06 ... -0.06 -0.05 -0.05\n",
-              "    roll                 (time) float32 -7.425 -7.42 -7.42 ... -6.45 -6.45 -6.45\n",
-              "    beam2inst_orientmat  (x1, x2) float32 1.183 0.0 -1.183 ... 0.5518 0.0 0.5518\n",
-              "Attributes: (12/34)\n",
-              "    filehead_config:       {"CLOCKSTR": {"TIME": "\\"2020-08-13 13:56:21\\""}, ...\n",
-              "    inst_model:            Signature1000\n",
-              "    inst_make:             Nortek\n",
-              "    inst_type:             ADCP\n",
-              "    burst_config:          {"press_valid": true, "temp_valid": true, "compass...\n",
-              "    n_cells:               28\n",
-              "    ...                    ...\n",
-              "    proc_idle_less_12pct:  0\n",
-              "    rotate_vars:           ['vel', 'accel', 'accel_b5', 'angrt', 'angrt_b5', ...\n",
-              "    coord_sys:             earth\n",
-              "    fs:                    1\n",
-              "    has_imu:               1\n",
-              "    beam_angle:            25
" - ], - "text/plain": [ - "\n", - "Dimensions: (time: 55000, dirIMU: 3, dir: 4, range: 28, beam: 4,\n", - " earth: 3, inst: 3, q: 4, time_b5: 55000,\n", - " range_b5: 28, x1: 4, x2: 4)\n", - "Coordinates:\n", - " * time (time) datetime64[ns] 2020-08-15T00:20:00.500999927 ...\n", - " * dirIMU (dirIMU) : Nortek Signature1000\n", - " . 15.28 hours (started: Aug 15, 2020 00:20)\n", - " . earth-frame\n", - " . (55000 pings @ 1Hz)\n", - " Variables:\n", - " - time ('time',)\n", - " - time_b5 ('time_b5',)\n", - " - vel ('dir', 'range', 'time')\n", - " - vel_b5 ('range_b5', 'time_b5')\n", - " - range ('range',)\n", - " - orientmat ('earth', 'inst', 'time')\n", - " - heading ('time',)\n", - " - pitch ('time',)\n", - " - roll ('time',)\n", - " - temp ('time',)\n", - " - pressure ('time',)\n", - " - amp ('beam', 'range', 'time')\n", - " - amp_b5 ('range_b5', 'time_b5')\n", - " - corr ('beam', 'range', 'time')\n", - " - corr_b5 ('range_b5', 'time_b5')\n", - " - accel ('dirIMU', 'time')\n", - " - angrt ('dirIMU', 'time')\n", - " - mag ('dirIMU', 'time')\n", - " ... and others (see `.variables`)" - ] - }, - "execution_count": 4, - "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "ds_dolfyn = ds.velds\n", - "ds_dolfyn" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "## 2. Initial Steps for Data Quality Control (QC)\n", - "\n", - "### 2.1: Set the Deployment Height\n", - "\n", - "When using Nortek instruments, the deployment software does not factor in the deployment height. The deployment height represents the position of the Acoustic Doppler Current Profiler (ADCP) within the water column. \n", - "\n", - "In this context, the center of the first depth bin is situated at a distance that is the sum of three elements: \n", - "1. Deployment height (the ADCP's position in the water column)\n", - "2. Blanking distance (the minimum distance from the ADCP to the first measurement point)\n", - "3. 
Cell size (the vertical distance of each measurement bin in the water column)\n", - "\n", - "To ensure accurate readings, it is critical to calibrate the 'range' coordinate to make '0' correspond to the seafloor. This calibration can be achieved using the `set_range_offset` function. This function is also useful when working with a down-facing instrument as it helps account for the depth below the water surface. \n", - "\n", - "For those using a Teledyne RDI ADCP, the TRDI deployment software will prompt you to specify the deployment height/depth during setup. If there's a need for calibration post-deployment, the `set_range_offset` function can be utilized in the same way as described above." - ] - }, - { - "cell_type": "code", - "execution_count": 5, - "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "" - ] - }, - "execution_count": 5, - "metadata": {}, - "output_type": "execute_result" - }, - { - "data": { - "image/png": "", - "text/plain": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], - "source": [ - "ds['vel'][1].plot()" - ] - }, - { - "cell_type": "code", - "execution_count": 6, - "metadata": {}, - "outputs": [], - "source": [ - "# The ADCP transducers were measured to be 0.6 m from the feet of the lander\n", - "api.clean.set_range_offset(ds, 0.6)" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "So, the center of bin 1 is located at 1.2 m:" - ] - }, - { - "cell_type": "code", - "execution_count": 7, - "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "
<xarray.DataArray 'range' (range: 28)>\n",
-              "array([ 1.2,  1.7,  2.2,  2.7,  3.2,  3.7,  4.2,  4.7,  5.2,  5.7,  6.2,  6.7,\n",
-              "        7.2,  7.7,  8.2,  8.7,  9.2,  9.7, 10.2, 10.7, 11.2, 11.7, 12.2, 12.7,\n",
-              "       13.2, 13.7, 14.2, 14.7])\n",
-              "Coordinates:\n",
-              "  * range    (range) float64 1.2 1.7 2.2 2.7 3.2 ... 12.7 13.2 13.7 14.2 14.7\n",
-              "Attributes:\n",
-              "    units:    m
" - ], - "text/plain": [ - "\n", - "array([ 1.2, 1.7, 2.2, 2.7, 3.2, 3.7, 4.2, 4.7, 5.2, 5.7, 6.2, 6.7,\n", - " 7.2, 7.7, 8.2, 8.7, 9.2, 9.7, 10.2, 10.7, 11.2, 11.7, 12.2, 12.7,\n", - " 13.2, 13.7, 14.2, 14.7])\n", - "Coordinates:\n", - " * range (range) float64 1.2 1.7 2.2 2.7 3.2 ... 12.7 13.2 13.7 14.2 14.7\n", - "Attributes:\n", - " units: m" - ] - }, - "execution_count": 7, - "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "ds.range" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "### 2.2. Discard Data Above Surface Level\n", - "\n", - "To reduce computational load, we can exclude all data at or above the water surface level. Since the instrument was oriented upwards, we can utilize the pressure sensor data along with the function `find_surface_from_P`. However, this approach necessitates that the pressure sensor was calibrated or 'zeroed' prior to deployment. If the instrument is facing downwards or doesn't include pressure data, the function `find_surface` can be used to detect the seabed or water surface.\n", - "\n", - "It's important to note that Acoustic Doppler Current Profilers (ADCPs) do not measure water salinity, so you'll need to supply this information to the function. The dataset returned by this function includes an additional variable, \"depth\". If `find_surface_from_P` is invoked after `set_range_offset`, \"depth\" represents the distance from the water surface to the seafloor. Otherwise, it indicates the distance to the ADCP pressure sensor.\n", - "\n", - "After determining the \"depth\", you can use the nan_beyond_surface function to discard data in depth bins at or above the actual water surface. Be aware that this function will generate a new dataset." 
- ] - }, - { - "cell_type": "code", - "execution_count": 8, - "metadata": {}, - "outputs": [], - "source": [ - "api.clean.find_surface_from_P(ds, salinity=31)\n", - "ds = api.clean.nan_beyond_surface(ds)" - ] - }, - { - "cell_type": "code", - "execution_count": 9, - "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "" - ] - }, - "execution_count": 9, - "metadata": {}, - "output_type": "execute_result" - }, - { - "data": { - "image/png": "", - "text/plain": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], - "source": [ - "ds['vel'][1].plot()" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "### 2.3: Apply an Acoustic Signal Correlation Filter\n", - "\n", - "After removing data from bins at or above the water surface, we typically apply a filter based on acoustic signal correlation to the ADCP data. This helps to eliminate erroneous velocity data points, which can be caused by factors such as bubbles, kelp, fish, etc., moving through one or multiple beams.\n", - "\n", - "You can quickly inspect the data to determine an appropriate correlation value by using the built-in plotting feature of xarray. In the following example, we use xarray's slicing capabilities to display data from beam 1 within a range of 0 to 10 m from the ADCP.\n", - "\n", - "It's important to note that not all ADCPs provide acoustic signal correlation data, which serves as a quantitative measure of signal quality. Older ADCPs may not offer this feature, in which case you can skip this step when using such instruments." - ] - }, - { - "cell_type": "code", - "execution_count": 10, - "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "" - ] - }, - "execution_count": 10, - "metadata": {}, - "output_type": "execute_result" - }, - { - "data": { - "image/png": "", - "text/plain": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], - "source": [ - "%matplotlib inline\n", - "ds['corr'].sel(beam=1, range=slice(0,10)).plot()" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "It's beneficial to also review data from the other beams. A significant portion of this data is of high quality. To avoid discarding valuable data with lower correlations, which could be due to natural variations, we can use the `correlation_filter`. This function assigns a value of NaN (not a number) to velocity values corresponding to correlations below 50%.\n", - "\n", - "However, it's important to note that the correlation threshold is dependent on the specifics of the deployment environment and the instrument used. It's not unusual to set a threshold as low as 30%, or even to forgo the use of this function entirely." - ] - }, - { - "cell_type": "code", - "execution_count": 11, - "metadata": {}, - "outputs": [], - "source": [ - "ds = api.clean.correlation_filter(ds, thresh=50)" - ] - }, - { - "cell_type": "code", - "execution_count": 12, - "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "" - ] - }, - "execution_count": 12, - "metadata": {}, - "output_type": "execute_result" - }, - { - "data": { - "image/png": "", - "text/plain": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], - "source": [ - "ds['vel'][1].plot()" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "### 2.4 Rotate Data Coordinate System\n", - "\n", - "After cleaning the data, the next step is to rotate the velocity data into accurate East, North, Up (ENU) coordinates.\n", - "\n", - "ADCPs utilize an internal compass or magnetometer to determine magnetic ENU directions. You can use the set_declination function to adjust the velocity data according to the magnetic declination specific to your geographical coordinates. This declination can be looked up online for specific coordinates.\n", - "\n", - "Instruments save vector data in the coordinate system defined in the deployment configuration file. To make this data meaningful, it must be transformed through various coordinate systems (\"beam\"<->\"inst\"<->\"earth\"<->\"principal\"). This transformation is accomplished using the `rotate2` function. If the \"earth\" (ENU) coordinate system is specified, DOLfYN will automatically rotate the dataset through the required coordinate systems to reach the \"earth\" coordinates. Setting `inplace` to true will modify the input dataset directly, meaning it will not create a new dataset.\n", - "\n", - "In this case, since the ADCP data is already in the \"earth\" coordinate system, the `rotate2` function will return the input dataset without modifications. The `set_declination` function will work no matter the coordinate system." 
- ] - }, - { - "cell_type": "code", - "execution_count": 13, - "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Data is already in the earth coordinate system\n" - ] - } - ], - "source": [ - "dolfyn.set_declination(ds, 15.8, inplace=True) # 15.8 deg East\n", - "dolfyn.rotate2(ds, 'earth', inplace=True)" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "To rotate into the principal frame of reference (streamwise, cross-stream, vertical), if desired, we must first calculate the depth-averaged principal flow heading and add it to the dataset attributes. Then the dataset can be rotated using the same `rotate2` function. We use `inplace=False` because we do not want to alter the input dataset here." - ] - }, - { - "cell_type": "code", - "execution_count": 14, - "metadata": {}, - "outputs": [], - "source": [ - "ds.attrs['principal_heading'] = dolfyn.calc_principal_heading(ds['vel'].mean('range'))\n", - "ds_streamwise = dolfyn.rotate2(ds, 'principal', inplace=False)" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "## 3. Average the Data\n", - "\n", - "As this deployment was configured in \"burst mode\", a standard step in the analysis process is to average the velocity data into time bins. \n", - "\n", - "However, if the instrument was set up in an \"averaging mode\" (where a specific profile and/or average interval was set, for instance, averaging 5 minutes of data every 30 minutes), this step would have been performed within the ADCP during deployment and can thus be skipped.\n", - "\n", - "To average the data into time bins (also known as ensembles), you should first initialize the binning tool `ADPBinner`. The parameter \"n_bin\" represents the number of data points in each ensemble. In this case, we're dealing with 300 seconds' worth of data. 
The \"fs\" parameter stands for the sampling frequency, which for this deployment is 1 Hz. Once the binning tool is initialized, you can use the `bin_average` function to average the data into ensembles." - ] - }, - { - "cell_type": "code", - "execution_count": 15, - "metadata": { - "scrolled": true - }, - "outputs": [], - "source": [ - "avg_tool = api.ADPBinner(n_bin=ds.fs*300, fs=ds.fs)\n", - "ds_avg = avg_tool.bin_average(ds)" - ] - }, - { - "cell_type": "code", - "execution_count": 16, - "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "
<xarray.Dataset>\n",
-              "Dimensions:         (time: 183, dirIMU: 3, range: 28, dir: 4, beam: 4,\n",
-              "                     earth: 3, inst: 3, q: 4, time_b5: 183, range_b5: 28)\n",
-              "Coordinates:\n",
-              "  * time            (time) datetime64[ns] 2020-08-15T00:22:30.001030683 ... 2...\n",
-              "  * dirIMU          (dirIMU) <U1 'E' 'N' 'U'\n",
-              "  * range           (range) float64 1.2 1.7 2.2 2.7 3.2 ... 13.2 13.7 14.2 14.7\n",
-              "  * dir             (dir) <U2 'E' 'N' 'U1' 'U2'\n",
-              "  * beam            (beam) int32 1 2 3 4\n",
-              "  * earth           (earth) <U1 'E' 'N' 'U'\n",
-              "  * inst            (inst) <U1 'X' 'Y' 'Z'\n",
-              "  * q               (q) <U1 'w' 'x' 'y' 'z'\n",
-              "  * time_b5         (time_b5) datetime64[ns] 2020-08-15T00:22:29.938495159 .....\n",
-              "  * range_b5        (range_b5) float64 1.2 1.7 2.2 2.7 ... 13.2 13.7 14.2 14.7\n",
-              "Data variables: (12/38)\n",
-              "    c_sound         (time) float32 1.502e+03 1.502e+03 ... 1.499e+03 1.498e+03\n",
-              "    U_std           (range, time) float32 0.04232 0.04293 0.04402 ... nan nan\n",
-              "    temp            (time) float32 14.49 14.59 14.54 14.45 ... 13.62 13.56 13.5\n",
-              "    pressure        (time) float32 9.712 9.699 9.685 9.67 ... 9.58 9.584 9.591\n",
-              "    mag             (dirIMU, time) float32 72.37 72.4 72.38 ... -197.1 -197.1\n",
-              "    accel           (dirIMU, time) float32 -0.3584 -0.361 ... 9.714 9.712\n",
-              "    ...              ...\n",
-              "    boost_running   (time) float32 0.1267 0.1333 0.13 ... 0.2267 0.22 0.22\n",
-              "    heading         (time) float32 3.287 3.261 3.337 3.289 ... 3.331 3.352 3.352\n",
-              "    pitch           (time) float32 -0.05523 -0.07217 ... -0.04288 -0.0429\n",
-              "    roll            (time) float32 -7.414 -7.424 -7.404 ... -6.446 -6.433 -6.436\n",
-              "    water_density   (time) float32 1.023e+03 1.023e+03 ... 1.023e+03 1.023e+03\n",
-              "    depth           (time) float32 10.28 10.26 10.25 10.23 ... 10.14 10.15 10.15\n",
-              "Attributes: (12/41)\n",
-              "    fs:                        1\n",
-              "    n_bin:                     300\n",
-              "    n_fft:                     300\n",
-              "    description:               Binned averages calculated from ensembles of s...\n",
-              "    filehead_config:           {"CLOCKSTR": {"TIME": "\\"2020-08-13 13:56:21\\"...\n",
-              "    inst_model:                Signature1000\n",
-              "    ...                        ...\n",
-              "    has_imu:                   1\n",
-              "    beam_angle:                25\n",
-              "    h_deploy:                  0.6\n",
-              "    declination:               15.8\n",
-              "    declination_in_orientmat:  1\n",
-              "    principal_heading:         11.1898
" - ], - "text/plain": [ - "\n", - "Dimensions: (time: 183, dirIMU: 3, range: 28, dir: 4, beam: 4,\n", - " earth: 3, inst: 3, q: 4, time_b5: 183, range_b5: 28)\n", - "Coordinates:\n", - " * time (time) datetime64[ns] 2020-08-15T00:22:30.001030683 ... 2...\n", - " * dirIMU (dirIMU) " - ] - }, - "execution_count": 18, - "metadata": {}, - "output_type": "execute_result" - }, - { - "data": { - "image/png": "", - "text/plain": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], - "source": [ - "%matplotlib inline \n", - "from matplotlib import pyplot as plt\n", - "import matplotlib.dates as dt\n", - "\n", - "ax = plt.figure(figsize=(10,6)).add_axes([.14, .14, .8, .74])\n", - "# Plot flow speed\n", - "t = dolfyn.time.dt642date(ds_avg['time'])\n", - "plt.pcolormesh(t, ds_avg['range'], ds_avg['U_mag'], cmap='Blues', shading='nearest')\n", - "# Plot the water surface\n", - "ax.plot(t, ds_avg['depth'])\n", - "\n", - "# Set up time on x-axis\n", - "ax.set_xlabel('Time')\n", - "ax.xaxis.set_major_formatter(dt.DateFormatter('%H:%M'))\n", - "\n", - "ax.set_ylabel('Altitude [m]')\n", - "ax.set_ylim([0, 12])\n", - "plt.colorbar(label='Speed [m/s]')" - ] - }, - { - "cell_type": "code", - "execution_count": 19, - "metadata": { - "scrolled": false - }, - "outputs": [ - { - "data": { - "image/png": "", - "text/plain": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], - "source": [ - "ax = plt.figure(figsize=(10,6)).add_axes([.14, .14, .8, .74])\n", - "# Plot flow direction\n", - "plt.pcolormesh(t, ds_avg['range'], ds_avg['U_dir'], cmap='twilight', shading='nearest')\n", - "# Plot the water surface\n", - "ax.plot(t, ds_avg['depth'])\n", - "\n", - "# set up time on x-axis\n", - "ax.set_xlabel('Time')\n", - "ax.xaxis.set_major_formatter(dt.DateFormatter('%H:%M'))\n", - "\n", - "ax.set_ylabel('Altitude [m]')\n", - "ax.set_ylim([0, 12]);\n", - "plt.colorbar(label='Horizontal Vel Dir [deg CW from true N]');" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "## Saving and Loading DOLfYN datasets\n", - "Datasets can be saved and reloaded using the `save` and `load` functions. Xarray is saved natively in netCDF format, hence the \".nc\" extension.\n", - "\n", - "Note: DOLfYN datasets cannot be saved using xarray's native `ds.to_netcdf`; however, DOLfYN datasets can be opened using `xarray.open_dataset`." - ] - }, - { - "cell_type": "code", - "execution_count": 20, - "metadata": {}, - "outputs": [], - "source": [ - "# Uncomment these lines to save and load to your current working directory\n", - "#dolfyn.save(ds, 'your_data.nc')\n", - "#ds_saved = dolfyn.load('your_data.nc')" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "## 7. Turbulence Statistics\n", - "\n", - "The next section of this jupyter notebook will run through the turbulence analysis of the data presented here. There was no intention of measuring turbulence in the deployment that collected this data, so results depicted here are not the highest quality. 
The quality of turbulence measurements from an ADCP depend heavily on the quality of the deployment setup and data collection, particularly instrument frequency, samping frequency and depth bin size.\n", - "\n", - "Read more on proper ADCP setup for turbulence measurements in: Thomson, Jim, et al. \"Measurements of turbulence at two tidal energy sites in Puget Sound, WA.\" IEEE Journal of Oceanic Engineering 37.3 (2012): 363-374.\n", - "\n", - "Most functions related to turbulence statistics in MHKiT-DOLfYN have the papers they originate from referenced in their docstrings.\n", - "\n", - "### 7.1 Turbulence Intensity\n", - "For most users, turbulence intensity (TI), the ratio of the ensemble standard deviation to ensemble flow speed given as a percent, is all most will need. In MHKiT, this is simply calculated as `.velds.I`\n", - "\n" - ] - }, - { - "cell_type": "code", - "execution_count": 21, - "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "" - ] - }, - "execution_count": 21, - "metadata": {}, - "output_type": "execute_result" - }, - { - "data": { - "image/png": "", - "text/plain": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], - "source": [ - "# Turbulence Intensity\n", - "ds_avg['TI'] = ds_avg.velds.I\n", - "ds_avg['TI'].plot(cmap='Reds', ylim=(0,11))" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "### 7.2 Power Spectral Densities (Auto-Spectra)\n", - "\n", - "Other turbulence parameters include the TKE power- and cross-spectral densities (i.e the power spectra), turbulent kinetic energy (TKE, i.e. the variances of velocity vector components), Reynolds stress vector (i.e. the co-variances of velocity vector components), TKE dissipation rate, and TKE production rate. These quantities are primarily used to inform and verify hydrodynamic and coastal models, which take some or all of these quantities as input.\n", - "\n", - "The TKE production rate is the rate at which kinetic energy (KE) transitions from a useful state (able to do \"work\" in the physics sense) to turbulent; TKE is the actual amount of turbulent KE in the water; and TKE dissipation rate is the rate at which turbulent KE is lost to non-motion forms of energy (heat, sound, etc) due to viscosity. The power spectra are used to depict and quantify this energy in the frequency domain, and creating them are the first step in turbulence analysis.\n", - "\n", - "We'll start by looking at the power spectra, specifically the auto-spectra from the vertical beam (\"auto\" meaning the variance of a single vector direction, e.g. $\\overline{u'^2}$, vs \"cross\", meaning the covariance of two directions, e.g. $\\overline{u'w'}$). This can be done using the `power_spectral_density` function from the `ADPBinner` we created (\"avg_tool\"). We'll create spectra at the middle water column, at a depth of 5 m, and use a number of FFT's equal to 1/3 the bin size." 
- ] - }, - { - "cell_type": "code", - "execution_count": 22, - "metadata": {}, - "outputs": [], - "source": [ - "rng = 5 # m\n", - "vel_up = ds['vel_b5'].sel(range_b5=rng, method='nearest') # vertical velocity\n", - "U = ds_avg['U_mag'].sel(range=5, method='nearest') # flow speed, for plotting in the next block\n", - "\n", - "ds_avg['auto_spectra_5m'] = avg_tool.power_spectral_density(vel_up, freq_units='Hz', n_fft=ds_avg.n_bin//3)" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "In the auto-spectra, we're primarly looking for three components: the energy-producing region, the isotropic turbulence region (so-called \"red noise\"), and the instrument noise floor (termed \"white noise\"). \n", - "\n", - "The block below organizes and plots the power spectra by the corresponding ensemble speed, averaging them by 0.1 m/s velocity bins. Note that if an ensemble is missing data that wasn't filled in, a power spectrum will not be calculated for that ensemble timestamp." - ] - }, - { - "cell_type": "code", - "execution_count": 23, - "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "[Text(0.5, 0, 'Frequency [Hz]'),\n", - " Text(0, 0.5, 'PSD [m2 s-2 Hz-1]'),\n", - " (0.01, 1),\n", - " (0.0005, 0.1)]" - ] - }, - "execution_count": 23, - "metadata": {}, - "output_type": "execute_result" - }, - { - "data": { - "image/png": "", - "text/plain": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], - "source": [ - "import numpy as np\n", - "import matplotlib.pyplot as plt\n", - "import matplotlib as mpl\n", - "plt.rcParams.update({'font.size': 18, \"font.family\": \"Times New Roman\"})\n", - "\n", - "\n", - "def plot_spectra_by_color(auto_spectra, U_mag, ax, fig, cbar_max=4.0):\n", - " U = U_mag.values\n", - " U_max = U_mag.max().values\n", - "\n", - " # Average spectra into 0.1 m/s velocity bins\n", - " speed_bins = np.arange(0.5, U_max, 0.1)\n", - " time = [t for t in auto_spectra.dims if 'time' in t][0]\n", - " S_group = auto_spectra.assign_coords({time: U}).rename({time: \"speed\"})\n", - " group = S_group.groupby_bins(\"speed\", speed_bins)\n", - " count = group.count().values\n", - " S = group.mean()\n", - "\n", - " # define the colormap\n", - " cmap = plt.cm.turbo\n", - " # define the bins and normalize\n", - " bounds = np.arange(0.5, cbar_max, 0.1)\n", - " norm = mpl.colors.BoundaryNorm(bounds, cmap.N)\n", - " colors = cmap(norm(speed_bins))\n", - "\n", - " # plot\n", - " for i in range(len(speed_bins)-1):\n", - " ax.loglog(auto_spectra[\"freq\"], S[i], c=colors[i])\n", - " ax.grid()\n", - "\n", - " # create a second axes for the colorbar\n", - " cax = fig.add_axes([0.8, 0.07, 0.03, 0.88])\n", - " #cax, _ = mpl.colorbar.make_axes(fig.gca())\n", - " sm = mpl.colorbar.ColorbarBase(cax, cmap=cmap, norm=norm,\n", - " spacing='proportional', ticks=bounds, boundaries=bounds, \n", - " format='%1.1f', label='Velocity [m/s]')\n", - " \n", - " # Add -5/3 slope line\n", - " m = -5/3\n", - " x = np.logspace(-1, 0.5)\n", - " y = 10**(-3)*x**m\n", - " ax.loglog(x, y, '--', c='black', label='$f^{-5/3}$')\n", - " ax.legend()\n", - "\n", - " return ax, sm\n", - "\n", - "\n", - "# Set up figure\n", - "fig, ax = plt.subplots(1, 1, figsize=(5,5))\n", - "fig.subplots_adjust(left=0.2, right=0.75, top=0.95, bottom=0.1)\n", - "\n", - "# Plot spectra by color\n", - 
"plot_spectra_by_color(ds_avg['auto_spectra_5m'], U, ax, fig, cbar_max=2.0)\n", - "# Set axes\n", - "ax.set(xlabel=\"Frequency [Hz]\", ylabel=\"PSD [m2 s-2 Hz-1]\", xlim=(0.01, 1), ylim=(0.0005, 0.1))\n" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "In the figure above, we can see the energy-producing turbulent structures below a frequency of 0.2 Hz (one tick to the right of \"10^-1\"). The isotropic turbulence cascade, seen by the dashed f^(-5/3) slope (from Kolmogorov's theory of turbulence) begins at around 0.2 Hz and continues until we reach the Nyquist frequency at 0.5 Hz (1/2 the instrument's sampling frequency, 1 Hz). The instrument's noise floor can't be seen here, but will show up as the flattened part of the spectra at the highest frequencies. For this instrument (Nortek Signature1000), the noise floor typically varies around 10^-3, depending on flow speed and range distance.\n", - "\n", - "### 7.3 TKE Dissipation Rate\n", - "\n", - "Because we can see the isotropic turbulence cascade (0.2 - 0.5 Hz) at this depth bin (5 m altitude), we can calculate the TKE dissipation rate at this location from the spectra itself. This can be done using `dissipation_rate_LT83`, whose inputs are the power spectra, the ensemble speed, and the frequency range of the isotropic cascade." - ] - }, - { - "cell_type": "code", - "execution_count": 24, - "metadata": {}, - "outputs": [], - "source": [ - "# Frequency range of isotropic turubulence cascade\n", - "f_rng = [0.2, 0.5]\n", - "# Dissipation rate\n", - "ds_avg['dissipation_rate_5m'] = avg_tool.dissipation_rate_LT83(ds_avg['auto_spectra_5m'], U, freq_range=f_rng)" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "We have just found the spectra and dissipation rate from a single depth bin at an altitude of 5 m from the seafloor, but typically we want the spectra and dissipation rates from the entire measurement profile. 
If we want to look at the spectra and dissipation rates from all depth bins, we can set up a \"for\" loop on the range coordinate and merge them together:" - ] - }, - { - "cell_type": "code", - "execution_count": 25, - "metadata": {}, - "outputs": [], - "source": [ - "import xarray as xr\n", - "\n", - "spec = [None]*len(ds.range)\n", - "e = [None]*len(ds.range)\n", - "\n", - "for r in range(len(ds['range'])):\n", - " # Calc spectra from each depth bin using the 5th beam\n", - " spec[r] = avg_tool.power_spectral_density(ds['vel_b5'].isel(range_b5=r), freq_units='Hz')\n", - " # Calc dissipation rate from each spectra\n", - " e[r] = avg_tool.dissipation_rate_LT83(spec[r], ds_avg.velds.U_mag.isel(range=r), freq_range=f_rng) # Hz\n", - "\n", - "ds_avg['auto_spectra'] = xr.concat(spec, dim='range')\n", - "ds_avg['dissipation_rate'] = xr.concat(e, dim='range')\n", - "\n", - "del spec, e # save memory" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "Now that we have a profile timeseries of dissipation rate, we need apply some quality control (QC). Since we can't look at each individual spectrum to ensure we can see the isotropic turbulence cascade, we want to QC the output from `dissipation_rate_LT83` to make sure what was calculated actually falls on a f^(-5/3) slope. We can do this using the function `check_turbulence_cascade_slope`, which uses linear regression on the log-transformed LT83 equation (ref. to Lumley and Terray, 1983, see docstring) to calculate the spectral slope for the given frequency range. \n", - "\n", - "In our case, we're calculating the slope of each spectrum between 0.2 and 0.5 Hz. We'll use a cutoff of 20% for the error, but this can be lowered if there still appear to be erroneous estimations from visual inspection of the spectra." 
- ] - }, - { - "cell_type": "code", - "execution_count": 26, - "metadata": {}, - "outputs": [], - "source": [ - "# Quality control dissipation rate estimation\n", - "slope = avg_tool.check_turbulence_cascade_slope(ds_avg['auto_spectra'], freq_range=f_rng)\n", - "\n", - "# Check that percent difference from -5/3 is not greater than 20%\n", - "mask = abs((slope[0].values - (-5/3)) / (-5.3)) <= 0.20\n", - "\n", - "# Keep good data\n", - "ds_avg['dissipation_rate'] = ds_avg['dissipation_rate'].where(mask)" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "If we plot the dissipation rate below in a colormap, we can see that the profile map has a lot of missing data. One of the reasons is that the 1 Hz sampling rate doesn't provide enough information needed to make dissipation rate estimations, and the other part is that turbulence measurements push the boundaries of what ADCPs are capable of.\n", - "\n", - "Also, 5x10^-4 $m^2/s^3$ sounds reasonable for a dissipation rate estimate for the 1.25 m/s current speeds measured here. They can be a magnitude or two greater for faster flow speeds and depend heavily on bathymetry and regional hydrodynamics." - ] - }, - { - "cell_type": "code", - "execution_count": 27, - "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "" - ] - }, - "execution_count": 27, - "metadata": {}, - "output_type": "execute_result" - }, - { - "data": { - "image/png": "", - "text/plain": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], - "source": [ - "ds_avg['dissipation_rate'].plot(cmap='turbo', ylim=(0,11))" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "### 7.4 Turbulent Kinetic Energy (TKE) Components\n", - "\n", - "The next parameters we'll find here are the vertical TKE component and the total TKE magnitude. Since we're using the vertical beam on the ADCP, we'll directly measure the vertical TKE component from the along-beam velocity using the `turbulent_kinetic_energy` function. This function is capable of calculating TKE for any along-beam velocity.\n", - "\n", - "We can also use the so-called \"beam-variance\" equations to estimate the Reynolds stress tensor components (i.e. $\\overline{u'^2}$, $\\overline{v'^2}$, $\\overline{w'^2}$, $\\overline{u'v'}$, $\\overline{u'w'^2}$, $\\overline{v'w'^2}$), which define the stresses acting on an element of water. These equations are built into the functions `stress_tensor_5beam` and `stress_tensor4beam`. Since we're using a 5-beam ADCP, we can calculate the total TKE as well using `total_turbulent_kinetic_energy`, which is a wrapper around the 5-beam variance function.\n", - "\n", - "#### Quick ADCP lesson before we dive in:\n", - "\n", - "There are a couple caveats to calculating Reynolds stress tensor components:\n", - " 1. Because this instrument only has 5 beams, we can only find 5 of the 6 components (6 unkowns, 5 knowns)\n", - " 2. Because the ADCP's instrument (XYZ) axes weren't aligned with the flow during deployment, we don't know what direction these components are aligned to (i.e. the 'u' direction is not necessarily the streamwise direction)\n", - " 3. 
It is possible to rotate the tensor, but we'd need to know all 6 components to do so properly.\n", - "\n", - "That being said, even if we don't know which direction the 3 TKE components ($\\overline{u'^2}$, $\\overline{v'^2}$, $\\overline{w'^2}$) are oriented, we can still combine them and get the total TKE magnitude." - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "#### 7.5 ADCP Noise\n", - "\n", - "The first thing we want to do is calculate the Doppler noise floor from the spectrum we calculated above. (We are making the assumption that the noise floor of the vertical beam is the same as the noise floor of the other 4 beams). This gives us a timeseries of the noise floor, which varies by instrument and with flow speed, at that depth bin.\n", - "\n", - "We can do this using the `doppler_noise_level` function. The two inputs for this function are the power spectra and \"pct_fN\", the percent of the Nyquist frequency that the noise floor exists. Because in this particularly dataset we can't see the noise floor, we'll just use 90% or pct_fN=0.9 as an example. 
If the noise floor began at 0.4 Hz and ran til our maximum frequency of 0.5 Hz, we'd use pct_fN = 0.4 Hz / 0.5 Hz = 0.8.\n", - "\n", - "Because ADCP noise is a function of range as well as flow speed and instrument frequency, we'll use a for loop to measure the noise from each spectra:" - ] - }, - { - "cell_type": "code", - "execution_count": 28, - "metadata": {}, - "outputs": [], - "source": [ - "# Setting up \"for\" loop\n", - "n = [None]*len(ds.range)\n", - "\n", - "for r in range(len(ds.range)):\n", - " # Calculate doppler noise from spectra from each depth bin\n", - " n[r] = avg_tool.doppler_noise_level(ds_avg['auto_spectra'][r], pct_fN=0.9)\n", - "\n", - "ds_avg['noise'] = xr.concat(n, dim='range')\n", - "\n", - "del n # save memory" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "Now that we know the Doppler noise level, we can use that as input for the TKE functions. We'll first calculate the vertical TKE component, using the function `turbulent_kinetic_energy`, inputting our raw vertical beam data and the noise floors we calculated above for each ensemble." - ] - }, - { - "cell_type": "code", - "execution_count": 29, - "metadata": {}, - "outputs": [], - "source": [ - "# Vertical TKE component (w'w' bar)\n", - "ds_avg['wpwp_bar'] = avg_tool.turbulent_kinetic_energy(ds['vel_b5'], noise=ds_avg['noise'])" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "Next we can calculate the TKE magnitude using the function `total_turbulent_kinetic_energy`. This method is a wrapper around the `stress_tensor_5beam` function, which calculates the individual Reynolds stress tensor components and takes the same inputs. As an fyi, this function will drop at least one warning every time it's run, primarily the coordinate system warning. This function also requires the input raw data to be in beam coordinates, so we'll create a copy of the raw data and rotate it to 'beam'. 
If you do not, this function will do so automatically and rotate the original." - ] - }, - { - "cell_type": "code", - "execution_count": 30, - "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "c:\\users\\mcve343\\mhkit-python\\mhkit\\dolfyn\\adp\\turbulence.py:383: UserWarning: The beam-variance algorithms assume the instrument's (XYZ) coordinate system is aligned with the principal flow directions.\n", - " warnings.warn(\" The beam-variance algorithms assume the instrument's \"\n" - ] - } + "cells": [ + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Analyzing ADCP Data with MHKiT\n", + "\n", + "The following example illustrates a straightforward workflow for analyzing Acoustic Doppler Current Profiler (ADCP) data utilizing MHKiT. MHKiT has integrated the DOLfYN codebase as a module to facilitate ADCP and Acoustic Doppler Velocimetry (ADV) data processing.\n", + "\n", + "Here is a standard workflow for ADCP data analysis:\n", + "\n", + "1. **Import Data**\n", + "\n", + "2. **Review, QC, and Prepare the Raw Data**:\n", + " 1. Calculate or verify the correctness of depth bin locations\n", + " 2. Discard data recorded above the water surface or below the seafloor\n", + " 3. Assess the quality of velocity, beam amplitude, and/or beam correlation data\n", + " 4. Rotate Data Coordinate System\n", + "\n", + "3. **Data Averaging**: \n", + " - If not already executed within the instrument, average the data into time bins of a predetermined duration, typically between 5 and 10 minutes\n", + "\n", + "4. **Speed and Direction**\n", + "\n", + "5. **Plotting**\n", + "\n", + "6. **Saving and Loading DOLfYN datasets**\n", + "\n", + "7. **Turbulence Statistics**\n", + " 1. Turbulence Intensity (TI)\n", + " 2. Power Spectral Densities\n", + " 3. Instrument Noise\n", + " 4. TKE Dissipation Rate\n", + " 5. Noise-corrected TI\n", + " 6. TKE Components\n", + " 7. TKE Production\n", + " 8.
TKE Balance \n", + "\n", + "\n", + "Begin your analysis by importing the requisite tools:" + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "metadata": { + "scrolled": true + }, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "c:\\Users\\mcve343\\anaconda3\\envs\\tsdat-pipelines\\lib\\site-packages\\xarray\\backends\\cfgrib_.py:29: UserWarning: Failed to load cfgrib - most likely there is a problem accessing the ecCodes library. Try `import cfgrib` to get the full error message\n", + " warnings.warn(\n" + ] + } + ], + "source": [ + "from mhkit import dolfyn\n", + "from mhkit.dolfyn.adp import api" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## 1. Importing Raw Instrument Data\n", + "\n", + "One of DOLfYN's key features is its ability to directly import raw data from an Acoustic Doppler Current Profiler (ADCP) right after it has been transferred. In this instance, we are using a Nortek Signature1000 ADCP, with the data stored in files with an '.ad2cp' extension. This specific dataset represents several hours of velocity data, captured at 1 Hz by an ADCP mounted on a bottom lander within a tidal inlet. The list of instruments compatible with DOLfYN can be found in the [MHKiT DOLfYN documentation](https://mhkit-software.github.io/MHKiT/mhkit-python/api.dolfyn.html).\n", + "\n", + "We'll start by importing the raw data file downloaded from the instrument. The `read` function processes the raw file and converts the information into an xarray Dataset. This Dataset includes several groups of variables:\n", + "\n", + "1. **Velocity**: Recorded in the coordinate system saved by the instrument (beam, XYZ, ENU)\n", + "2. **Beam Data**: Includes amplitude and correlation data\n", + "3. **Instrumental & Environmental Measurements**: Captures the instrument's bearing and environmental conditions\n", + "4. 
**Orientation Matrices**: Used by DOLfYN for rotating through different coordinate frames.\n" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": { + "scrolled": true + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Reading file data/dolfyn/Sig1000_tidal.ad2cp ...\n" + ] + } + ], + "source": [ + "ds = dolfyn.read(\"data/dolfyn/Sig1000_tidal.ad2cp\")" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "There are two ways to see what's in a Dataset. The first is to simply type the dataset's name to see the standard xarray output. To access a particular variable in a dataset, use dict-style (`ds['vel']`) or attribute-style syntax (`ds.vel`). See the [xarray docs](http://xarray.pydata.org/en/stable/getting-started-guide/quick-overview.html) for more details on how to use the xarray format." + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "
<xarray.Dataset>\n",
+       "Dimensions:              (time: 55000, dirIMU: 3, dir: 4, range: 28, beam: 4,\n",
+       "                          earth: 3, inst: 3, q: 4, time_b5: 55000,\n",
+       "                          range_b5: 28, x1: 4, x2: 4)\n",
+       "Coordinates:\n",
+       "  * time                 (time) datetime64[ns] 2020-08-15T00:20:00.500999927 ...\n",
+       "  * dirIMU               (dirIMU) <U1 'E' 'N' 'U'\n",
+       "  * dir                  (dir) <U2 'E' 'N' 'U1' 'U2'\n",
+       "  * range                (range) float64 0.6 1.1 1.6 2.1 ... 12.6 13.1 13.6 14.1\n",
+       "  * beam                 (beam) int32 1 2 3 4\n",
+       "  * earth                (earth) <U1 'E' 'N' 'U'\n",
+       "  * inst                 (inst) <U1 'X' 'Y' 'Z'\n",
+       "  * q                    (q) <U1 'w' 'x' 'y' 'z'\n",
+       "  * time_b5              (time_b5) datetime64[ns] 2020-08-15T00:20:00.4384999...\n",
+       "  * range_b5             (range_b5) float64 0.6 1.1 1.6 2.1 ... 13.1 13.6 14.1\n",
+       "  * x1                   (x1) int32 1 2 3 4\n",
+       "  * x2                   (x2) int32 1 2 3 4\n",
+       "Data variables: (12/38)\n",
+       "    c_sound              (time) float32 1.502e+03 1.502e+03 ... 1.498e+03\n",
+       "    temp                 (time) float32 14.55 14.55 14.55 ... 13.47 13.47 13.47\n",
+       "    pressure             (time) float32 9.713 9.718 9.718 ... 9.596 9.594 9.596\n",
+       "    mag                  (dirIMU, time) float32 72.5 72.7 72.6 ... -197.2 -195.7\n",
+       "    accel                (dirIMU, time) float32 -0.00479 -0.01437 ... 9.729\n",
+       "    batt                 (time) float32 16.6 16.6 16.6 16.6 ... 16.4 16.4 15.2\n",
+       "    ...                   ...\n",
+       "    telemetry_data       (time) uint8 0 0 0 0 0 0 0 0 0 0 ... 0 0 0 0 0 0 0 0 0\n",
+       "    boost_running        (time) uint8 0 0 0 0 0 0 0 0 1 0 ... 0 1 0 0 0 0 0 0 1\n",
+       "    heading              (time) float32 -12.52 -12.51 -12.51 ... -12.52 -12.5\n",
+       "    pitch                (time) float32 -0.065 -0.06 -0.06 ... -0.06 -0.05 -0.05\n",
+       "    roll                 (time) float32 -7.425 -7.42 -7.42 ... -6.45 -6.45 -6.45\n",
+       "    beam2inst_orientmat  (x1, x2) float32 1.183 0.0 -1.183 ... 0.5518 0.0 0.5518\n",
+       "Attributes: (12/34)\n",
+       "    filehead_config:       {"CLOCKSTR": {"TIME": "\\"2020-08-13 13:56:21\\""}, ...\n",
+       "    inst_model:            Signature1000\n",
+       "    inst_make:             Nortek\n",
+       "    inst_type:             ADCP\n",
+       "    burst_config:          {"press_valid": true, "temp_valid": true, "compass...\n",
+       "    n_cells:               28\n",
+       "    ...                    ...\n",
+       "    proc_idle_less_12pct:  0\n",
+       "    rotate_vars:           ['vel', 'accel', 'accel_b5', 'angrt', 'angrt_b5', ...\n",
+       "    coord_sys:             earth\n",
+       "    fs:                    1\n",
+       "    has_imu:               1\n",
+       "    beam_angle:            25
" ], - "source": [ - "ds_beam = dolfyn.rotate2(ds, 'beam', inplace=False)\n", - "ds_avg['TKE'] = avg_tool.total_turbulent_kinetic_energy(ds_beam, noise=ds_avg['noise'], orientation='up', beam_angle=25)" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "And plotting TKE:" - ] - }, - { - "cell_type": "code", - "execution_count": 31, - "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "" - ] - }, - "execution_count": 31, - "metadata": {}, - "output_type": "execute_result" - }, - { - "data": { - "image/png": "", - "text/plain": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } + "text/plain": [ + "\n", + "Dimensions: (time: 55000, dirIMU: 3, dir: 4, range: 28, beam: 4,\n", + " earth: 3, inst: 3, q: 4, time_b5: 55000,\n", + " range_b5: 28, x1: 4, x2: 4)\n", + "Coordinates:\n", + " * time (time) datetime64[ns] 2020-08-15T00:20:00.500999927 ...\n", + " * dirIMU (dirIMU) : Nortek Signature1000\n", + " . 15.28 hours (started: Aug 15, 2020 00:20)\n", + " . earth-frame\n", + " . (55000 pings @ 1Hz)\n", + " Variables:\n", + " - time ('time',)\n", + " - time_b5 ('time_b5',)\n", + " - vel ('dir', 'range', 'time')\n", + " - vel_b5 ('range_b5', 'time_b5')\n", + " - range ('range',)\n", + " - orientmat ('earth', 'inst', 'time')\n", + " - heading ('time',)\n", + " - pitch ('time',)\n", + " - roll ('time',)\n", + " - temp ('time',)\n", + " - pressure ('time',)\n", + " - amp ('beam', 'range', 'time')\n", + " - amp_b5 ('range_b5', 'time_b5')\n", + " - corr ('beam', 'range', 'time')\n", + " - corr_b5 ('range_b5', 'time_b5')\n", + " - accel ('dirIMU', 'time')\n", + " - angrt ('dirIMU', 'time')\n", + " - mag ('dirIMU', 'time')\n", + " ... and others (see `.variables`)" + ] + }, + "execution_count": 4, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "ds_dolfyn = ds.velds\n", + "ds_dolfyn" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## 2. Initial Steps for Data Quality Control (QC)\n", + "\n", + "### 2.1: Set the Deployment Height\n", + "\n", + "When using Nortek instruments, the deployment software does not factor in the deployment height. The deployment height represents the position of the Acoustic Doppler Current Profiler (ADCP) within the water column. \n", + "\n", + "In this context, the center of the first depth bin is situated at a distance that is the sum of three elements: \n", + "1. Deployment height (the ADCP's position in the water column)\n", + "2. 
Blanking distance (the minimum distance from the ADCP to the first measurement point)\n", + "3. Cell size (the vertical distance of each measurement bin in the water column)\n", + "\n", + "To ensure accurate readings, it is critical to calibrate the 'range' coordinate to make '0' correspond to the seafloor. This calibration can be achieved using the `set_range_offset` function. This function is also useful when working with a down-facing instrument as it helps account for the depth below the water surface. \n", + "\n", + "For those using a Teledyne RDI ADCP, the TRDI deployment software will prompt you to specify the deployment height/depth during setup. If there's a need for calibration post-deployment, the `set_range_offset` function can be utilized in the same way as described above." + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "" + ] + }, + "execution_count": 5, + "metadata": {}, + "output_type": "execute_result" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "ds[\"vel\"][1].plot()" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": {}, + "outputs": [], + "source": [ + "# The ADCP transducers were measured to be 0.6 m from the feet of the lander\n", + "api.clean.set_range_offset(ds, 0.6)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "So, the center of bin 1 is located at 1.2 m:" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "
<xarray.DataArray 'range' (range: 28)>\n",
+       "array([ 1.2,  1.7,  2.2,  2.7,  3.2,  3.7,  4.2,  4.7,  5.2,  5.7,  6.2,  6.7,\n",
+       "        7.2,  7.7,  8.2,  8.7,  9.2,  9.7, 10.2, 10.7, 11.2, 11.7, 12.2, 12.7,\n",
+       "       13.2, 13.7, 14.2, 14.7])\n",
+       "Coordinates:\n",
+       "  * range    (range) float64 1.2 1.7 2.2 2.7 3.2 ... 12.7 13.2 13.7 14.2 14.7\n",
+       "Attributes:\n",
+       "    units:    m
" ], - "source": [ - "# Remove estimations below 0\n", - "ds_avg['TKE'] = ds_avg['TKE'].where(ds_avg['TKE']>0)\n", - "\n", - "ds_avg['TKE'].plot(cmap='Reds', ylim=(0,11))" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "TKE esimations are generally more complete than those of dissipation rates because they are found directly from the along-beam velocity measurements. Missing TKE estimations exist whenever the noise calculated by the function `doppler_noise_level` is greater than the calculated TKE, as TKE can't be less than zero. Noise levels are affected by the instrument's processor and working frequency, water waves and other sources of \"interference\", instrument motion, current speed, intricacies in the spectra calculation, the ability to see the noise floor in the spectra, etc.\n", - "\n", - "You may also note that high TI doesn't always correlate with high TKE. TI is the ratio of flow speed standard devation to the mean, which is naturally lower when flow speeds are higher. When flow speeds are higher, they also have greater kinetic energy and thereby greater TKE.\n", - "\n", - "There is one other important thing to note on TKE measurements by ADCPs: the minimum turbulence length scale that the ADCP is capable of measuring increases with range from the instrument. This means the instrument is only capable of measuring the TKE of larger and larger turbulent structures as the beams travel farther and farther from the instrument head. One of the benefits of calculating w'w' from the vertical beam is that it isn't limited by this beam spread issue." - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "### 7.6 TKE Production\n", - "\n", - "Though it can't be found from this deployment, we'll go over how to estimate TKE Production. There isn't a specific function in MHKiT-DOLfYN for production, but all the necessary variables are. 
\n", - "\n", - "If we had aligned the ADCP instrument axes to the flow direction (so \"X\" would align with the main flow), we could use the following equation to estimate production:\n", - "\n", - "$P = -(\\overline{u'w'}\\frac{du}{dz} + \\overline{v'w'}\\frac{dv}{dz} + \\overline{w'w'}\\frac{dw}{dz})$\n", - "\n", - "To start, we need the functions `reynolds_stress_4beam` or `stress_tensor_5beam` to get the stress tensor components $\\overline{u'w'}$ and $\\overline{v'w'}$. We also need the vertical TKE component, $\\overline{w'w'}$. \n", - "\n", - "Both of these functions will give comparable results, but it should be noted that `stress_tensor_4beam` assumes the instrument is oriented with 0 degrees pitch and roll, and will throw a warning if they are greater than 5 degrees. The `stress_tensor_5beam` gives more leeway to instrument tilt, but shouldn't be used if pitch and roll angles are greater than 10 degrees." - ] - }, - { - "cell_type": "code", - "execution_count": 32, - "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "c:\\users\\mcve343\\mhkit-python\\mhkit\\dolfyn\\adp\\turbulence.py:383: UserWarning: The beam-variance algorithms assume the instrument's (XYZ) coordinate system is aligned with the principal flow directions.\n", - " warnings.warn(\" The beam-variance algorithms assume the instrument's \"\n", - "c:\\users\\mcve343\\mhkit-python\\mhkit\\dolfyn\\adp\\turbulence.py:391: UserWarning: 100.0 % of measurements have a tilt greater than 5 degrees.\n", - " warnings.warn(f\" {pct_above_thresh} % of measurements have a tilt \"\n" - ] - } + "text/plain": [ + "\n", + "array([ 1.2, 1.7, 2.2, 2.7, 3.2, 3.7, 4.2, 4.7, 5.2, 5.7, 6.2, 6.7,\n", + " 7.2, 7.7, 8.2, 8.7, 9.2, 9.7, 10.2, 10.7, 11.2, 11.7, 12.2, 12.7,\n", + " 13.2, 13.7, 14.2, 14.7])\n", + "Coordinates:\n", + " * range (range) float64 1.2 1.7 2.2 2.7 3.2 ... 
12.7 13.2 13.7 14.2 14.7\n", + "Attributes:\n", + " units: m" + ] + }, + "execution_count": 7, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "ds.range" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### 2.2. Discard Data Above Surface Level\n", + "\n", + "To reduce computational load, we can exclude all data at or above the water surface level. Since the instrument was oriented upwards, we can utilize the pressure sensor data along with the function `find_surface_from_P`. However, this approach necessitates that the pressure sensor was calibrated or 'zeroed' prior to deployment. If the instrument is facing downwards or doesn't include pressure data, the function `find_surface` can be used to detect the seabed or water surface.\n", + "\n", + "It's important to note that Acoustic Doppler Current Profilers (ADCPs) do not measure water salinity, so you'll need to supply this information to the function. The dataset returned by this function includes an additional variable, \"depth\". If `find_surface_from_P` is invoked after `set_range_offset`, \"depth\" represents the distance from the water surface to the seafloor. Otherwise, it indicates the distance to the ADCP pressure sensor.\n", + "\n", + "After determining the \"depth\", you can use the `nan_beyond_surface` function to discard data in depth bins at or above the actual water surface. Be aware that this function will generate a new dataset." + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "metadata": {}, + "outputs": [], + "source": [ + "api.clean.find_surface_from_P(ds, salinity=31)\n", + "ds = api.clean.nan_beyond_surface(ds)" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "" + ] + }, + "execution_count": 9, + "metadata": {}, + "output_type": "execute_result" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "ds[\"vel\"][1].plot()" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### 2.3: Apply an Acoustic Signal Correlation Filter\n", + "\n", + "After removing data from bins at or above the water surface, we typically apply a filter based on acoustic signal correlation to the ADCP data. This helps to eliminate erroneous velocity data points, which can be caused by factors such as bubbles, kelp, fish, etc., moving through one or multiple beams.\n", + "\n", + "You can quickly inspect the data to determine an appropriate correlation value by using the built-in plotting feature of xarray. In the following example, we use xarray's slicing capabilities to display data from beam 1 within a range of 0 to 10 m from the ADCP.\n", + "\n", + "It's important to note that not all ADCPs provide acoustic signal correlation data, which serves as a quantitative measure of signal quality. Older ADCPs may not offer this feature, in which case you can skip this step when using such instruments." + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "" + ] + }, + "execution_count": 10, + "metadata": {}, + "output_type": "execute_result" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "%matplotlib inline\n", + "ds[\"corr\"].sel(beam=1, range=slice(0, 10)).plot()" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "It's beneficial to also review data from the other beams. A significant portion of this data is of high quality. To avoid discarding valuable data with lower correlations, which could be due to natural variations, we can use the `correlation_filter`. This function assigns a value of NaN (not a number) to velocity values corresponding to correlations below 50%.\n", + "\n", + "However, it's important to note that the correlation threshold is dependent on the specifics of the deployment environment and the instrument used. It's not unusual to set a threshold as low as 30%, or even to forgo the use of this function entirely." + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "metadata": {}, + "outputs": [], + "source": [ + "ds = api.clean.correlation_filter(ds, thresh=50)" + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "" + ] + }, + "execution_count": 12, + "metadata": {}, + "output_type": "execute_result" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "ds[\"vel\"][1].plot()" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### 2.4 Rotate Data Coordinate System\n", + "\n", + "After cleaning the data, the next step is to rotate the velocity data into accurate East, North, Up (ENU) coordinates.\n", + "\n", + "ADCPs utilize an internal compass or magnetometer to determine magnetic ENU directions. You can use the set_declination function to adjust the velocity data according to the magnetic declination specific to your geographical coordinates. This declination can be looked up online for specific coordinates.\n", + "\n", + "Instruments save vector data in the coordinate system defined in the deployment configuration file. To make this data meaningful, it must be transformed through various coordinate systems (\"beam\"<->\"inst\"<->\"earth\"<->\"principal\"). This transformation is accomplished using the `rotate2` function. If the \"earth\" (ENU) coordinate system is specified, DOLfYN will automatically rotate the dataset through the required coordinate systems to reach the \"earth\" coordinates. Setting `inplace` to true will modify the input dataset directly, meaning it will not create a new dataset.\n", + "\n", + "In this case, since the ADCP data is already in the \"earth\" coordinate system, the `rotate2` function will return the input dataset without modifications. The `set_declination` function will work no matter the coordinate system." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 13, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Data is already in the earth coordinate system\n" + ] + } + ], + "source": [ + "dolfyn.set_declination(ds, 15.8, inplace=True) # 15.8 deg East\n", + "dolfyn.rotate2(ds, \"earth\", inplace=True)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "To rotate into the principal frame of reference (streamwise, cross-stream, vertical), if desired, we must first calculate the depth-averaged principal flow heading and add it to the dataset attributes. Then the dataset can be rotated using the same `rotate2` function. We use `inplace=False` because we do not want to alter the input dataset here." + ] + }, + { + "cell_type": "code", + "execution_count": 14, + "metadata": {}, + "outputs": [], + "source": [ + "ds.attrs[\"principal_heading\"] = dolfyn.calc_principal_heading(ds[\"vel\"].mean(\"range\"))\n", + "ds_streamwise = dolfyn.rotate2(ds, \"principal\", inplace=False)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## 3. Average the Data\n", + "\n", + "As this deployment was configured in \"burst mode\", a standard step in the analysis process is to average the velocity data into time bins. \n", + "\n", + "However, if the instrument was set up in an \"averaging mode\" (where a specific profile and/or average interval was set, for instance, averaging 5 minutes of data every 30 minutes), this step would have been performed within the ADCP during deployment and can thus be skipped.\n", + "\n", + "To average the data into time bins (also known as ensembles), you should first initialize the binning tool `ADPBinner`. The parameter \"n_bin\" represents the number of data points in each ensemble. In this case, we're dealing with 300 seconds' worth of data. 
The \"fs\" parameter stands for the sampling frequency, which for this deployment is 1 Hz. Once the binning tool is initialized, you can use the `bin_average` function to average the data into ensembles." + ] + }, + { + "cell_type": "code", + "execution_count": 15, + "metadata": { + "scrolled": true + }, + "outputs": [], + "source": [ + "avg_tool = api.ADPBinner(n_bin=ds.fs * 300, fs=ds.fs)\n", + "ds_avg = avg_tool.bin_average(ds)" + ] + }, + { + "cell_type": "code", + "execution_count": 16, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "
<xarray.Dataset>\n",
+       "Dimensions:         (time: 183, dirIMU: 3, range: 28, dir: 4, beam: 4,\n",
+       "                     earth: 3, inst: 3, q: 4, time_b5: 183, range_b5: 28)\n",
+       "Coordinates:\n",
+       "  * time            (time) datetime64[ns] 2020-08-15T00:22:30.001030683 ... 2...\n",
+       "  * dirIMU          (dirIMU) <U1 'E' 'N' 'U'\n",
+       "  * range           (range) float64 1.2 1.7 2.2 2.7 3.2 ... 13.2 13.7 14.2 14.7\n",
+       "  * dir             (dir) <U2 'E' 'N' 'U1' 'U2'\n",
+       "  * beam            (beam) int32 1 2 3 4\n",
+       "  * earth           (earth) <U1 'E' 'N' 'U'\n",
+       "  * inst            (inst) <U1 'X' 'Y' 'Z'\n",
+       "  * q               (q) <U1 'w' 'x' 'y' 'z'\n",
+       "  * time_b5         (time_b5) datetime64[ns] 2020-08-15T00:22:29.938495159 .....\n",
+       "  * range_b5        (range_b5) float64 1.2 1.7 2.2 2.7 ... 13.2 13.7 14.2 14.7\n",
+       "Data variables: (12/38)\n",
+       "    c_sound         (time) float32 1.502e+03 1.502e+03 ... 1.499e+03 1.498e+03\n",
+       "    U_std           (range, time) float32 0.04232 0.04293 0.04402 ... nan nan\n",
+       "    temp            (time) float32 14.49 14.59 14.54 14.45 ... 13.62 13.56 13.5\n",
+       "    pressure        (time) float32 9.712 9.699 9.685 9.67 ... 9.58 9.584 9.591\n",
+       "    mag             (dirIMU, time) float32 72.37 72.4 72.38 ... -197.1 -197.1\n",
+       "    accel           (dirIMU, time) float32 -0.3584 -0.361 ... 9.714 9.712\n",
+       "    ...              ...\n",
+       "    boost_running   (time) float32 0.1267 0.1333 0.13 ... 0.2267 0.22 0.22\n",
+       "    heading         (time) float32 3.287 3.261 3.337 3.289 ... 3.331 3.352 3.352\n",
+       "    pitch           (time) float32 -0.05523 -0.07217 ... -0.04288 -0.0429\n",
+       "    roll            (time) float32 -7.414 -7.424 -7.404 ... -6.446 -6.433 -6.436\n",
+       "    water_density   (time) float32 1.023e+03 1.023e+03 ... 1.023e+03 1.023e+03\n",
+       "    depth           (time) float32 10.28 10.26 10.25 10.23 ... 10.14 10.15 10.15\n",
+       "Attributes: (12/41)\n",
+       "    fs:                        1\n",
+       "    n_bin:                     300\n",
+       "    n_fft:                     300\n",
+       "    description:               Binned averages calculated from ensembles of s...\n",
+       "    filehead_config:           {"CLOCKSTR": {"TIME": "\\"2020-08-13 13:56:21\\"...\n",
+       "    inst_model:                Signature1000\n",
+       "    ...                        ...\n",
+       "    has_imu:                   1\n",
+       "    beam_angle:                25\n",
+       "    h_deploy:                  0.6\n",
+       "    declination:               15.8\n",
+       "    declination_in_orientmat:  1\n",
+       "    principal_heading:         11.1898
" ], - "source": [ - "# Beam-variance equation for 4-beam ADCPs\n", - "stress_vec = avg_tool.reynolds_stress_4beam(ds_beam, noise=ds_avg['noise'], orientation='up', beam_angle=25)\n", - "upwp_ = stress_vec[1]\n", - "vpwp_ = stress_vec[2]\n", - "wpwp_ = ds_avg['wpwp_bar'] # Found from the vertical along-beam velocity (vel_b5) above\n", - "\n", - "# OR #\n", - "\n", - "# Beam-variance equation for 5-beam ADCPs\n", - "tke_vec, stress_vec = avg_tool.stress_tensor_5beam(ds_beam, noise=ds_avg['noise'], orientation='up', beam_angle=25)\n", - "upwp_ = stress_vec[1]\n", - "vpwp_ = stress_vec[2]\n", - "wpwp_ = tke_vec[2]" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "The shear components can be found from the aptly named functions `dudz`, `dvdz`, and `dwdz` in ADPBinner. These functions, which are useful alone in their own right, estimate the shear in the velocity vector between respective depth bins. There is always correlation between velocity measurements in adjacent depth bins, based on ADCP operation principles, which is why \"estimation\" is also used here for shear.\n", - "\n", - "The shear functions operate on the raw velocity vector in the principal reference frame and need to be ensemble-averaged here. This can be done by nesting the `d*dz` function within the ADPBinner's `mean` function. With the ensemble shear known, we can put all the components together to get a production estimation." - ] - }, + "text/plain": [ + "\n", + "Dimensions: (time: 183, dirIMU: 3, range: 28, dir: 4, beam: 4,\n", + " earth: 3, inst: 3, q: 4, time_b5: 183, range_b5: 28)\n", + "Coordinates:\n", + " * time (time) datetime64[ns] 2020-08-15T00:22:30.001030683 ... 2...\n", + " * dirIMU (dirIMU) " + ] + }, + "execution_count": 18, + "metadata": {}, + "output_type": "execute_result" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "%matplotlib inline\n", + "from matplotlib import pyplot as plt\n", + "import matplotlib.dates as dt\n", + "\n", + "ax = plt.figure(figsize=(10, 6)).add_axes([0.14, 0.14, 0.8, 0.74])\n", + "# Plot flow speed\n", + "t = dolfyn.time.dt642date(ds_avg[\"time\"])\n", + "plt.pcolormesh(t, ds_avg[\"range\"], ds_avg[\"U_mag\"], cmap=\"Blues\", shading=\"nearest\")\n", + "# Plot the water surface\n", + "ax.plot(t, ds_avg[\"depth\"])\n", + "\n", + "# Set up time on x-axis\n", + "ax.set_xlabel(\"Time\")\n", + "ax.xaxis.set_major_formatter(dt.DateFormatter(\"%H:%M\"))\n", + "\n", + "ax.set_ylabel(\"Altitude [m]\")\n", + "ax.set_ylim([0, 12])\n", + "plt.colorbar(label=\"Speed [m/s]\")" + ] + }, + { + "cell_type": "code", + "execution_count": 19, + "metadata": { + "scrolled": false + }, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "ax = plt.figure(figsize=(10, 6)).add_axes([0.14, 0.14, 0.8, 0.74])\n", + "# Plot flow direction\n", + "plt.pcolormesh(t, ds_avg[\"range\"], ds_avg[\"U_dir\"], cmap=\"twilight\", shading=\"nearest\")\n", + "# Plot the water surface\n", + "ax.plot(t, ds_avg[\"depth\"])\n", + "\n", + "# set up time on x-axis\n", + "ax.set_xlabel(\"Time\")\n", + "ax.xaxis.set_major_formatter(dt.DateFormatter(\"%H:%M\"))\n", + "\n", + "ax.set_ylabel(\"Altitude [m]\")\n", + "ax.set_ylim([0, 12])\n", + "plt.colorbar(label=\"Horizontal Vel Dir [deg CW from true N]\");" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Saving and Loading DOLfYN datasets\n", + "Datasets can be saved and reloaded using the `save` and `load` functions. Xarray is saved natively in netCDF format, hence the \".nc\" extension.\n", + "\n", + "Note: DOLfYN datasets cannot be saved using xarray's native `ds.to_netcdf`; however, DOLfYN datasets can be opened using `xarray.open_dataset`." + ] + }, + { + "cell_type": "code", + "execution_count": 20, + "metadata": {}, + "outputs": [], + "source": [ + "# Uncomment these lines to save and load to your current working directory\n", + "# dolfyn.save(ds, 'your_data.nc')\n", + "# ds_saved = dolfyn.load('your_data.nc')" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## 7. Turbulence Statistics\n", + "\n", + "The next section of this jupyter notebook will run through the turbulence analysis of the data presented here. There was no intention of measuring turbulence in the deployment that collected this data, so results depicted here are not the highest quality. 
The quality of turbulence measurements from an ADCP depends heavily on the quality of the deployment setup and data collection, particularly instrument frequency, sampling frequency and depth bin size.\n", + "\n", + "Read more on proper ADCP setup for turbulence measurements in: Thomson, Jim, et al. \"Measurements of turbulence at two tidal energy sites in Puget Sound, WA.\" IEEE Journal of Oceanic Engineering 37.3 (2012): 363-374.\n", + "\n", + "Most functions related to turbulence statistics in MHKiT-DOLfYN have the papers they originate from referenced in their docstrings.\n", + "\n", + "### 7.1 Turbulence Intensity\n", + "For most users, turbulence intensity (TI), the ratio of the ensemble standard deviation to ensemble flow speed given as a percent, is all most will need. In MHKiT, this can be simply calculated as `.velds.I`, but be aware that this will be a conservative estimate. Another function, `turbulence_intensity`, is capable of subtracting instrument noise from this parameter and is discussed below. The noise-subtracted TI is more accurate and typically 1-2% lower than the non-noise-subtracted estimation.\n", + "\n" + ] + }, + { + "cell_type": "code", + "execution_count": 21, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "" + ] + }, + "execution_count": 21, + "metadata": {}, + "output_type": "execute_result" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "# Turbulence Intensity\n", + "ds_avg[\"TI\"] = ds_avg.velds.I\n", + "ds_avg[\"TI\"].plot(cmap=\"Reds\", ylim=(0, 11))" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### 7.2 Power Spectral Densities (Auto-Spectra)\n", + "\n", + "Other turbulence parameters include the TKE power- and cross-spectral densities (i.e the power spectra), turbulent kinetic energy (TKE, i.e. the variances of velocity vector components), Reynolds stress vector (i.e. the co-variances of velocity vector components), TKE dissipation rate, and TKE production rate. These quantities are primarily used to inform and verify hydrodynamic and coastal models, which take some or all of these quantities as input.\n", + "\n", + "The TKE production rate is the rate at which kinetic energy (KE) transitions from a useful state (able to do \"work\" in the physics sense) to turbulent; TKE is the actual amount of turbulent KE in the water; and TKE dissipation rate is the rate at which turbulent KE is lost to non-motion forms of energy (heat, sound, etc) due to viscosity. The power spectra are used to depict and quantify this energy in the frequency domain, and creating them are the first step in turbulence analysis.\n", + "\n", + "We'll start by looking at the power spectra, specifically the auto-spectra from the vertical beam (\"auto\" meaning the variance of a single vector direction, e.g. $\\overline{u'^2}$, vs \"cross\", meaning the covariance of two directions, e.g. $\\overline{u'w'}$). This can be done using the `power_spectral_density` function from the `ADPBinner` we created (\"avg_tool\"). We'll create spectra at the middle water column, at a depth of 5 m, and use a number of FFT's equal to 1/3 the bin size." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 22, + "metadata": {}, + "outputs": [], + "source": [ + "rng = 5 # m\n", + "vel_up = ds[\"vel_b5\"].sel(range_b5=rng, method=\"nearest\") # vertical velocity\n", + "U = ds_avg[\"U_mag\"].sel(\n", + " range=5, method=\"nearest\"\n", + ") # flow speed, for plotting in the next block\n", + "\n", + "ds_avg[\"auto_spectra_5m\"] = avg_tool.power_spectral_density(\n", + " vel_up, freq_units=\"Hz\", n_fft=ds_avg.n_bin // 3\n", + ")" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "In the auto-spectra, we're primarily looking for three components: the energy-producing region, the isotropic turbulence region (so-called \"red noise\"), and the instrument noise floor (termed \"white noise\"). \n", + "\n", + "The block below organizes and plots the power spectra by the corresponding ensemble speed, averaging them by 0.1 m/s velocity bins. Note that if an ensemble is missing data that wasn't filled in, a power spectrum will not be calculated for that ensemble timestamp." + ] + }, + { + "cell_type": "code", + "execution_count": 23, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "[Text(0.5, 0, 'Frequency [Hz]'),\n", + " Text(0, 0.5, 'PSD [m2 s-2 Hz-1]'),\n", + " (0.01, 1),\n", + " (0.0005, 0.1)]" + ] + }, + "execution_count": 23, + "metadata": {}, + "output_type": "execute_result" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "import numpy as np\n", + "import matplotlib.pyplot as plt\n", + "import matplotlib as mpl\n", + "\n", + "plt.rcParams.update({\"font.size\": 18, \"font.family\": \"Times New Roman\"})\n", + "\n", + "\n", + "def plot_spectra_by_color(auto_spectra, U_mag, ax, fig, cbar_max=4.0):\n", + " U = U_mag.values\n", + " U_max = U_mag.max().values\n", + "\n", + " # Average spectra into 0.1 m/s velocity bins\n", + " speed_bins = np.arange(0.5, U_max, 0.1)\n", + " time = [t for t in auto_spectra.dims if \"time\" in t][0]\n", + " S_group = auto_spectra.assign_coords({time: U}).rename({time: \"speed\"})\n", + " group = S_group.groupby_bins(\"speed\", speed_bins)\n", + " count = group.count().values\n", + " S = group.mean()\n", + "\n", + " # define the colormap\n", + " cmap = plt.cm.turbo\n", + " # define the bins and normalize\n", + " bounds = np.arange(0.5, cbar_max, 0.1)\n", + " norm = mpl.colors.BoundaryNorm(bounds, cmap.N)\n", + " colors = cmap(norm(speed_bins))\n", + "\n", + " # plot\n", + " for i in range(len(speed_bins) - 1):\n", + " ax.loglog(auto_spectra[\"freq\"], S[i], c=colors[i])\n", + " ax.grid()\n", + "\n", + " # create a second axes for the colorbar\n", + " cax = fig.add_axes([0.8, 0.07, 0.03, 0.88])\n", + " # cax, _ = mpl.colorbar.make_axes(fig.gca())\n", + " sm = mpl.colorbar.ColorbarBase(\n", + " cax,\n", + " cmap=cmap,\n", + " norm=norm,\n", + " spacing=\"proportional\",\n", + " ticks=bounds,\n", + " boundaries=bounds,\n", + " format=\"%1.1f\",\n", + " label=\"Velocity [m/s]\",\n", + " )\n", + "\n", + " # Add -5/3 slope line\n", + " m = -5 / 3\n", + " x = np.logspace(-1, 0.5)\n", + " y = 10 ** (-3) * x**m\n", + " ax.loglog(x, y, \"--\", c=\"black\", label=\"$f^{-5/3}$\")\n", + " ax.legend()\n", + "\n", + " return ax, sm\n", + "\n", + "\n", + "# Set up figure\n", + "fig, ax = plt.subplots(1, 1, figsize=(5, 5))\n", + "fig.subplots_adjust(left=0.2, right=0.75, top=0.95, 
bottom=0.1)\n", + "\n", + "# Plot spectra by color\n", + "plot_spectra_by_color(ds_avg[\"auto_spectra_5m\"], U, ax, fig, cbar_max=2.0)\n", + "# Set axes\n", + "ax.set(\n", + " xlabel=\"Frequency [Hz]\",\n", + " ylabel=\"PSD [m2 s-2 Hz-1]\",\n", + " xlim=(0.01, 1),\n", + " ylim=(0.0005, 0.1),\n", + ")" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "In the figure above, we can see the energy-producing turbulent structures below a frequency of 0.2 Hz (one tick to the right of \"10^-1\"). The isotropic turbulence cascade, seen by the dashed f^(-5/3) slope (from Kolmogorov's theory of turbulence) begins at around 0.2 Hz and continues until we reach the Nyquist frequency at 0.5 Hz (1/2 the instrument's sampling frequency, 1 Hz). The instrument's noise floor can't be seen here, but will show up as the flattened part of the spectra at the highest frequencies. For this instrument (Nortek Signature1000), the noise floor typically varies around 10^-3, depending on flow speed and range distance." + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### 7.3 Instrument Noise\n", + "\n", + "The next thing we want to do is calculate the instrument's Doppler noise floor from the spectrum we calculated above. (We are making the assumption that the noise floor of the vertical beam is the same as the noise floor of the other 4 beams). This gives us a timeseries of the noise floor, which varies by instrument and with flow speed, at that depth bin.\n", + "\n", + "We can do this using the `doppler_noise_level` function. The two inputs for this function are the power spectra and \"pct_fN\", the fraction of the Nyquist frequency at which the noise floor begins. Because in this particular dataset we can't see the noise floor, we'll just use 90% or pct_fN=0.9 as an example. If the noise floor began at 0.4 Hz and ran until our maximum frequency of 0.5 Hz, we'd use pct_fN = 0.4 Hz / 0.5 Hz = 0.8."
+ ] + }, + { + "cell_type": "code", + "execution_count": 24, + "metadata": {}, + "outputs": [], + "source": [ + "ds_avg[\"noise_5m\"] = avg_tool.doppler_noise_level(ds_avg[\"auto_spectra_5m\"], pct_fN=0.9)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### 7.4 TKE Dissipation Rate\n", + "\n", + "Because we can see the isotropic turbulence cascade (0.2 - 0.5 Hz) at this depth bin (5 m altitude), we can calculate the TKE dissipation rate at this location from the spectra itself. This can be done using `dissipation_rate_LT83`, whose inputs are the power spectra, the ensemble speed, the frequency range of the isotropic cascade, and the instrument's noise." + ] + }, + { + "cell_type": "code", + "execution_count": 25, + "metadata": {}, + "outputs": [], + "source": [ + "# Frequency range of isotropic turbulence cascade in same units as PSD frequency vector\n", + "f_rng = [0.2, 0.5]\n", + "# Dissipation rate\n", + "ds_avg[\"dissipation_rate_5m\"] = avg_tool.dissipation_rate_LT83(\n", + " ds_avg[\"auto_spectra_5m\"], U, freq_range=f_rng, noise=ds_avg[\"noise_5m\"]\n", + ")" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "We have just found the spectra and dissipation rate from a single depth bin at an altitude of 5 m from the seafloor, but typically we want the spectra and dissipation rates from the entire measurement profile.
If we want to look at the spectra and dissipation rates from all depth bins, we can set up a \"for\" loop on the range coordinate and merge them together:" + ] + }, + { + "cell_type": "code", + "execution_count": 26, + "metadata": {}, + "outputs": [], + "source": [ + "import xarray as xr\n", + "\n", + "spec = [None] * len(ds.range)\n", + "e = [None] * len(ds.range)\n", + "n = [None] * len(ds.range)\n", + "\n", + "for r in range(len(ds[\"range\"])):\n", + " # Calc spectra from each depth bin using the 5th beam\n", + " spec[r] = avg_tool.power_spectral_density(\n", + " ds[\"vel_b5\"].isel(range_b5=r), freq_units=\"Hz\"\n", + " )\n", + "\n", + " # Calculate doppler noise from spectra from each depth bin\n", + " n[r] = avg_tool.doppler_noise_level(spec[r], pct_fN=0.9)\n", + "\n", + " # Calc dissipation rate from each spectra\n", + " e[r] = avg_tool.dissipation_rate_LT83(\n", + " spec[r], ds_avg.velds.U_mag.isel(range=r), freq_range=f_rng, noise=n[r]\n", + " )\n", + "\n", + "ds_avg[\"auto_spectra\"] = xr.concat(spec, dim=\"range\")\n", + "ds_avg[\"noise\"] = xr.concat(n, dim=\"range\")\n", + "ds_avg[\"dissipation_rate\"] = xr.concat(e, dim=\"range\")\n", + "\n", + "del spec, n, e # save memory" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Now that we have a profile timeseries of dissipation rate, we need apply some quality control (QC). Since we can't look at each individual spectrum to ensure we can see the isotropic turbulence cascade, we want to QC the output from `dissipation_rate_LT83` to make sure what was calculated actually falls on a f^(-5/3) slope. We can do this using the function `check_turbulence_cascade_slope`, which uses linear regression on the log-transformed LT83 equation (ref. to Lumley and Terray, 1983, see docstring) to calculate the spectral slope for the given frequency range. \n", + "\n", + "In our case, we're calculating the slope of each spectrum between 0.2 and 0.5 Hz. 
We'll use a cutoff of 20% for the error, but this can be lowered if there still appear to be erroneous estimations from visual inspection of the spectra." + ] + }, + { + "cell_type": "code", + "execution_count": 27, + "metadata": {}, + "outputs": [], + "source": [ + "# Quality control dissipation rate estimation\n", + "slope = avg_tool.check_turbulence_cascade_slope(\n", + " ds_avg[\"auto_spectra\"], freq_range=f_rng\n", + ")\n", + "\n", + "# Check that percent difference from -5/3 is not greater than 20%\n", + "mask = abs((slope[0].values - (-5 / 3)) / (-5 / 3)) <= 0.20\n", + "\n", + "# Keep good data\n", + "ds_avg[\"dissipation_rate\"] = ds_avg[\"dissipation_rate\"].where(mask)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "If we plot the dissipation rate below in a colormap, we can see that the profile map has a lot of missing data. One of the reasons is that the 1 Hz sampling rate doesn't provide enough information needed to make dissipation rate estimations, and the other part is that turbulence measurements push the boundaries of what ADCPs are capable of.\n", + "\n", + "Also, 1x10^-4 to 3x10^-4 $m^2/s^3$ is reasonable for a dissipation rate estimate for the 1 - 1.5 m/s current speeds measured here. They can be a magnitude greater for faster flow speeds, typically increase closer to the seafloor, and depend heavily on bathymetry and regional hydrodynamics." + ] + }, + { + "cell_type": "code", + "execution_count": 28, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "" + ] + }, + "execution_count": 28, + "metadata": {}, + "output_type": "execute_result" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "ds_avg[\"dissipation_rate\"].plot(cmap=\"turbo\", ylim=(0, 11))" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### 7.5 Noise-Corrected Turbulence Intensity\n", + "\n", + "Now that we've calculated the noise floor for each ping, we can recalculate TI and include subtracting instrument noise using the `turbulence_intensity` function. If we subtract this from the non-noise corrected function, we can see there's a large difference\n", + "at slower slow speeds, but the average difference is about 0.008 (0.8%). Notice this will also remove measurements where noise is \n", + "high." + ] + }, + { + "cell_type": "code", + "execution_count": 29, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "Text(0.5, 1.0, 'TI Difference')" + ] + }, + "execution_count": 29, + "metadata": {}, + "output_type": "execute_result" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "ds_avg[\"turbulence_intensity\"] = avg_tool.turbulence_intensity(\n", + " ds.velds.U_mag, noise=ds_avg[\"noise\"]\n", + ")\n", + "\n", + "(ds_avg[\"TI\"] - ds_avg[\"turbulence_intensity\"]).plot(cmap=\"Greens\", ylim=(0, 11))\n", + "plt.title(\"TI Difference\")" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### 7.6 Turbulent Kinetic Energy (TKE) Components\n", + "\n", + "The next parameters we'll find here are the vertical TKE component and the total TKE magnitude. Since we're using the vertical beam on the ADCP, we'll directly measure the vertical TKE component from the along-beam velocity using the `turbulent_kinetic_energy` function. This function is capable of calculating TKE for any along-beam velocity.\n", + "\n", + "We can also use the so-called \"beam-variance\" equations to estimate the Reynolds stress tensor components (i.e. $\\overline{u'^2}$, $\\overline{v'^2}$, $\\overline{w'^2}$, $\\overline{u'v'}$, $\\overline{u'w'^2}$, $\\overline{v'w'^2}$), which define the stresses acting on an element of water. These equations are built into the functions `stress_tensor_5beam` and `stress_tensor4beam`. Since we're using a 5-beam ADCP, we can calculate the total TKE as well using `total_turbulent_kinetic_energy`, which is a wrapper around the 5-beam variance function.\n", + "\n", + "#### Quick 5-beam ADCP lesson before we dive in:\n", + "\n", + "There are a couple caveats to calculating Reynolds stress tensor components:\n", + " 1. Because this instrument only has 5 beams, we can only find 5 of the 6 components (6 unkowns, 5 knowns)\n", + " 2. Because the ADCP's instrument (XYZ) axes weren't aligned with the flow during deployment, we don't know what direction these components are aligned to (i.e. the 'u' direction is not necessarily the streamwise direction)\n", + " 3. 
It is possible to rotate the tensor, but we'd need to know all 6 components to do so properly.\n", + "\n", + "That being said, even if we don't know which direction the 3 TKE components ($\\overline{u'^2}$, $\\overline{v'^2}$, $\\overline{w'^2}$) are oriented, we can still combine them and get the total TKE magnitude.\n", + "\n", + "We'll first calculate the vertical TKE component, using the function `turbulent_kinetic_energy`, inputting our raw vertical beam data and the noise floors we calculated above for each ensemble." + ] + }, + { + "cell_type": "code", + "execution_count": 30, + "metadata": {}, + "outputs": [], + "source": [ + "# Vertical TKE component (w'w' bar)\n", + "ds_avg[\"wpwp_bar\"] = avg_tool.turbulent_kinetic_energy(\n", + " ds[\"vel_b5\"], noise=ds_avg[\"noise\"]\n", + ")" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Next we can calculate the TKE magnitude using the function `total_turbulent_kinetic_energy`. This method is a wrapper around the `stress_tensor_5beam` function, which calculates the individual Reynolds stress tensor components and takes the same inputs. As an fyi, this function will drop at least one warning every time it's run, primarily the coordinate system warning. This function also requires the input raw data to be in beam coordinates, so we'll create a copy of the raw data and rotate it to 'beam'. If you do not, this function will do so automatically and rotate the original." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 31, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "c:\\users\\mcve343\\mhkit-python\\mhkit\\dolfyn\\adp\\turbulence.py:401: UserWarning: The beam-variance algorithms assume the instrument's (XYZ) coordinate system is aligned with the principal flow directions.\n", + " warnings.warn(\n" + ] + } + ], + "source": [ + "ds_beam = dolfyn.rotate2(ds, \"beam\", inplace=False)\n", + "ds_avg[\"TKE\"] = avg_tool.total_turbulent_kinetic_energy(\n", + " ds_beam, noise=ds_avg[\"noise\"], orientation=\"up\", beam_angle=25\n", + ")" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "And plotting TKE:" + ] + }, + { + "cell_type": "code", + "execution_count": 32, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "" + ] + }, + "execution_count": 32, + "metadata": {}, + "output_type": "execute_result" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "# Remove estimations below 0\n", + "ds_avg[\"TKE\"] = ds_avg[\"TKE\"].where(ds_avg[\"TKE\"] > 0)\n", + "\n", + "ds_avg[\"TKE\"].plot(cmap=\"Reds\", ylim=(0, 11))" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "TKE estimations are generally more complete than those of dissipation rates because they are found directly from the along-beam velocity measurements. Missing TKE estimations exist whenever the noise calculated by the function `doppler_noise_level` is greater than the calculated TKE, as TKE can't be less than zero. Noise levels are affected by the instrument's processor and working frequency, water waves and other sources of \"interference\", instrument motion, current speed, intricacies in the spectra calculation, the ability to see the noise floor in the spectra, etc.\n", + "\n", + "You may also note that high TI doesn't always correlate with high TKE. TI is the ratio of flow speed standard deviation to the mean, which is naturally lower when flow speeds are higher. When flow speeds are higher, they also have greater kinetic energy and thereby greater TKE.\n", + "\n", + "There is one other important thing to note on TKE measurements by ADCPs: the minimum turbulence length scale that the ADCP is capable of measuring increases with range from the instrument. This means the instrument is only capable of measuring the TKE of larger and larger turbulent structures as the beams travel farther and farther from the instrument head. One of the benefits of calculating w'w' from the vertical beam is that it isn't limited by this beam spread issue." + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### 7.7 TKE Production\n", + "\n", + "Though it can't be found from this deployment, we'll go over how to estimate TKE Production. There isn't a specific function in MHKiT-DOLfYN for production, but all the necessary variables are. 
\n", + "\n", + "If we had aligned the ADCP instrument axes to the flow direction (so \"X\" would align with the main flow), we could use the following equation to estimate production:\n", + "\n", + "$P = -(\\overline{u'w'}\\frac{du}{dz} + \\overline{v'w'}\\frac{dv}{dz} + \\overline{w'w'}\\frac{dw}{dz})$\n", + "\n", + "To start, we need the functions `reynolds_stress_4beam` or `stress_tensor_5beam` to get the stress tensor components $\\overline{u'w'}$ and $\\overline{v'w'}$. We also need the vertical TKE component, $\\overline{w'w'}$. \n", + "\n", + "Both of these functions will give comparable results, but it should be noted that `reynolds_stress_4beam` assumes the instrument is oriented with 0 degrees pitch and roll, and will throw a warning if they are greater than 5 degrees. The `stress_tensor_5beam` gives more leeway to instrument tilt, but shouldn't be used if pitch and roll angles are greater than 10 degrees." + ] + }, + { + "cell_type": "code", + "execution_count": 33, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "c:\\users\\mcve343\\mhkit-python\\mhkit\\dolfyn\\adp\\turbulence.py:401: UserWarning: The beam-variance algorithms assume the instrument's (XYZ) coordinate system is aligned with the principal flow directions.\n", + " warnings.warn(\n", + "c:\\users\\mcve343\\mhkit-python\\mhkit\\dolfyn\\adp\\turbulence.py:411: UserWarning: 100.0 % of measurements have a tilt greater than 5 degrees.\n", + " warnings.warn(\n" + ] + } + ], + "source": [ + "# Beam-variance equation for 4-beam ADCPs\n", + "stress_vec = avg_tool.reynolds_stress_4beam(\n", + " ds_beam, noise=ds_avg[\"noise\"], orientation=\"up\", beam_angle=25\n", + ")\n", + "upwp_ = stress_vec[1]\n", + "vpwp_ = stress_vec[2]\n", + "wpwp_ = ds_avg[\"wpwp_bar\"] # Found from the vertical along-beam velocity (vel_b5) above\n", + "\n", + "# OR #\n", + "\n", + "# Beam-variance equation for 5-beam ADCPs\n", + "tke_vec, stress_vec = 
avg_tool.stress_tensor_5beam(\n", + " ds_beam, noise=ds_avg[\"noise\"], orientation=\"up\", beam_angle=25\n", + ")\n", + "upwp_ = stress_vec[1]\n", + "vpwp_ = stress_vec[2]\n", + "wpwp_ = tke_vec[2]" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "The shear components can be found from the aptly named functions `dudz`, `dvdz`, and `dwdz` in ADPBinner. These functions, which are useful alone in their own right, estimate the shear in the velocity vector between respective depth bins. There is always correlation between velocity measurements in adjacent depth bins, based on ADCP operation principles, which is why \"estimation\" is also used here for shear.\n", + "\n", + "The shear functions operate on the raw velocity vector in the principal reference frame and need to be ensemble-averaged here. This can be done by nesting the `d*dz` function within the ADPBinner's `mean` function. With the ensemble shear known, we can put all the components together to get a production estimation." + ] + }, + { + "cell_type": "code", + "execution_count": 34, + "metadata": {}, + "outputs": [], + "source": [ + "# Find and ensemble-average shear\n", + "dudz = avg_tool.mean(avg_tool.dudz(ds_streamwise[\"vel\"]).values)\n", + "dvdz = avg_tool.mean(avg_tool.dvdz(ds_streamwise[\"vel\"]).values)\n", + "dwdz = avg_tool.mean(avg_tool.dwdz(ds_streamwise[\"vel\"]).values)\n", + "\n", + "# Calculate Production\n", + "P = -(upwp_ * dudz + vpwp_ * dvdz + wpwp_ * dwdz)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### 7.8 TKE Balance \n", + "\n", + "We can plot TKE Production and compare it to our dissipation rate calculations to get an understanding of the TKE balance. In a well mixed coastal environment, we expect production and dissipation to be approximately equal. 
Our production estimates aren't accurate because our stress components aren't aligned with the flow, so if we plot them, we see drastic differences (1x10^-3 $m^2/s^3$ is quite large) profile here." + ] + }, + { + "cell_type": "code", + "execution_count": 35, + "metadata": {}, + "outputs": [ { - "cell_type": "code", - "execution_count": 33, - "metadata": {}, - "outputs": [], - "source": [ - "# Find and ensemble-average shear\n", - "dudz = avg_tool.mean(avg_tool.dudz(ds_streamwise['vel']).values)\n", - "dvdz = avg_tool.mean(avg_tool.dvdz(ds_streamwise['vel']).values)\n", - "dwdz = avg_tool.mean(avg_tool.dwdz(ds_streamwise['vel']).values)\n", - "\n", - "# Calculate Production\n", - "P = -(upwp_*dudz + vpwp_*dvdz + wpwp_*dwdz)" + "data": { + "text/plain": [ + "Text(0.5, 1.0, 'TKE Balance')" ] + }, + "execution_count": 35, + "metadata": {}, + "output_type": "execute_result" }, { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "### 7.7 TKE Balance \n", - "\n", - "We can plot TKE Production and compare it to our dissipation rate calculations to get an understanding of the TKE balance. In a well mixed coastal environment, we expect production and dissipation to be approximately equal. Our production estimates aren't accurate because our stress components aren't aligned with the flow, so if we plot them, we see drastic differences (1x10^-3 $m^2/s^3$ is quite large) profile here." + "data": { + "image/png": "", + "text/plain": [ + "
" ] + }, + "metadata": {}, + "output_type": "display_data" }, { - "cell_type": "code", - "execution_count": 34, - "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "Text(0.5, 1.0, 'TKE Balance')" - ] - }, - "execution_count": 34, - "metadata": {}, - "output_type": "execute_result" - }, - { - "data": { - "image/png": "", - "text/plain": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - }, - { - "data": { - "image/png": "", - "text/plain": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], - "source": [ - "# Remove estimations below 0\n", - "P = P.where(P>0)\n", - "P.plot(cmap='turbo', ylim=(0,11))\n", - "plt.title('TKE Production') # remove bogus title\n", - "\n", - "\n", - "\n", - "# Plot difference between production and dissipation\n", - "plt.figure()\n", - "(P - ds_avg['dissipation_rate'].values).plot(ylim=(0,11))\n", - "plt.title('TKE Balance')" + "data": { + "image/png": "", + "text/plain": [ + "
" ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [] - } - ], - "metadata": { - "interpreter": { - "hash": "5cfd453a1a1cce2f32ea80f99ff7da863344217116d39185ac62b248c2577445" - }, - "kernelspec": { - "display_name": "Python 3 (ipykernel)", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.9.12" + }, + "metadata": {}, + "output_type": "display_data" } + ], + "source": [ + "# Remove estimations below 0\n", + "P = P.where(P > 0)\n", + "P.plot(cmap=\"turbo\", ylim=(0, 11))\n", + "plt.title(\"TKE Production\") # remove bogus title\n", + "\n", + "\n", + "# Plot difference between production and dissipation\n", + "plt.figure()\n", + "(P - ds_avg[\"dissipation_rate\"].values).plot(ylim=(0, 11))\n", + "plt.title(\"TKE Balance\")" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [] + } + ], + "metadata": { + "interpreter": { + "hash": "5cfd453a1a1cce2f32ea80f99ff7da863344217116d39185ac62b248c2577445" + }, + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" }, - "nbformat": 4, - "nbformat_minor": 4 + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.10.13" + } + }, + "nbformat": 4, + "nbformat_minor": 4 } diff --git a/examples/adv_example.ipynb b/examples/adv_example.ipynb index 3773578c4..1fe898ede 100644 --- a/examples/adv_example.ipynb +++ b/examples/adv_example.ipynb @@ -1,915 +1,922 @@ { - "cells": [ - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - 
"source": [ - "# Reading ADV Data with MHKiT\n", - "\n", - "This example presents a simplified workflow for analyzing Acoustic Doppler Velocimetry (ADV) data using MHKiT. MHKiT incorporates the DOLfYN codebase as a module to handle ADV and Acoustic Doppler Current Profiler (ADCP) data.\n", - "\n", - "A standard ADV data analysis workflow can be segmented into the following steps:\n", - "\n", - "1. **Raw Data Review**: Evaluate the original data by verifying timestamps and assessing the quality of velocity data, specifically looking for any data spikes.\n", - "\n", - "2. **Data Cleaning**: Identify and eliminate any spurious data points. If needed, bad data points can be replaced with interpolated values.\n", - "\n", - "3. **Data Rotation**: Transform the data into the principal flow coordinates, which are the streamwise, cross-stream, and vertical directions.\n", - "\n", - "4. **Data Averaging**: Aggregate the data into bins or ensembles, each of which spans a predefined time length, typically between 5 and 10 minutes.\n", - "\n", - "5. **Statistical Analysis**: Compute turbulence statistics such as turbulence intensity, Turbulent Kinetic Energy (TKE), and Reynolds stresses for the observed flow field.\n", - "\n", - "Start your analysis by importing the necessary tools:" - ] - }, - { - "cell_type": "code", - "execution_count": 1, - "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "c:\\Users\\mcve343\\Anaconda3\\lib\\site-packages\\xarray\\backends\\cfgrib_.py:29: UserWarning: Failed to load cfgrib - most likely there is a problem accessing the ecCodes library. 
Try `import cfgrib` to get the full error message\n", - " warnings.warn(\n" - ] - } - ], - "source": [ - "from mhkit import dolfyn\n", - "from mhkit.dolfyn.adv import api" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "## Read Raw Instrument Data" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "DOLfYN currently only carries support for the Nortek Vector ADV. The example loaded here is a short clip of data from a test deployment to show DOLfYN's capabilities.\n", - "\n", - "Start by reading in the raw datafile downloaded from the instrument. The `dolfyn.read` function reads the raw file and dumps the information into an xarray Dataset, which contains three groups of variables:\n", - "\n", - "1. Velocity, amplitude, and correlation of the Doppler velocimetry\n", - "2. Measurements of the instrument's bearing and environment\n", - "3. Orientation matrices DOLfYN uses for rotating through coordinate frames." - ] - }, - { - "cell_type": "code", - "execution_count": 2, - "metadata": { - "scrolled": true - }, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Reading file data/dolfyn/vector_data01.VEC ...\n" - ] - } - ], - "source": [ - "ds = dolfyn.read('data/dolfyn/vector_data01.VEC')" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "There are two ways to see what's in a Dataset. The first is to simply type the dataset's name to see the standard xarray output. To access a particular variable in a dataset, use dict-style (`ds['vel']`) or attribute-style syntax (`ds.vel`). See the [xarray docs](http://xarray.pydata.org/en/stable/getting-started-guide/quick-overview.html) for more details on how to use the xarray format." - ] - }, - { - "cell_type": "code", - "execution_count": 3, - "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "
<xarray.Dataset>\n",
-              "Dimensions:              (x1: 3, x2: 3, time: 122912, dir: 3, beam: 3,\n",
-              "                          earth: 3, inst: 3)\n",
-              "Coordinates:\n",
-              "  * x1                   (x1) int32 1 2 3\n",
-              "  * x2                   (x2) int32 1 2 3\n",
-              "  * time                 (time) datetime64[ns] 2012-06-12T12:00:02.968749046 ...\n",
-              "  * dir                  (dir) <U1 'X' 'Y' 'Z'\n",
-              "  * beam                 (beam) int32 1 2 3\n",
-              "  * earth                (earth) <U1 'E' 'N' 'U'\n",
-              "  * inst                 (inst) <U1 'X' 'Y' 'Z'\n",
-              "Data variables: (12/15)\n",
-              "    beam2inst_orientmat  (x1, x2) float64 2.709 -1.34 -1.364 ... -0.3438 -0.3499\n",
-              "    batt                 (time) float32 13.2 13.2 13.2 13.2 ... nan nan nan nan\n",
-              "    c_sound              (time) float32 1.493e+03 1.493e+03 ... nan nan\n",
-              "    heading              (time) float32 5.6 10.5 10.51 10.52 ... nan nan nan nan\n",
-              "    pitch                (time) float32 -31.5 -31.7 -31.69 ... nan nan nan\n",
-              "    roll                 (time) float32 0.4 4.2 4.253 4.306 ... nan nan nan nan\n",
-              "    ...                   ...\n",
-              "    orientation_down     (time) bool True True True True ... True True True True\n",
-              "    vel                  (dir, time) float32 -1.002 -1.008 -0.944 ... nan nan\n",
-              "    amp                  (beam, time) uint8 104 110 111 113 108 ... 0 0 0 0 0\n",
-              "    corr                 (beam, time) uint8 97 91 97 98 90 95 95 ... 0 0 0 0 0 0\n",
-              "    pressure             (time) float64 5.448 5.436 5.484 5.448 ... 0.0 0.0 0.0\n",
-              "    orientmat            (earth, inst, time) float32 0.0832 0.155 ... -0.7065\n",
-              "Attributes: (12/39)\n",
-              "    inst_make:                   Nortek\n",
-              "    inst_model:                  Vector\n",
-              "    inst_type:                   ADV\n",
-              "    rotate_vars:                 ['vel']\n",
-              "    n_beams:                     3\n",
-              "    profile_mode:                continuous\n",
-              "    ...                          ...\n",
-              "    recorder_size_bytes:         4074766336\n",
-              "    vel_range:                   normal\n",
-              "    firmware_version:            3.34\n",
-              "    fs:                          32.0\n",
-              "    coord_sys:                   inst\n",
-              "    has_imu:                     0
" - ], - "text/plain": [ - "\n", - "Dimensions: (x1: 3, x2: 3, time: 122912, dir: 3, beam: 3,\n", - " earth: 3, inst: 3)\n", - "Coordinates:\n", - " * x1 (x1) int32 1 2 3\n", - " * x2 (x2) int32 1 2 3\n", - " * time (time) datetime64[ns] 2012-06-12T12:00:02.968749046 ...\n", - " * dir (dir) : Nortek Vector\n", - " . 1.07 hours (started: Jun 12, 2012 12:00)\n", - " . inst-frame\n", - " . (122912 pings @ 32.0Hz)\n", - " Variables:\n", - " - time ('time',)\n", - " - vel ('dir', 'time')\n", - " - orientmat ('earth', 'inst', 'time')\n", - " - heading ('time',)\n", - " - pitch ('time',)\n", - " - roll ('time',)\n", - " - temp ('time',)\n", - " - pressure ('time',)\n", - " - amp ('beam', 'time')\n", - " - corr ('beam', 'time')\n", - " ... and others (see `.variables`)" - ] - }, - "execution_count": 4, - "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "ds_dolfyn = ds.velds\n", - "ds_dolfyn" - ] - }, + "cells": [ + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Reading ADV Data with MHKiT\n", + "\n", + "This example presents a simplified workflow for analyzing Acoustic Doppler Velocimetry (ADV) data using MHKiT. MHKiT incorporates the DOLfYN codebase as a module to handle ADV and Acoustic Doppler Current Profiler (ADCP) data.\n", + "\n", + "A standard ADV data analysis workflow can be segmented into the following steps:\n", + "\n", + "1. **Raw Data Review**: Evaluate the original data by verifying timestamps and assessing the quality of velocity data, specifically looking for any data spikes.\n", + "\n", + "2. **Data Cleaning**: Identify and eliminate any spurious data points. If needed, bad data points can be replaced with interpolated values.\n", + "\n", + "3. **Data Rotation**: Transform the data into the principal flow coordinates, which are the streamwise, cross-stream, and vertical directions.\n", + "\n", + "4. 
**Data Averaging**: Aggregate the data into bins or ensembles, each of which spans a predefined time length, typically between 5 and 10 minutes.\n", + "\n", + "5. **Statistical Analysis**: Compute turbulence statistics such as turbulence intensity, Turbulent Kinetic Energy (TKE), and Reynolds stresses for the observed flow field.\n", + "\n", + "Start your analysis by importing the necessary tools:" + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "metadata": {}, + "outputs": [ { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "## Quality Control" - ] - }, + "name": "stderr", + "output_type": "stream", + "text": [ + "c:\\Users\\mcve343\\Anaconda3\\lib\\site-packages\\xarray\\backends\\cfgrib_.py:29: UserWarning: Failed to load cfgrib - most likely there is a problem accessing the ecCodes library. Try `import cfgrib` to get the full error message\n", + " warnings.warn(\n" + ] + } + ], + "source": [ + "from mhkit import dolfyn\n", + "from mhkit.dolfyn.adv import api" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Read Raw Instrument Data" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "DOLfYN currently only carries support for the Nortek Vector ADV. The example loaded here is a short clip of data from a test deployment to show DOLfYN's capabilities.\n", + "\n", + "Start by reading in the raw datafile downloaded from the instrument. The `dolfyn.read` function reads the raw file and dumps the information into an xarray Dataset, which contains three groups of variables:\n", + "\n", + "1. Velocity, amplitude, and correlation of the Doppler velocimetry\n", + "2. Measurements of the instrument's bearing and environment\n", + "3. Orientation matrices DOLfYN uses for rotating through coordinate frames." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": { + "scrolled": true + }, + "outputs": [ { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "ADV velocity data tends to have spikes due to Doppler noise, and the common way to \"despike\" the data is by using the phase-space algorithm by Goring and Nikora (2002). DOLfYN integrates this function using a 2-step approach: create a logical mask where True corresponds to a spike detection, and then utilize an interpolation function to replace the spikes." - ] - }, + "name": "stdout", + "output_type": "stream", + "text": [ + "Reading file data/dolfyn/vector_data01.VEC ...\n" + ] + } + ], + "source": [ + "ds = dolfyn.read(\"data/dolfyn/vector_data01.VEC\")" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "There are two ways to see what's in a Dataset. The first is to simply type the dataset's name to see the standard xarray output. To access a particular variable in a dataset, use dict-style (`ds['vel']`) or attribute-style syntax (`ds.vel`). See the [xarray docs](http://xarray.pydata.org/en/stable/getting-started-guide/quick-overview.html) for more details on how to use the xarray format." + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": {}, + "outputs": [ { - "cell_type": "code", - "execution_count": 5, - "metadata": { - "scrolled": false - }, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Percent of data containing spikes: 0.73%\n" - ] - } + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "
<xarray.Dataset>\n",
+       "Dimensions:              (x1: 3, x2: 3, time: 122912, dir: 3, beam: 3,\n",
+       "                          earth: 3, inst: 3)\n",
+       "Coordinates:\n",
+       "  * x1                   (x1) int32 1 2 3\n",
+       "  * x2                   (x2) int32 1 2 3\n",
+       "  * time                 (time) datetime64[ns] 2012-06-12T12:00:02.968749046 ...\n",
+       "  * dir                  (dir) <U1 'X' 'Y' 'Z'\n",
+       "  * beam                 (beam) int32 1 2 3\n",
+       "  * earth                (earth) <U1 'E' 'N' 'U'\n",
+       "  * inst                 (inst) <U1 'X' 'Y' 'Z'\n",
+       "Data variables: (12/15)\n",
+       "    beam2inst_orientmat  (x1, x2) float64 2.709 -1.34 -1.364 ... -0.3438 -0.3499\n",
+       "    batt                 (time) float32 13.2 13.2 13.2 13.2 ... nan nan nan nan\n",
+       "    c_sound              (time) float32 1.493e+03 1.493e+03 ... nan nan\n",
+       "    heading              (time) float32 5.6 10.5 10.51 10.52 ... nan nan nan nan\n",
+       "    pitch                (time) float32 -31.5 -31.7 -31.69 ... nan nan nan\n",
+       "    roll                 (time) float32 0.4 4.2 4.253 4.306 ... nan nan nan nan\n",
+       "    ...                   ...\n",
+       "    orientation_down     (time) bool True True True True ... True True True True\n",
+       "    vel                  (dir, time) float32 -1.002 -1.008 -0.944 ... nan nan\n",
+       "    amp                  (beam, time) uint8 104 110 111 113 108 ... 0 0 0 0 0\n",
+       "    corr                 (beam, time) uint8 97 91 97 98 90 95 95 ... 0 0 0 0 0 0\n",
+       "    pressure             (time) float64 5.448 5.436 5.484 5.448 ... 0.0 0.0 0.0\n",
+       "    orientmat            (earth, inst, time) float32 0.0832 0.155 ... -0.7065\n",
+       "Attributes: (12/39)\n",
+       "    inst_make:                   Nortek\n",
+       "    inst_model:                  Vector\n",
+       "    inst_type:                   ADV\n",
+       "    rotate_vars:                 ['vel']\n",
+       "    n_beams:                     3\n",
+       "    profile_mode:                continuous\n",
+       "    ...                          ...\n",
+       "    recorder_size_bytes:         4074766336\n",
+       "    vel_range:                   normal\n",
+       "    firmware_version:            3.34\n",
+       "    fs:                          32.0\n",
+       "    coord_sys:                   inst\n",
+       "    has_imu:                     0
" ], - "source": [ - "# Clean the file using the Goring+Nikora method:\n", - "mask = api.clean.GN2002(ds.vel, npt=5000)\n", - "# Replace bad datapoints via cubic spline interpolation\n", - "ds['vel'] = api.clean.clean_fill(ds['vel'], mask, npt=12, method='cubic', maxgap=None)\n", - "\n", - "print('Percent of data containing spikes: {0:.2f}%'.format(100*mask.mean()))\n", - "\n", - "# If interpolation isn't desired:\n", - "ds_nan = ds.copy(deep=True)\n", - "ds_nan.coords['mask'] = (('dir','time'), ~mask)\n", - "ds_nan['vel'] = ds_nan['vel'].where(ds_nan['mask'])" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "## Coordinate Rotations" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "Now that the data has been cleaned, the next step is to rotate the velocity data into true East, North, Up (ENU) coordinates.\n", - "\n", - "ADVs use an internal compass or magnetometer to determine magnetic ENU directions. The `set_declination` function takes the user supplied magnetic declination (which can be looked up online for specific coordinates) and adjusts the orientation matrix saved within the dataset.\n", - "\n", - "Instruments save vector data in the coordinate system specified in the deployment configuration file. To make the data useful, it must be rotated through coordinate systems (\"beam\"<->\"inst\"<->\"earth\"<->\"principal\"), done through the `rotate2` function. If the \"earth\" (ENU) coordinate system is specified, DOLfYN will automatically rotate the dataset through the necessary coordinate systems to get there. The `inplace` set as true will alter the input dataset \"in place\", a.k.a. it not create a new dataset." 
- ] - }, - { - "cell_type": "code", - "execution_count": 6, - "metadata": {}, - "outputs": [], - "source": [ - "# First set the magnetic declination\n", - "dolfyn.set_declination(ds, declin=10, inplace=True) # declination points 10 degrees East\n", - "\n", - "# Rotate that data from the instrument to earth frame (ENU):\n", - "dolfyn.rotate2(ds, 'earth', inplace=True)" + "text/plain": [ + "\n", + "Dimensions: (x1: 3, x2: 3, time: 122912, dir: 3, beam: 3,\n", + " earth: 3, inst: 3)\n", + "Coordinates:\n", + " * x1 (x1) int32 1 2 3\n", + " * x2 (x2) int32 1 2 3\n", + " * time (time) datetime64[ns] 2012-06-12T12:00:02.968749046 ...\n", + " * dir (dir) : Nortek Vector\n", + " . 1.07 hours (started: Jun 12, 2012 12:00)\n", + " . inst-frame\n", + " . (122912 pings @ 32.0Hz)\n", + " Variables:\n", + " - time ('time',)\n", + " - vel ('dir', 'time')\n", + " - orientmat ('earth', 'inst', 'time')\n", + " - heading ('time',)\n", + " - pitch ('time',)\n", + " - roll ('time',)\n", + " - temp ('time',)\n", + " - pressure ('time',)\n", + " - amp ('beam', 'time')\n", + " - corr ('beam', 'time')\n", + " ... and others (see `.variables`)" ] - }, + }, + "execution_count": 4, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "ds_dolfyn = ds.velds\n", + "ds_dolfyn" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Quality Control" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "ADV velocity data tends to have spikes due to Doppler noise, and the common way to \"despike\" the data is by using the phase-space algorithm by Goring and Nikora (2002). DOLfYN integrates this function using a 2-step approach: create a logical mask where True corresponds to a spike detection, and then utilize an interpolation function to replace the spikes." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": { + "scrolled": false + }, + "outputs": [ { - "cell_type": "code", - "execution_count": 10, - "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "Text(0.5, 1.0, 'Streamwise Direction')" - ] - }, - "execution_count": 10, - "metadata": {}, - "output_type": "execute_result" - }, - { - "data": { - "image/png": "", - "text/plain": [ - "
" - ] - }, - "metadata": { - "needs_background": "light" - }, - "output_type": "display_data" - } - ], - "source": [ - "import matplotlib.pyplot as plt\n", - "%matplotlib inline\n", - "\n", - "plt.figure()\n", - "plt.loglog(ds_binned['freq'], ds_binned['auto_spectra'].sel(S='Sxx').mean(dim='time'))\n", - "plt.xlabel('Frequency [Hz]')\n", - "plt.ylabel('Energy Density $\\mathrm{[m^2/s^s/Hz]}$')\n", - "plt.title('Streamwise Direction')" - ] - }, + "name": "stdout", + "output_type": "stream", + "text": [ + "Percent of data containing spikes: 0.73%\n" + ] + } + ], + "source": [ + "# Clean the file using the Goring+Nikora method:\n", + "mask = api.clean.GN2002(ds.vel, npt=5000)\n", + "# Replace bad datapoints via cubic spline interpolation\n", + "ds[\"vel\"] = api.clean.clean_fill(ds[\"vel\"], mask, npt=12, method=\"cubic\", maxgap=None)\n", + "\n", + "print(\"Percent of data containing spikes: {0:.2f}%\".format(100 * mask.mean()))\n", + "\n", + "# If interpolation isn't desired:\n", + "ds_nan = ds.copy(deep=True)\n", + "ds_nan.coords[\"mask\"] = ((\"dir\", \"time\"), ~mask)\n", + "ds_nan[\"vel\"] = ds_nan[\"vel\"].where(ds_nan[\"mask\"])" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Coordinate Rotations" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Now that the data has been cleaned, the next step is to rotate the velocity data into true East, North, Up (ENU) coordinates.\n", + "\n", + "ADVs use an internal compass or magnetometer to determine magnetic ENU directions. The `set_declination` function takes the user supplied magnetic declination (which can be looked up online for specific coordinates) and adjusts the orientation matrix saved within the dataset.\n", + "\n", + "Instruments save vector data in the coordinate system specified in the deployment configuration file. 
To make the data useful, it must be rotated through coordinate systems (\"beam\"<->\"inst\"<->\"earth\"<->\"principal\"), done through the `rotate2` function. If the \"earth\" (ENU) coordinate system is specified, DOLfYN will automatically rotate the dataset through the necessary coordinate systems to get there. Setting `inplace` to true will alter the input dataset \"in place\", i.e., it will not create a new dataset." + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": {}, + "outputs": [], + "source": [ + "# First set the magnetic declination\n", + "dolfyn.set_declination(\n", + " ds, declin=10, inplace=True\n", + ") # declination points 10 degrees East\n", + "\n", + "# Rotate that data from the instrument to earth frame (ENU):\n", + "dolfyn.rotate2(ds, \"earth\", inplace=True)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Once in the true ENU frame of reference, we can calculate the principal flow direction for the velocity data and rotate it into the principal frame of reference (streamwise, cross-stream, vertical). Principal flow directions are aligned with and orthogonal to the flow streamlines at the measurement location. \n", + "\n", + "First, the principal flow direction must be calculated through `calc_principal_heading`. As a standard for DOLfYN functions, those that begin with \"calc_*\" require the velocity data for input. This function is different from others in DOLfYN in that it requires placing the output in an attribute called \"principal_heading\", as shown below.\n", + "\n", + "Again we use `rotate2` to change coordinate systems." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 7, + "metadata": {}, + "outputs": [], + "source": [ + "ds.attrs[\"principal_heading\"] = dolfyn.calc_principal_heading(ds[\"vel\"])\n", + "dolfyn.rotate2(ds, \"principal\", inplace=True)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Averaging Data\n", + "The next step in ADV analysis is to average the velocity data into time bins (ensembles). These averaged values are then used to calculate turbulence statistics. There are two distinct methods for performing this operation, both of which utilize the same variable inputs and produce identical datasets.\n", + "\n", + "1. **Object-Oriented Approach** (standard): Define an 'averaging object', create a dataset binned in time, and calculate basic turbulence statistics. This is accomplished by instantiating an object from the ADVBinner class and then feeding that object with our dataset.\n", + "\n", + "2. **Functional Approach** (simple): The same operations can be performed using the functional counterpart of ADVBinner, turbulence_statistics.\n", + "\n", + "Function inputs shown here are the dataset itself, plus: \n", + " - `n_bin`: the number of elements in each bin; \n", + " - `fs`: the ADV's sampling frequency in Hz; \n", + " - `n_fft`: optional, the number of elements per FFT for spectral analysis; \n", + " - `freq_units`: optional, either in Hz or rad/s, of the calculated spectral frequency vector.\n", + "\n", + "All of the variables in the returned dataset have been bin-averaged, where each average is computed using the number of elements specified in `n_bin`. Additional variables in this dataset include the turbulent kinetic energy (TKE) vector (\"ds_binned.tke_vec\"), the Reynolds stresses (\"ds_binned.stress\"), and the power spectral densities (\"ds_binned.psd\"), calculated for each bin." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 8, + "metadata": { + "scrolled": true + }, + "outputs": [], + "source": [ + "# Option 1 (standard)\n", + "binner = api.ADVBinner(n_bin=ds.fs * 600, fs=ds.fs, n_fft=1024)\n", + "ds_binned = binner.bin_average(ds)\n", + "\n", + "# Option 2 (simple)\n", + "# ds_binned = api.calc_turbulence(ds, n_bin=ds.fs*600, fs=ds.fs, n_fft=1024, freq_units=\"Hz\")" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "The benefit to using `ADVBinner` is that one has access to all of the velocity and turbulence analysis functions that DOLfYN contains. If basic analysis will suffice, the `turbulence_statistics` function is the most convenient. Either option can still utilize DOLfYN's shortcuts.\n", + "\n", + "See the [DOLfYN API](https://dolfyn.readthedocs.io/en/latest/apidoc/dolfyn.binners.html) for the full list of functions and shortcuts. A few examples are shown below.\n", + "\n", + "Some things to know:\n", + "- All functions operate bin-by-bin.\n", + "- Some functions will fail if there are NaN's in the data stream (Notably the PSD functions)\n", + "- \"Shortcuts\", as referred to in DOLfYN, are functions accessible by the xarray accessor `velds`, as shown below. The \"shortcuts\" available through `velds` are listed [here](https://dolfyn.readthedocs.io/en/latest/apidoc/dolfyn.shortcuts.html). Some shortcut variables require the raw dataset, some an averaged dataset.\n", + "\n", + "For instance, \n", + "- `bin_variance` calculates the binned-variance of each variable in the raw dataset, the complement to `bin_average`. Variables returned by this function contain a \"_var\" suffix to their name.\n", + "- `cross_spectral_density` calculates the cross spectral power density between each direction of the supplied DataArray. 
Note that inputs specified in creating the `ADVBinner` object can be overridden or additionally specified for a particular function call.\n", + "- `velds.I` is the shortcut for turbulence intensity. This particular shortcut requires a dataset created by `bin_average`, because it requires bin-averaged data to calculate.\n" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "metadata": { + "scrolled": true + }, + "outputs": [], + "source": [ + "# Calculate the variance of each variable in the dataset and add to the averaged dataset\n", + "ds_binned = binner.bin_variance(ds, out_ds=ds_binned)\n", + "\n", + "# Calculate the power spectral density\n", + "ds_binned[\"auto_spectra\"] = binner.power_spectral_density(ds[\"vel\"], freq_units=\"Hz\")\n", + "# Calculate dissipation rate from isotropic turbulence cascade\n", + "ds_binned[\"dissipation\"] = binner.dissipation_rate_LT83(\n", + " ds_binned[\"auto_spectra\"], ds_binned.velds.U_mag, freq_range=[0.5, 1]\n", + ")\n", + "\n", + "# Calculate the cross power spectral density\n", + "ds_binned[\"cross_spectra\"] = binner.cross_spectral_density(\n", + " ds[\"vel\"], freq_units=\"Hz\", n_fft_coh=512\n", + ")\n", + "\n", + "# Calculated the turbulence intensity (requires a binned dataset)\n", + "ds_binned[\"TI\"] = ds_binned.velds.I" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Plotting can be performed using matplotlib. As an example, the mean spectrum in the streamwise direction is plotted here. This spectrum shows the mean energy density in the flow at a particular flow frequency." + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "metadata": {}, + "outputs": [ { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "## Saving and Loading DOLfYN datasets\n", - "Datasets can be saved and reloaded using the `save` and `load` functions. 
Xarray is saved natively in netCDF format, hence the \".nc\" extension.\n", - "\n", - "Note: DOLfYN datasets cannot be saved using xarray's native `ds.to_netcdf`; however, DOLfYN datasets can be opened using `xarray.open_dataset`." + "data": { + "text/plain": [ + "Text(0.5, 1.0, 'Streamwise Direction')" ] + }, + "execution_count": 10, + "metadata": {}, + "output_type": "execute_result" }, { - "cell_type": "code", - "execution_count": 11, - "metadata": {}, - "outputs": [], - "source": [ - "# Uncomment these lines to save and load to your current working directory\n", - "#dolfyn.save(ds, 'your_data.nc')\n", - "#ds_saved = dolfyn.load('your_data.nc')" + "data": { + "image/png": "", + "text/plain": [ + "
" ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" } - ], - "metadata": { - "kernelspec": { - "display_name": "Python 3.9.12 ('base')", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.9.15" - }, - "vscode": { - "interpreter": { - "hash": "357206ab7e4935423e95e994af80e27e7e6c0672abcebb9d86ab743298213348" - } - } + ], + "source": [ + "import matplotlib.pyplot as plt\n", + "\n", + "%matplotlib inline\n", + "\n", + "plt.figure()\n", + "plt.loglog(ds_binned[\"freq\"], ds_binned[\"auto_spectra\"].sel(S=\"Sxx\").mean(dim=\"time\"))\n", + "plt.xlabel(\"Frequency [Hz]\")\n", + "plt.ylabel(\"Energy Density $\\mathrm{[m^2/s^s/Hz]}$\")\n", + "plt.title(\"Streamwise Direction\")" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Saving and Loading DOLfYN datasets\n", + "Datasets can be saved and reloaded using the `save` and `load` functions. Xarray is saved natively in netCDF format, hence the \".nc\" extension.\n", + "\n", + "Note: DOLfYN datasets cannot be saved using xarray's native `ds.to_netcdf`; however, DOLfYN datasets can be opened using `xarray.open_dataset`." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 11, + "metadata": {}, + "outputs": [], + "source": [ + "# Uncomment these lines to save and load to your current working directory\n", + "# dolfyn.save(ds, 'your_data.nc')\n", + "# ds_saved = dolfyn.load('your_data.nc')" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3.9.12 ('base')", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.9.15" }, - "nbformat": 4, - "nbformat_minor": 4 + "vscode": { + "interpreter": { + "hash": "357206ab7e4935423e95e994af80e27e7e6c0672abcebb9d86ab743298213348" + } + } + }, + "nbformat": 4, + "nbformat_minor": 4 } diff --git a/examples/cdip_example.ipynb b/examples/cdip_example.ipynb index f435d6b76..df2cee51c 100644 --- a/examples/cdip_example.ipynb +++ b/examples/cdip_example.ipynb @@ -51,16 +51,21 @@ "source": [ "from mhkit.wave.io import cdip\n", "import matplotlib.pyplot as plt\n", - "station_number = '100'\n", - "start_date = '2020-04-01'\n", - "end_date= '2020-04-30'\n", - "parameters =['waveHs', 'waveTp', 'waveMeanDirection']\n", "\n", - "data = cdip.request_parse_workflow(station_number=station_number, parameters=parameters, \n", - " start_date=start_date, end_date=end_date)\n", + "station_number = \"100\"\n", + "start_date = \"2020-04-01\"\n", + "end_date = \"2020-04-30\"\n", + "parameters = [\"waveHs\", \"waveTp\", \"waveMeanDirection\"]\n", "\n", - "print('\\n')\n", - "print(f'Returned data: {data.keys()} \\n')\n" + "data = cdip.request_parse_workflow(\n", + " station_number=station_number,\n", + " parameters=parameters,\n", + " start_date=start_date,\n", + " end_date=end_date,\n", + ")\n", + "\n", + "print(\"\\n\")\n", + "print(f\"Returned data: {data.keys()} \\n\")" ] }, { @@ -82,8 +87,8 @@ "metadata": 
{}, "outputs": [], "source": [ - "station_number='100'\n", - "data_type='historic'\n", + "station_number = \"100\"\n", + "data_type = \"historic\"\n", "nc = cdip.request_netCDF(station_number, data_type)" ] }, @@ -113,7 +118,7 @@ "source": [ "buoy_data = cdip.get_netcdf_variables(nc)\n", "\n", - "print(f'Returned data: {buoy_data.keys()} \\n')" + "print(f\"Returned data: {buoy_data.keys()} \\n\")" ] }, { @@ -405,7 +410,7 @@ } ], "source": [ - "buoy_data['metadata'].keys()" + "buoy_data[\"metadata\"].keys()" ] }, { @@ -447,7 +452,7 @@ } ], "source": [ - "buoy_data['metadata']['meta']\n" + "buoy_data[\"metadata\"][\"meta\"]" ] }, { @@ -481,7 +486,7 @@ } ], "source": [ - "Hs_2011_data = buoy_data[\"data\"][\"wave\"][\"waveHs\"]['2011']\n", + "Hs_2011_data = buoy_data[\"data\"][\"wave\"][\"waveHs\"][\"2011\"]\n", "buoy_name = buoy_data[\"data\"][\"wave\"].name\n", "ax = graphics.plot_boxplot(Hs_2011_data, buoy_title=buoy_name)" ] @@ -514,12 +519,12 @@ } ], "source": [ - "wave_data_May_2011= buoy_data['data']['wave']['2011-05']\n", - "Hs = wave_data_May_2011['waveHs']\n", - "Tp = wave_data_May_2011['waveTp']\n", - "Dp = wave_data_May_2011['waveDp']\n", + "wave_data_May_2011 = buoy_data[\"data\"][\"wave\"][\"2011-05\"]\n", + "Hs = wave_data_May_2011[\"waveHs\"]\n", + "Tp = wave_data_May_2011[\"waveTp\"]\n", + "Dp = wave_data_May_2011[\"waveDp\"]\n", "\n", - "ax = graphics.plot_compendium(Hs, Tp, Dp, buoy_name )" + "ax = graphics.plot_compendium(Hs, Tp, Dp, buoy_name)" ] }, { @@ -555,7 +560,9 @@ } ], "source": [ - "buoy_data = cdip.get_netcdf_variables(nc, start_date='2011-01-01', end_date='2011-12-31', parameters='waveHs')\n", + "buoy_data = cdip.get_netcdf_variables(\n", + " nc, start_date=\"2011-01-01\", end_date=\"2011-12-31\", parameters=\"waveHs\"\n", + ")\n", "buoy_name = buoy_data[\"data\"][\"wave\"].name\n", "ax = graphics.plot_boxplot(buoy_data[\"data\"][\"wave\"][\"waveHs\"], buoy_title=buoy_name)" ] @@ -566,7 +573,9 @@ "source": [ "## 4.b. 
`request_parse_workflow`\n", "\n", - "In the previous example we requested the NetCDF file and then processed the data. This workflow has been codified into a single function to streamline the process and adds additional functionality as well. The `request_parse_workflow` function accepts a netCDF object or a station number. This means the user may pass a CDIP ndetCDF file loaded from file, pull the data with `request_netcdf` and then pass, or just pass a station number letting the function know what data to parse and return. Secondly, the `request_parse_workflow` function accepts parameters allowing the user to specify to only return specific parameters reducing processing requirements. This is especially useful for processing 2D data which is only processed is specifically requested due to the amount of time it takes to process all the 2D data. Next, `request_parse_workflow` will slice on time by years, start_date, or end date. Years can be a single integer or a list of integers and is not required to be consecutive. If specified the start date will remove any data prior to the specified string (e.g. '2011-01-01') and end_date will remove any data after the speficied date. start_date and end_date may be used together, seperatly or not at all. Years works indpendently of start and end date. Next, the data_type defaults to historic but specifying this as realtime will return realtime data from the buoy. Lastly, there is a the boolean `all_2D_variables`. If set to true the function will return all of the wave 2D variables. It is not reccomended to do this due to the computational expense to do so, Instead it is reccomended to specify 2D quantities of interest using the `parameters` keyword.\n", + "In the previous example we requested the NetCDF file and then processed the data. This workflow has been codified into a single function to streamline the process and adds additional functionality as well. 
The `request_parse_workflow` function accepts a netCDF object or a station number. This means the user may pass a CDIP netCDF file loaded from file, pull the data with `request_netCDF` and then pass, or just pass a station number letting the function know what data to parse and return. Secondly, the `request_parse_workflow` function accepts parameters allowing the user to specify to only return specific parameters reducing processing requirements. This is especially useful for processing 2D data which is only processed if specifically requested due to the amount of time it takes to process all the 2D data. A print statement indicates whether the function is currently still processing 2D variables. Use the `silent=True` keyword argument to turn off this print statement in production environments.\n", + "\n", + "Next, `request_parse_workflow` will slice on time by years, start_date, or end date. Years can be a single integer or a list of integers and is not required to be consecutive. If specified the start date will remove any data prior to the specified string (e.g. '2011-01-01') and end_date will remove any data after the specified date. start_date and end_date may be used together, separately or not at all. Years works independently of start and end date. Next, the data_type defaults to historic but specifying this as realtime will return realtime data from the buoy. Lastly, there is the boolean `all_2D_variables`. If set to true the function will return all of the wave 2D variables. It is not recommended to do this due to the computational expense to do so. Instead it is recommended to specify 2D quantities of interest using the `parameters` keyword.\n", "\n", "For an example we will create a compendium of HS for the year 2011 from the nc file requested earlier. 
In this case we can use the years parameter instead of start and end dates.\n" ] @@ -590,13 +599,15 @@ } ], "source": [ - "buoy_data = cdip.request_parse_workflow(station_number='100', years=2011, parameters=['waveHs', 'waveTp', 'waveDp'])\n", + "buoy_data = cdip.request_parse_workflow(\n", + " station_number=\"100\", years=2011, parameters=[\"waveHs\", \"waveTp\", \"waveDp\"]\n", + ")\n", "\n", - "Hs = buoy_data['data']['wave']['waveHs']\n", - "Tp = buoy_data['data']['wave']['waveTp']\n", - "Dp = buoy_data['data']['wave']['waveDp']\n", + "Hs = buoy_data[\"data\"][\"wave\"][\"waveHs\"]\n", + "Tp = buoy_data[\"data\"][\"wave\"][\"waveTp\"]\n", + "Dp = buoy_data[\"data\"][\"wave\"][\"waveDp\"]\n", "buoy_name = buoy_data[\"data\"][\"wave\"].name\n", - "ax = graphics.plot_compendium(Hs, Tp, Dp, buoy_name )" + "ax = graphics.plot_compendium(Hs, Tp, Dp, buoy_name)" ] }, { diff --git a/examples/data/dolfyn/RDI_7f79_2.000 b/examples/data/dolfyn/RDI_7f79_2.000 new file mode 100644 index 000000000..f1d773c2a Binary files /dev/null and b/examples/data/dolfyn/RDI_7f79_2.000 differ diff --git a/examples/data/dolfyn/dual_profile.ad2cp b/examples/data/dolfyn/dual_profile.ad2cp new file mode 100644 index 000000000..7839b3285 Binary files /dev/null and b/examples/data/dolfyn/dual_profile.ad2cp differ diff --git a/examples/data/dolfyn/test_data/AWAC_test01.nc b/examples/data/dolfyn/test_data/AWAC_test01.nc index d15ed510e..bcb760986 100644 Binary files a/examples/data/dolfyn/test_data/AWAC_test01.nc and b/examples/data/dolfyn/test_data/AWAC_test01.nc differ diff --git a/examples/data/dolfyn/test_data/AWAC_test01_clean.nc b/examples/data/dolfyn/test_data/AWAC_test01_clean.nc index 90d68996d..96613baf0 100644 Binary files a/examples/data/dolfyn/test_data/AWAC_test01_clean.nc and b/examples/data/dolfyn/test_data/AWAC_test01_clean.nc differ diff --git a/examples/data/dolfyn/test_data/AWAC_test01_earth2inst.nc b/examples/data/dolfyn/test_data/AWAC_test01_earth2inst.nc index 
5657ea3d1..6d2946c83 100644 Binary files a/examples/data/dolfyn/test_data/AWAC_test01_earth2inst.nc and b/examples/data/dolfyn/test_data/AWAC_test01_earth2inst.nc differ diff --git a/examples/data/dolfyn/test_data/AWAC_test01_earth2principal.nc b/examples/data/dolfyn/test_data/AWAC_test01_earth2principal.nc index c45535ca1..f5b5c3256 100644 Binary files a/examples/data/dolfyn/test_data/AWAC_test01_earth2principal.nc and b/examples/data/dolfyn/test_data/AWAC_test01_earth2principal.nc differ diff --git a/examples/data/dolfyn/test_data/AWAC_test01_inst2beam.nc b/examples/data/dolfyn/test_data/AWAC_test01_inst2beam.nc index 6b8b687b7..3ccd55d68 100644 Binary files a/examples/data/dolfyn/test_data/AWAC_test01_inst2beam.nc and b/examples/data/dolfyn/test_data/AWAC_test01_inst2beam.nc differ diff --git a/examples/data/dolfyn/test_data/AWAC_test01_ud.nc b/examples/data/dolfyn/test_data/AWAC_test01_ud.nc index dc3555932..e7dfa248f 100644 Binary files a/examples/data/dolfyn/test_data/AWAC_test01_ud.nc and b/examples/data/dolfyn/test_data/AWAC_test01_ud.nc differ diff --git a/examples/data/dolfyn/test_data/BenchFile01.nc b/examples/data/dolfyn/test_data/BenchFile01.nc index fc3f4bcdc..3b2af8fc4 100644 Binary files a/examples/data/dolfyn/test_data/BenchFile01.nc and b/examples/data/dolfyn/test_data/BenchFile01.nc differ diff --git a/examples/data/dolfyn/test_data/BenchFile01.repr.txt b/examples/data/dolfyn/test_data/BenchFile01.repr.txt index 557298fc2..5e5d563c7 100644 --- a/examples/data/dolfyn/test_data/BenchFile01.repr.txt +++ b/examples/data/dolfyn/test_data/BenchFile01.repr.txt @@ -4,6 +4,7 @@ . 
(100 pings @ 2Hz) Variables: - time ('time',) + - time_altraw ('time_altraw',) - time_b5 ('time_b5',) - vel ('dir', 'range', 'time') - vel_b5 ('range_b5', 'time_b5') @@ -14,6 +15,8 @@ - roll ('time',) - temp ('time',) - pressure ('time',) + - pressure_alt ('time',) + - pressure_altraw ('time_altraw',) - amp ('beam', 'range', 'time') - amp_b5 ('range_b5', 'time_b5') - corr ('beam', 'range', 'time') diff --git a/examples/data/dolfyn/test_data/BenchFile01_avg.nc b/examples/data/dolfyn/test_data/BenchFile01_avg.nc index ddd0e0327..24d488138 100644 Binary files a/examples/data/dolfyn/test_data/BenchFile01_avg.nc and b/examples/data/dolfyn/test_data/BenchFile01_avg.nc differ diff --git a/examples/data/dolfyn/test_data/BenchFile01_crop.nc b/examples/data/dolfyn/test_data/BenchFile01_crop.nc new file mode 100644 index 000000000..278a872bf Binary files /dev/null and b/examples/data/dolfyn/test_data/BenchFile01_crop.nc differ diff --git a/examples/data/dolfyn/test_data/BenchFile01_rotate_beam2inst.nc b/examples/data/dolfyn/test_data/BenchFile01_rotate_beam2inst.nc index dc10c6ef6..2004de5f4 100644 Binary files a/examples/data/dolfyn/test_data/BenchFile01_rotate_beam2inst.nc and b/examples/data/dolfyn/test_data/BenchFile01_rotate_beam2inst.nc differ diff --git a/examples/data/dolfyn/test_data/BenchFile01_rotate_earth2principal.nc b/examples/data/dolfyn/test_data/BenchFile01_rotate_earth2principal.nc index 5acd192b1..a71cbbbdd 100644 Binary files a/examples/data/dolfyn/test_data/BenchFile01_rotate_earth2principal.nc and b/examples/data/dolfyn/test_data/BenchFile01_rotate_earth2principal.nc differ diff --git a/examples/data/dolfyn/test_data/BenchFile01_rotate_inst2earth.nc b/examples/data/dolfyn/test_data/BenchFile01_rotate_inst2earth.nc index 2a8e4b67c..bbfeaf37e 100644 Binary files a/examples/data/dolfyn/test_data/BenchFile01_rotate_inst2earth.nc and b/examples/data/dolfyn/test_data/BenchFile01_rotate_inst2earth.nc differ diff --git 
a/examples/data/dolfyn/test_data/H-AWAC_test01.nc b/examples/data/dolfyn/test_data/H-AWAC_test01.nc index 0c87e671c..880168335 100644 Binary files a/examples/data/dolfyn/test_data/H-AWAC_test01.nc and b/examples/data/dolfyn/test_data/H-AWAC_test01.nc differ diff --git a/examples/data/dolfyn/test_data/RDI_7f79_2.nc b/examples/data/dolfyn/test_data/RDI_7f79_2.nc new file mode 100644 index 000000000..4874189da Binary files /dev/null and b/examples/data/dolfyn/test_data/RDI_7f79_2.nc differ diff --git a/examples/data/dolfyn/test_data/RDI_withBT.dolfyn.log b/examples/data/dolfyn/test_data/RDI_withBT.dolfyn.log index 4ec945bdf..d79f07fcd 100644 --- a/examples/data/dolfyn/test_data/RDI_withBT.dolfyn.log +++ b/examples/data/dolfyn/test_data/RDI_withBT.dolfyn.log @@ -1,33 +1,29 @@ root - INFO - pos 2 root - INFO - cfgid0: [7f, 7f] -root - INFO - ###In checkheader. -root - INFO - pos 2 -root - INFO - ###Leaving checkheader. root - INFO - {'nbyte': 579, 'dat_offsets': array([ 20, 79, 144, 282, 352, 422, 492])} root - INFO - pos 20 -root - INFO - pos 20 id 0 +root - INFO - id 0 offset 20 +root - INFO - Number of cells set to 17 +root - INFO - Cell size set to 1.0 root - INFO - Read Config root - INFO - Read Fixed -root - INFO - pos 79 id 128 -root - INFO - pos 144 id 256 -root - INFO - pos 282 id 512 -root - INFO - pos 352 id 768 -root - INFO - pos 422 id 1024 -root - INFO - pos 492 id 1536 +root - INFO - id 128 offset 79 +root - INFO - id 256 offset 144 +root - INFO - id 512 offset 282 +root - INFO - id 768 offset 352 +root - INFO - id 1024 offset 422 +root - INFO - id 1536 offset 492 root - INFO - Done: {'prog_ver': 51.41, 'inst_model': 'Workhorse', 'beam_angle': 20, 'freq': 600, 'beam_pattern': 'convex', 'orientation': 'down', 'n_beams': 4, 'n_cells': 17, 'pings_per_ensemble': 1, 'cell_size': 1.0, 'blank_dist': 0.88, 'profiling_mode': 1, 'min_corr_threshold': 64, 'n_code_reps': 5, 'min_prcnt_gd': 0, 'max_error_vel': 2.0, 'sec_between_ping_groups': 0.5, 'coord_sys': 'earth', 
'use_pitchroll': 'yes', 'use_3beam': 'yes', 'bin_mapping': 'yes', 'heading_misalign_deg': 0.0, 'magnetic_var_deg': 0.0, 'sensors_src': '01111101', 'sensors_avail': '00111101', 'bin1_dist_m': 2.09, 'transmit_pulse_m': 1.18, 'water_ref_cells': [1, 5], 'false_target_threshold': 50, 'transmit_lag_m': 0.24, 'bandwidth': 0, 'power_level': 255, 'serialnum': 18655} root - INFO - self._bb False -root - INFO - {} -root - INFO - 1723 pings estimated in this file -root - INFO - taking data from pings 0 - 1723 -root - INFO - 1723 ensembles will be produced. +root - INFO - self.cfgbb: {} +root - INFO - taking data from pings 0 - 1721 +root - INFO - 1721 ensembles will be produced. root - INFO - 17 ncells, not BB root - DEBUG - pos 0mb/1mb -root - INFO - -->In search_buffer... -root - INFO - ###In checkheader. root - INFO - pos 2 -root - INFO - ###Leaving checkheader. +root - INFO - cfgid0: [7f, 7f] root - INFO - Read Header root - INFO - n 0: 0 0000 root - DEBUG - pos: 22, pos_: 0, nbyte: 18, k: -1, byte_offset: -1 @@ -75,10 +71,8 @@ root - INFO - success! root - DEBUG - pos: 581, pos_: 0, nbyte: 85, k: 0, byte_offset: 577 root - DEBUG - pos 0mb/1mb -root - INFO - -->In search_buffer... -root - INFO - ###In checkheader. root - INFO - pos 583 -root - INFO - ###Leaving checkheader. +root - INFO - cfgid0: [7f, 7f] root - INFO - Read Header root - INFO - n 0: 0 0000 root - DEBUG - pos: 603, pos_: 0, nbyte: 18, k: -1, byte_offset: -1 @@ -99,3 +93,9 @@ root - DEBUG - Trying to Read 256 root - INFO - Reading code 0x100... root - INFO - Read Vel root - INFO - success! +root - INFO - n 3: 512 0200 +root - DEBUG - pos: 865, pos_: 0, nbyte: 138, k: 0, byte_offset: -1 +root - DEBUG - Trying to Read 512 +root - INFO - Reading code 0x200... +root - INFO - Read Corr +root - INFO - success! 
diff --git a/examples/data/dolfyn/test_data/RiverPro_test01.nc b/examples/data/dolfyn/test_data/RiverPro_test01.nc index 7fa3e6d34..719ad6102 100644 Binary files a/examples/data/dolfyn/test_data/RiverPro_test01.nc and b/examples/data/dolfyn/test_data/RiverPro_test01.nc differ diff --git a/examples/data/dolfyn/test_data/Sig1000_BadTime01.nc b/examples/data/dolfyn/test_data/Sig1000_BadTime01.nc index 790d1e578..de929e2e4 100644 Binary files a/examples/data/dolfyn/test_data/Sig1000_BadTime01.nc and b/examples/data/dolfyn/test_data/Sig1000_BadTime01.nc differ diff --git a/examples/data/dolfyn/test_data/Sig1000_IMU.nc b/examples/data/dolfyn/test_data/Sig1000_IMU.nc index bee45bdb1..397475f51 100644 Binary files a/examples/data/dolfyn/test_data/Sig1000_IMU.nc and b/examples/data/dolfyn/test_data/Sig1000_IMU.nc differ diff --git a/examples/data/dolfyn/test_data/Sig1000_IMU_bin.nc b/examples/data/dolfyn/test_data/Sig1000_IMU_bin.nc deleted file mode 100644 index 317293a7f..000000000 Binary files a/examples/data/dolfyn/test_data/Sig1000_IMU_bin.nc and /dev/null differ diff --git a/examples/data/dolfyn/test_data/Sig1000_IMU_ofilt.nc b/examples/data/dolfyn/test_data/Sig1000_IMU_ofilt.nc index 51c45f146..b46762be3 100644 Binary files a/examples/data/dolfyn/test_data/Sig1000_IMU_ofilt.nc and b/examples/data/dolfyn/test_data/Sig1000_IMU_ofilt.nc differ diff --git a/examples/data/dolfyn/test_data/Sig1000_IMU_rotate_beam2inst.nc b/examples/data/dolfyn/test_data/Sig1000_IMU_rotate_beam2inst.nc index 2edd41f60..6c3337157 100644 Binary files a/examples/data/dolfyn/test_data/Sig1000_IMU_rotate_beam2inst.nc and b/examples/data/dolfyn/test_data/Sig1000_IMU_rotate_beam2inst.nc differ diff --git a/examples/data/dolfyn/test_data/Sig1000_IMU_rotate_inst2earth.nc b/examples/data/dolfyn/test_data/Sig1000_IMU_rotate_inst2earth.nc index 9944aeb7a..f7364c5f0 100644 Binary files a/examples/data/dolfyn/test_data/Sig1000_IMU_rotate_inst2earth.nc and 
b/examples/data/dolfyn/test_data/Sig1000_IMU_rotate_inst2earth.nc differ diff --git a/examples/data/dolfyn/test_data/Sig1000_IMU_ud.nc b/examples/data/dolfyn/test_data/Sig1000_IMU_ud.nc index f0f847653..05663f604 100644 Binary files a/examples/data/dolfyn/test_data/Sig1000_IMU_ud.nc and b/examples/data/dolfyn/test_data/Sig1000_IMU_ud.nc differ diff --git a/examples/data/dolfyn/test_data/Sig1000_tidal.nc b/examples/data/dolfyn/test_data/Sig1000_tidal.nc index f5bf6ba34..759fe4775 100644 Binary files a/examples/data/dolfyn/test_data/Sig1000_tidal.nc and b/examples/data/dolfyn/test_data/Sig1000_tidal.nc differ diff --git a/examples/data/dolfyn/test_data/Sig1000_tidal_bin.nc b/examples/data/dolfyn/test_data/Sig1000_tidal_bin.nc new file mode 100644 index 000000000..4f5ffec15 Binary files /dev/null and b/examples/data/dolfyn/test_data/Sig1000_tidal_bin.nc differ diff --git a/examples/data/dolfyn/test_data/Sig1000_tidal_clean.nc b/examples/data/dolfyn/test_data/Sig1000_tidal_clean.nc index f5148a480..8cb9e6678 100644 Binary files a/examples/data/dolfyn/test_data/Sig1000_tidal_clean.nc and b/examples/data/dolfyn/test_data/Sig1000_tidal_clean.nc differ diff --git a/examples/data/dolfyn/test_data/Sig500_Echo.nc b/examples/data/dolfyn/test_data/Sig500_Echo.nc index e80a279a5..78dbdd06f 100644 Binary files a/examples/data/dolfyn/test_data/Sig500_Echo.nc and b/examples/data/dolfyn/test_data/Sig500_Echo.nc differ diff --git a/examples/data/dolfyn/test_data/Sig500_Echo_clean.nc b/examples/data/dolfyn/test_data/Sig500_Echo_clean.nc index bf913bfa0..099334d74 100644 Binary files a/examples/data/dolfyn/test_data/Sig500_Echo_clean.nc and b/examples/data/dolfyn/test_data/Sig500_Echo_clean.nc differ diff --git a/examples/data/dolfyn/test_data/Sig500_Echo_crop.nc b/examples/data/dolfyn/test_data/Sig500_Echo_crop.nc index ed7fbe512..80d4bca81 100644 Binary files a/examples/data/dolfyn/test_data/Sig500_Echo_crop.nc and b/examples/data/dolfyn/test_data/Sig500_Echo_crop.nc differ diff 
--git a/examples/data/dolfyn/test_data/Sig500_Echo_earth2inst.nc b/examples/data/dolfyn/test_data/Sig500_Echo_earth2inst.nc index a5e0f5d7d..b44b1d8ca 100644 Binary files a/examples/data/dolfyn/test_data/Sig500_Echo_earth2inst.nc and b/examples/data/dolfyn/test_data/Sig500_Echo_earth2inst.nc differ diff --git a/examples/data/dolfyn/test_data/Sig500_Echo_inst2beam.nc b/examples/data/dolfyn/test_data/Sig500_Echo_inst2beam.nc index 711cdeff1..8e12197df 100644 Binary files a/examples/data/dolfyn/test_data/Sig500_Echo_inst2beam.nc and b/examples/data/dolfyn/test_data/Sig500_Echo_inst2beam.nc differ diff --git a/examples/data/dolfyn/test_data/Sig500_last_ensemble_is_whole.nc b/examples/data/dolfyn/test_data/Sig500_last_ensemble_is_whole.nc index b9aa117df..f52d8df45 100644 Binary files a/examples/data/dolfyn/test_data/Sig500_last_ensemble_is_whole.nc and b/examples/data/dolfyn/test_data/Sig500_last_ensemble_is_whole.nc differ diff --git a/examples/data/dolfyn/test_data/Sig_SkippedPings01.nc b/examples/data/dolfyn/test_data/Sig_SkippedPings01.nc index 2b2f0857c..90b41d3c7 100644 Binary files a/examples/data/dolfyn/test_data/Sig_SkippedPings01.nc and b/examples/data/dolfyn/test_data/Sig_SkippedPings01.nc differ diff --git a/examples/data/dolfyn/test_data/VelEchoBT01.nc b/examples/data/dolfyn/test_data/VelEchoBT01.nc index d7ff5dbcb..f2fb6183e 100644 Binary files a/examples/data/dolfyn/test_data/VelEchoBT01.nc and b/examples/data/dolfyn/test_data/VelEchoBT01.nc differ diff --git a/examples/data/dolfyn/test_data/VelEchoBT01_rotate_beam2inst.nc b/examples/data/dolfyn/test_data/VelEchoBT01_rotate_beam2inst.nc index 2462311e5..6cefd020c 100644 Binary files a/examples/data/dolfyn/test_data/VelEchoBT01_rotate_beam2inst.nc and b/examples/data/dolfyn/test_data/VelEchoBT01_rotate_beam2inst.nc differ diff --git a/examples/data/dolfyn/test_data/dat_vm.mat b/examples/data/dolfyn/test_data/dat_vm.mat index ba8c80bda..b71ba2a93 100644 Binary files 
a/examples/data/dolfyn/test_data/dat_vm.mat and b/examples/data/dolfyn/test_data/dat_vm.mat differ diff --git a/examples/data/dolfyn/test_data/dual_profile.nc b/examples/data/dolfyn/test_data/dual_profile.nc new file mode 100644 index 000000000..ab63f99da Binary files /dev/null and b/examples/data/dolfyn/test_data/dual_profile.nc differ diff --git a/examples/data/dolfyn/test_data/vector_data01_bin.nc b/examples/data/dolfyn/test_data/vector_data01_bin.nc index baa0dba0b..a88effa0d 100644 Binary files a/examples/data/dolfyn/test_data/vector_data01_bin.nc and b/examples/data/dolfyn/test_data/vector_data01_bin.nc differ diff --git a/examples/data/dolfyn/test_data/vmdas01_wh.nc b/examples/data/dolfyn/test_data/vmdas01_wh.nc index 118d8d694..a5dc8a5d8 100644 Binary files a/examples/data/dolfyn/test_data/vmdas01_wh.nc and b/examples/data/dolfyn/test_data/vmdas01_wh.nc differ diff --git a/examples/data/dolfyn/test_data/winriver01.nc b/examples/data/dolfyn/test_data/winriver01.nc index cc0bada6a..b49bc6205 100644 Binary files a/examples/data/dolfyn/test_data/winriver01.nc and b/examples/data/dolfyn/test_data/winriver01.nc differ diff --git a/examples/data/dolfyn/test_data/winriver02.nc b/examples/data/dolfyn/test_data/winriver02.nc index efc7a18a3..295415044 100644 Binary files a/examples/data/dolfyn/test_data/winriver02.nc and b/examples/data/dolfyn/test_data/winriver02.nc differ diff --git a/examples/data/dolfyn/test_data/winriver02_rotate_ship2earth.nc b/examples/data/dolfyn/test_data/winriver02_rotate_ship2earth.nc index 7946bc2ab..5bebdeaf0 100644 Binary files a/examples/data/dolfyn/test_data/winriver02_rotate_ship2earth.nc and b/examples/data/dolfyn/test_data/winriver02_rotate_ship2earth.nc differ diff --git a/examples/data/dolfyn/test_data/winriver02_transect.nc b/examples/data/dolfyn/test_data/winriver02_transect.nc index f6c10fedb..d48140c41 100644 Binary files a/examples/data/dolfyn/test_data/winriver02_transect.nc and 
b/examples/data/dolfyn/test_data/winriver02_transect.nc differ diff --git a/examples/data/loads/data_loads_hs.csv b/examples/data/loads/data_loads_hs.csv new file mode 100644 index 000000000..b8ce5a644 --- /dev/null +++ b/examples/data/loads/data_loads_hs.csvdiff --git a/examples/data/loads/loads_data_dict.json b/examples/data/loads/loads_data_dict.json index 3351ddbb5..9054afe7d 100644 --- a/examples/data/loads/loads_data_dict.json +++ b/examples/data/loads/loads_data_dict.json @@ -763,24 +763,24 @@ "yawoffset": 0.36065239549512096 }, { - "ActivePower": NaN, - "BL1_EdgeMom": NaN, - "BL1_FlapMom": NaN, - "BL3_EdgeMom": NaN, - "BL3_FlapMom": NaN, - "LSSDW_My": NaN, - "LSSDW_Mz": NaN, - "LSSDW_Tq": NaN, - "TB_ForeAft": NaN, - "TB_SideSide": NaN, - "TTTq": NaN, - "TT_ForeAft": NaN, - "TT_SideSide": NaN, - "WD_ModActive": NaN, - "WD_Nacelle": NaN, - "WD_NacelleMod": NaN, - "uWind_80m": NaN, - "yawoffset": NaN + "ActivePower": 0.0, + "BL1_EdgeMom": 0.0, + "BL1_FlapMom": 0.0, + "BL3_EdgeMom": 0.0, + "BL3_FlapMom": 0.0, + "LSSDW_My": 0.0, + "LSSDW_Mz": 0.0, + "LSSDW_Tq": 0.0, + "TB_ForeAft": 0.0, + "TB_SideSide": 0.0, + "TTTq": 0.0, + "TT_ForeAft": 0.0, + "TT_SideSide": 0.0, + "WD_ModActive": 0.0, + "WD_Nacelle": 0.0, + "WD_NacelleMod": 0.0, + "uWind_80m": 0.0, + "yawoffset": 0.0 }, { "ActivePower": NaN, @@ -823,24 +823,24 @@ "yawoffset": NaN }, { - "ActivePower": NaN, - "BL1_EdgeMom": NaN, - "BL1_FlapMom": NaN, - "BL3_EdgeMom": NaN, - "BL3_FlapMom": NaN, - "LSSDW_My": NaN, - "LSSDW_Mz": NaN, - "LSSDW_Tq": NaN, - "TB_ForeAft": NaN, - "TB_SideSide": NaN, - "TTTq": NaN, - "TT_ForeAft": NaN, - "TT_SideSide": NaN, - "WD_ModActive": NaN, - "WD_Nacelle": NaN, - "WD_NacelleMod": NaN, - "uWind_80m": NaN, - "yawoffset": NaN + "ActivePower": 0.0, + "BL1_EdgeMom": 0.0, + "BL1_FlapMom": 0.0, + "BL3_EdgeMom": 0.0, + "BL3_FlapMom": 0.0, + "LSSDW_My": 0.0, + "LSSDW_Mz": 0.0, + "LSSDW_Tq": 0.0, + "TB_ForeAft": 0.0, + "TB_SideSide": 0.0, + "TTTq": 0.0, + "TT_ForeAft": 0.0, + 
"TT_SideSide": 0.0, + "WD_ModActive": 0.0, + "WD_Nacelle": 0.0, + "WD_NacelleMod": 0.0, + "uWind_80m": 0.0, + "yawoffset": 0.0 }, { "ActivePower": NaN, @@ -863,24 +863,24 @@ "yawoffset": NaN }, { - "ActivePower": NaN, - "BL1_EdgeMom": NaN, - "BL1_FlapMom": NaN, - "BL3_EdgeMom": NaN, - "BL3_FlapMom": NaN, - "LSSDW_My": NaN, - "LSSDW_Mz": NaN, - "LSSDW_Tq": NaN, - "TB_ForeAft": NaN, - "TB_SideSide": NaN, - "TTTq": NaN, - "TT_ForeAft": NaN, - "TT_SideSide": NaN, - "WD_ModActive": NaN, - "WD_Nacelle": NaN, - "WD_NacelleMod": NaN, - "uWind_80m": NaN, - "yawoffset": NaN + "ActivePower": 0.0, + "BL1_EdgeMom": 0.0, + "BL1_FlapMom": 0.0, + "BL3_EdgeMom": 0.0, + "BL3_FlapMom": 0.0, + "LSSDW_My": 0.0, + "LSSDW_Mz": 0.0, + "LSSDW_Tq": 0.0, + "TB_ForeAft": 0.0, + "TB_SideSide": 0.0, + "TTTq": 0.0, + "TT_ForeAft": 0.0, + "TT_SideSide": 0.0, + "WD_ModActive": 0.0, + "WD_Nacelle": 0.0, + "WD_NacelleMod": 0.0, + "uWind_80m": 0.0, + "yawoffset": 0.0 } ], "bin_means": [ @@ -1647,24 +1647,24 @@ "yawoffset": 0.32465542650598184 }, { - "ActivePower": NaN, - "BL1_EdgeMom": NaN, - "BL1_FlapMom": NaN, - "BL3_EdgeMom": NaN, - "BL3_FlapMom": NaN, - "LSSDW_My": NaN, - "LSSDW_Mz": NaN, - "LSSDW_Tq": NaN, - "TB_ForeAft": NaN, - "TB_SideSide": NaN, - "TTTq": NaN, - "TT_ForeAft": NaN, - "TT_SideSide": NaN, - "WD_ModActive": NaN, - "WD_Nacelle": NaN, - "WD_NacelleMod": NaN, - "uWind_80m": NaN, - "yawoffset": NaN + "ActivePower": 0.0, + "BL1_EdgeMom": 0.0, + "BL1_FlapMom": 0.0, + "BL3_EdgeMom": 0.0, + "BL3_FlapMom": 0.0, + "LSSDW_My": 0.0, + "LSSDW_Mz": 0.0, + "LSSDW_Tq": 0.0, + "TB_ForeAft": 0.0, + "TB_SideSide": 0.0, + "TTTq": 0.0, + "TT_ForeAft": 0.0, + "TT_SideSide": 0.0, + "WD_ModActive": 0.0, + "WD_Nacelle": 0.0, + "WD_NacelleMod": 0.0, + "uWind_80m": 0.0, + "yawoffset": 0.0 }, { "ActivePower": NaN, @@ -1707,24 +1707,24 @@ "yawoffset": NaN }, { - "ActivePower": NaN, - "BL1_EdgeMom": NaN, - "BL1_FlapMom": NaN, - "BL3_EdgeMom": NaN, - "BL3_FlapMom": NaN, - "LSSDW_My": NaN, - "LSSDW_Mz": NaN, - 
"LSSDW_Tq": NaN, - "TB_ForeAft": NaN, - "TB_SideSide": NaN, - "TTTq": NaN, - "TT_ForeAft": NaN, - "TT_SideSide": NaN, - "WD_ModActive": NaN, - "WD_Nacelle": NaN, - "WD_NacelleMod": NaN, - "uWind_80m": NaN, - "yawoffset": NaN + "ActivePower": 0.0, + "BL1_EdgeMom": 0.0, + "BL1_FlapMom": 0.0, + "BL3_EdgeMom": 0.0, + "BL3_FlapMom": 0.0, + "LSSDW_My": 0.0, + "LSSDW_Mz": 0.0, + "LSSDW_Tq": 0.0, + "TB_ForeAft": 0.0, + "TB_SideSide": 0.0, + "TTTq": 0.0, + "TT_ForeAft": 0.0, + "TT_SideSide": 0.0, + "WD_ModActive": 0.0, + "WD_Nacelle": 0.0, + "WD_NacelleMod": 0.0, + "uWind_80m": 0.0, + "yawoffset": 0.0 }, { "ActivePower": NaN, @@ -1747,24 +1747,24 @@ "yawoffset": NaN }, { - "ActivePower": NaN, - "BL1_EdgeMom": NaN, - "BL1_FlapMom": NaN, - "BL3_EdgeMom": NaN, - "BL3_FlapMom": NaN, - "LSSDW_My": NaN, - "LSSDW_Mz": NaN, - "LSSDW_Tq": NaN, - "TB_ForeAft": NaN, - "TB_SideSide": NaN, - "TTTq": NaN, - "TT_ForeAft": NaN, - "TT_SideSide": NaN, - "WD_ModActive": NaN, - "WD_Nacelle": NaN, - "WD_NacelleMod": NaN, - "uWind_80m": NaN, - "yawoffset": NaN + "ActivePower": 0.0, + "BL1_EdgeMom": 0.0, + "BL1_FlapMom": 0.0, + "BL3_EdgeMom": 0.0, + "BL3_FlapMom": 0.0, + "LSSDW_My": 0.0, + "LSSDW_Mz": 0.0, + "LSSDW_Tq": 0.0, + "TB_ForeAft": 0.0, + "TB_SideSide": 0.0, + "TTTq": 0.0, + "TT_ForeAft": 0.0, + "TT_SideSide": 0.0, + "WD_ModActive": 0.0, + "WD_Nacelle": 0.0, + "WD_NacelleMod": 0.0, + "uWind_80m": 0.0, + "yawoffset": 0.0 } ], "bin_mins": [ @@ -2531,24 +2531,24 @@ "yawoffset": 11.605683455992253 }, { - "ActivePower": NaN, - "BL1_EdgeMom": NaN, - "BL1_FlapMom": NaN, - "BL3_EdgeMom": NaN, - "BL3_FlapMom": NaN, - "LSSDW_My": NaN, - "LSSDW_Mz": NaN, - "LSSDW_Tq": NaN, - "TB_ForeAft": NaN, - "TB_SideSide": NaN, - "TTTq": NaN, - "TT_ForeAft": NaN, - "TT_SideSide": NaN, - "WD_ModActive": NaN, - "WD_Nacelle": NaN, - "WD_NacelleMod": NaN, - "uWind_80m": NaN, - "yawoffset": NaN + "ActivePower": 0.0, + "BL1_EdgeMom": 0.0, + "BL1_FlapMom": 0.0, + "BL3_EdgeMom": 0.0, + "BL3_FlapMom": 0.0, + "LSSDW_My": 
0.0, + "LSSDW_Mz": 0.0, + "LSSDW_Tq": 0.0, + "TB_ForeAft": 0.0, + "TB_SideSide": 0.0, + "TTTq": 0.0, + "TT_ForeAft": 0.0, + "TT_SideSide": 0.0, + "WD_ModActive": 0.0, + "WD_Nacelle": 0.0, + "WD_NacelleMod": 0.0, + "uWind_80m": 0.0, + "yawoffset": 0.0 }, { "ActivePower": NaN, @@ -2591,24 +2591,24 @@ "yawoffset": NaN }, { - "ActivePower": NaN, - "BL1_EdgeMom": NaN, - "BL1_FlapMom": NaN, - "BL3_EdgeMom": NaN, - "BL3_FlapMom": NaN, - "LSSDW_My": NaN, - "LSSDW_Mz": NaN, - "LSSDW_Tq": NaN, - "TB_ForeAft": NaN, - "TB_SideSide": NaN, - "TTTq": NaN, - "TT_ForeAft": NaN, - "TT_SideSide": NaN, - "WD_ModActive": NaN, - "WD_Nacelle": NaN, - "WD_NacelleMod": NaN, - "uWind_80m": NaN, - "yawoffset": NaN + "ActivePower": 0.0, + "BL1_EdgeMom": 0.0, + "BL1_FlapMom": 0.0, + "BL3_EdgeMom": 0.0, + "BL3_FlapMom": 0.0, + "LSSDW_My": 0.0, + "LSSDW_Mz": 0.0, + "LSSDW_Tq": 0.0, + "TB_ForeAft": 0.0, + "TB_SideSide": 0.0, + "TTTq": 0.0, + "TT_ForeAft": 0.0, + "TT_SideSide": 0.0, + "WD_ModActive": 0.0, + "WD_Nacelle": 0.0, + "WD_NacelleMod": 0.0, + "uWind_80m": 0.0, + "yawoffset": 0.0 }, { "ActivePower": NaN, @@ -2631,24 +2631,24 @@ "yawoffset": NaN }, { - "ActivePower": NaN, - "BL1_EdgeMom": NaN, - "BL1_FlapMom": NaN, - "BL3_EdgeMom": NaN, - "BL3_FlapMom": NaN, - "LSSDW_My": NaN, - "LSSDW_Mz": NaN, - "LSSDW_Tq": NaN, - "TB_ForeAft": NaN, - "TB_SideSide": NaN, - "TTTq": NaN, - "TT_ForeAft": NaN, - "TT_SideSide": NaN, - "WD_ModActive": NaN, - "WD_Nacelle": NaN, - "WD_NacelleMod": NaN, - "uWind_80m": NaN, - "yawoffset": NaN + "ActivePower": 0.0, + "BL1_EdgeMom": 0.0, + "BL1_FlapMom": 0.0, + "BL3_EdgeMom": 0.0, + "BL3_FlapMom": 0.0, + "LSSDW_My": 0.0, + "LSSDW_Mz": 0.0, + "LSSDW_Tq": 0.0, + "TB_ForeAft": 0.0, + "TB_SideSide": 0.0, + "TTTq": 0.0, + "TT_ForeAft": 0.0, + "TT_SideSide": 0.0, + "WD_ModActive": 0.0, + "WD_Nacelle": 0.0, + "WD_NacelleMod": 0.0, + "uWind_80m": 0.0, + "yawoffset": 0.0 } ], "loads": [ diff --git a/examples/directional_waves.ipynb b/examples/directional_waves.ipynb index 
73ed2c6ff..4ee1bc203 100644 --- a/examples/directional_waves.ipynb +++ b/examples/directional_waves.ipynb @@ -182,8 +182,8 @@ } ], "source": [ - "buoy = '42012'\n", - "wave.io.ndbc.available_data('swdir', buoy)" + "buoy = \"42012\"\n", + "wave.io.ndbc.available_data(\"swdir\", buoy)" ] }, { @@ -1084,7 +1084,7 @@ } ], "source": [ - "date = np.datetime64('2021-02-21T12:40:00')\n", + "date = np.datetime64(\"2021-02-21T12:40:00\")\n", "data = data_all.sel(date=date)\n", "directions = np.arange(0, 360, 2.0)\n", "spectrum = wave.io.ndbc.create_directional_spectrum(data, directions)\n", @@ -1165,7 +1165,7 @@ } ], "source": [ - "wave.graphics.plot_directional_spectrum(spectrum, min=0.3)" + "wave.graphics.plot_directional_spectrum(spectrum, color_level_min=0.3)" ] }, { @@ -1195,7 +1195,9 @@ } ], "source": [ - "wave.graphics.plot_directional_spectrum(spectrum, min=0.3, fill=False, nlevels=4)" + "wave.graphics.plot_directional_spectrum(\n", + " spectrum, color_level_min=0.3, fill=False, nlevels=4\n", + ")" ] }, { @@ -1233,7 +1235,7 @@ } ], "source": [ - "data['swden'].plot()" + "data[\"swden\"].plot()" ] }, { @@ -1303,9 +1305,9 @@ } ], "source": [ - "rho = 1025 # kg/m^3\n", - "g = 9.81 # m/s^2\n", - "wave.graphics.plot_directional_spectrum(spectrum*rho*g, name=\"Energy\", units=\"J\")" + "rho = 1025 # kg/m^3\n", + "g = 9.81 # m/s^2\n", + "wave.graphics.plot_directional_spectrum(spectrum * rho * g, name=\"Energy\", units=\"J\")" ] }, { @@ -1318,7 +1320,7 @@ ], "metadata": { "kernelspec": { - "display_name": "Python 3.9.13 ('.venv': venv)", + "display_name": "Python 3 (ipykernel)", "language": "python", "name": "python3" }, @@ -1332,9 +1334,8 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.9.13" + "version": "3.9.17" }, - "orig_nbformat": 4, "vscode": { "interpreter": { "hash": "15fd306e44580d8cf431083454c399b84f9cc4f7f2c761501397671836835f49" diff --git a/examples/environmental_contours_example.ipynb 
b/examples/environmental_contours_example.ipynb index 82a9ef6cd..5109e2164 100644 --- a/examples/environmental_contours_example.ipynb +++ b/examples/environmental_contours_example.ipynb @@ -132,9 +132,9 @@ ], "source": [ "# Specify the parameter as spectral wave density and the buoy number to be 46022\n", - "parameter = 'swden'\n", - "buoy_number = '46022' \n", - "ndbc_available_data= ndbc.available_data(parameter, buoy_number)\n", + "parameter = \"swden\"\n", + "buoy_number = \"46022\"\n", + "ndbc_available_data = ndbc.available_data(parameter, buoy_number)\n", "ndbc_available_data.head()" ] }, @@ -251,7 +251,7 @@ "outputs": [], "source": [ "# Get dictionary of parameter data by year\n", - "filenames= years_of_interest['filename']\n", + "filenames = years_of_interest[\"filename\"]\n", "ndbc_requested_data = ndbc.request_data(parameter, filenames)" ] }, @@ -497,15 +497,15 @@ } ], "source": [ - "# Lastly we will convert a DateTime Index \n", - "ndbc_data={}\n", + "# Lastly we will convert a DateTime Index\n", + "ndbc_data = {}\n", "# Create a Datetime Index and remove NOAA date columns for each year\n", "for year in ndbc_requested_data:\n", " year_data = ndbc_requested_data[year]\n", " ndbc_data[year] = ndbc.to_datetime_index(parameter, year_data)\n", "\n", "# Display DataFrame of 46022 data from 1996\n", - "ndbc_data['1996'].head()" + "ndbc_data[\"1996\"].head()" ] }, { @@ -638,8 +638,8 @@ ], "source": [ "# Intialize empty lists to store the results from each year\n", - "Hm0_list=[]\n", - "Te_list=[]\n", + "Hm0_list = []\n", + "Te_list = []\n", "\n", "# Iterate over each year and save the result in the initalized dictionary\n", "for year in ndbc_data:\n", @@ -648,9 +648,9 @@ " Te_list.append(resource.energy_period(year_data.T))\n", "\n", "# Concatenate list of Series into a single DataFrame\n", - "Te = pd.concat(Te_list ,axis=0)\n", - "Hm0 = pd.concat(Hm0_list ,axis=0)\n", - "Hm0_Te = pd.concat([Hm0,Te],axis=1)\n", + "Te = pd.concat(Te_list, axis=0)\n", + "Hm0 = 
pd.concat(Hm0_list, axis=0)\n", + "Hm0_Te = pd.concat([Hm0, Te], axis=1)\n", "\n", "# Drop any NaNs created from the calculation of Hm0 or Te\n", "Hm0_Te.dropna(inplace=True)\n", @@ -680,22 +680,22 @@ "outputs": [], "source": [ "# Return period (years) of interest\n", - "period = 100 \n", + "period = 100\n", "\n", "# Remove Hm0 Outliers\n", "Hm0_Te_clean = Hm0_Te[Hm0_Te.Hm0 < 20]\n", "\n", "# Get only the values from the DataFrame\n", - "Hm0 = Hm0_Te_clean.Hm0.values \n", - "Te = Hm0_Te_clean.Te.values \n", + "Hm0 = Hm0_Te_clean.Hm0.values\n", + "Te = Hm0_Te_clean.Te.values\n", "\n", - "# Delta time of sea-states \n", - "dt = (Hm0_Te_clean.index[2]-Hm0_Te_clean.index[1]).seconds \n", + "# Delta time of sea-states\n", + "dt = (Hm0_Te_clean.index[2] - Hm0_Te_clean.index[1]).seconds\n", "\n", "# Get the contour values\n", - "copula = contours.environmental_contours(Hm0, Te, dt, period, 'PCA', return_PCA=True)\n", - "Hm0_contour=copula['PCA_x1']\n", - "Te_contour=copula['PCA_x2']" + "copula = contours.environmental_contours(Hm0, Te, dt, period, \"PCA\", return_PCA=True)\n", + "Hm0_contour = copula[\"PCA_x1\"]\n", + "Te_contour = copula[\"PCA_x2\"]" ] }, { @@ -725,15 +725,19 @@ } ], "source": [ - "fig,ax=plt.subplots(figsize=(8,4))\n", - "#%matplotlib inline\n", - "ax=graphics.plot_environmental_contour(Te, Hm0, \n", - " Te_contour, Hm0_contour, \n", - " data_label='NDBC 46022', \n", - " contour_label='100 Year Contour',\n", - " x_label = 'Energy Period, $Te$ [s]',\n", - " y_label = 'Sig. wave height, $Hm0$ [m]', \n", - " ax=ax)" + "fig, ax = plt.subplots(figsize=(8, 4))\n", + "# %matplotlib inline\n", + "ax = graphics.plot_environmental_contour(\n", + " Te,\n", + " Hm0,\n", + " Te_contour,\n", + " Hm0_contour,\n", + " data_label=\"NDBC 46022\",\n", + " contour_label=\"100 Year Contour\",\n", + " x_label=\"Energy Period, $Te$ [s]\",\n", + " y_label=\"Sig. 
wave height, $Hm0$ [m]\",\n", + " ax=ax,\n", + ")" ] }, { @@ -764,24 +768,30 @@ } ], "source": [ - "copulas = contours.environmental_contours(Hm0, Te, dt, period, method=['gaussian', 'nonparametric_gaussian'])\n", + "copulas = contours.environmental_contours(\n", + " Hm0, Te, dt, period, method=[\"gaussian\", \"nonparametric_gaussian\"]\n", + ")\n", "\n", - "fig, ax = plt.subplots(figsize=(9,4))\n", + "fig, ax = plt.subplots(figsize=(9, 4))\n", "\n", - "Tes=[Te_contour]\n", - "Hm0s=[Hm0_contour]\n", - "methods=['gaussian', 'nonparametric_gaussian']\n", - "for method in methods: \n", - " Hm0s.append(copulas[f'{method}_x1'])\n", - " Tes.append(copulas[f'{method}_x2'])\n", + "Tes = [Te_contour]\n", + "Hm0s = [Hm0_contour]\n", + "methods = [\"gaussian\", \"nonparametric_gaussian\"]\n", + "for method in methods:\n", + " Hm0s.append(copulas[f\"{method}_x1\"])\n", + " Tes.append(copulas[f\"{method}_x2\"])\n", "\n", - "ax = graphics.plot_environmental_contour(Te, Hm0, \n", - " Tes, Hm0s,\n", - " data_label='NDBC 46050', \n", - " contour_label=['PCA','Gaussian', 'Nonparametric Gaussian'],\n", - " x_label = 'Energy Period, $Te$ [s]',\n", - " y_label = 'Sig. wave height, $Hm0$ [m]', \n", - " ax=ax)" + "ax = graphics.plot_environmental_contour(\n", + " Te,\n", + " Hm0,\n", + " Tes,\n", + " Hm0s,\n", + " data_label=\"NDBC 46050\",\n", + " contour_label=[\"PCA\", \"Gaussian\", \"Nonparametric Gaussian\"],\n", + " x_label=\"Energy Period, $Te$ [s]\",\n", + " y_label=\"Sig. 
wave height, $Hm0$ [m]\",\n", + " ax=ax,\n", + ")" ] }, { @@ -914,19 +924,19 @@ ], "source": [ "# Intialize empty lists to store the results from each year\n", - "Hm0_list=[]\n", - "Tp_list=[]\n", + "Hm0_list = []\n", + "Tp_list = []\n", "\n", "# Iterate over each year and save the result in the initalized dictionary\n", "for year in ndbc_data:\n", - " year_data = ndbc_data[year] \n", + " year_data = ndbc_data[year]\n", " Hm0_list.append(resource.significant_wave_height(year_data.T))\n", " Tp_list.append(resource.peak_period(year_data.T))\n", "\n", "# Concatenate list of Series into a single DataFrame\n", - "Tp = pd.concat(Tp_list ,axis=0)\n", - "Hm0 = pd.concat(Hm0_list ,axis=0)\n", - "Hm0_Tp = pd.concat([Hm0,Tp],axis=1)\n", + "Tp = pd.concat(Tp_list, axis=0)\n", + "Hm0 = pd.concat(Hm0_list, axis=0)\n", + "Hm0_Tp = pd.concat([Hm0, Tp], axis=1)\n", "\n", "# Drop any NaNs created from the calculation of Hm0 or Te\n", "Hm0_Tp.dropna(inplace=True)\n", @@ -938,8 +948,8 @@ "Hm0_Tp_clean = Hm0_Tp[Hm0_Tp.Tp < 30]\n", "\n", "# Get only the values from the DataFrame\n", - "Hm0 = Hm0_Tp_clean.Hm0.values \n", - "Tp = Hm0_Tp_clean.Tp.values \n", + "Hm0 = Hm0_Tp_clean.Hm0.values\n", + "Tp = Hm0_Tp_clean.Tp.values\n", "\n", "\n", "Hm0_Tp" @@ -1054,8 +1064,8 @@ "gmm = GaussianMixture(n_components=8).fit(X)\n", "\n", "# Save centers and weights\n", - "results = pd.DataFrame(gmm.means_, columns=['Tp','Hm0'])\n", - "results['weights'] = gmm.weights_\n", + "results = pd.DataFrame(gmm.means_, columns=[\"Tp\", \"Hm0\"])\n", + "results[\"weights\"] = gmm.weights_\n", "results" ] }, @@ -1098,9 +1108,9 @@ "# Plot the Sections of Data\n", "labels = gmm.predict(X)\n", "plt.scatter(Tp, Hm0, c=labels, s=40)\n", - "plt.plot(results.Tp, results.Hm0, 'm+')\n", - "plt.xlabel('Peak Period, $Tp$ [s]')\n", - "plt.ylabel('Sig. wave height, $Hm0$ [m]')" + "plt.plot(results.Tp, results.Hm0, \"m+\")\n", + "plt.xlabel(\"Peak Period, $Tp$ [s]\")\n", + "plt.ylabel(\"Sig. 
wave height, $Hm0$ [m]\")" ] } ], diff --git a/examples/extreme_response_MLER_example.ipynb b/examples/extreme_response_MLER_example.ipynb index d4737efe8..36c2bf11e 100644 --- a/examples/extreme_response_MLER_example.ipynb +++ b/examples/extreme_response_MLER_example.ipynb @@ -62,9 +62,9 @@ } ], "source": [ - "wave_freq = np.linspace( 0.,1,500)\n", - "mfile = pd.read_csv('data/loads/mler.csv')\n", - "RAO = mfile['RAO'].astype(complex)\n", + "wave_freq = np.linspace(0.0, 1, 500)\n", + "mfile = pd.read_csv(\"data/loads/mler.csv\")\n", + "RAO = mfile[\"RAO\"].astype(complex)\n", "RAO[0:10]" ] }, @@ -114,10 +114,10 @@ } ], "source": [ - "Hs = 9.0 # significant wave height\n", - "Tp = 15.1 # time period of waves\n", - "pm = resource.pierson_moskowitz_spectrum(wave_freq,Tp,Hs)\n", - "pm.plot(xlabel='frequency [Hz]',ylabel='response [m^2/Hz]')" + "Hs = 9.0 # significant wave height\n", + "Tp = 15.1 # time period of waves\n", + "pm = resource.pierson_moskowitz_spectrum(wave_freq, Tp, Hs)\n", + "pm.plot(xlabel=\"frequency [Hz]\", ylabel=\"response [m^2/Hz]\")" ] }, { @@ -168,10 +168,14 @@ } ], "source": [ - "mler_data = extreme.mler_coefficients(RAO,pm,1)\n", + "mler_data = extreme.mler_coefficients(RAO, pm, 1)\n", "\n", - "mler_data.plot(y='WaveSpectrum', ylabel='Conditioned wave spectrum [m^2-s]', xlabel='Frequency [Hz]')\n", - "mler_data.plot(y='Phase', ylabel='[rad]', xlabel='Frequency [Hz]')" + "mler_data.plot(\n", + " y=\"WaveSpectrum\",\n", + " ylabel=\"Conditioned wave spectrum [m^2-s]\",\n", + " xlabel=\"Frequency [Hz]\",\n", + ")\n", + "mler_data.plot(y=\"Phase\", ylabel=\"[rad]\", xlabel=\"Frequency [Hz]\")" ] }, { @@ -202,14 +206,14 @@ "source": [ "# generate parameters dict\n", "params = (\n", - " ('startTime',-150.0),\n", - " ('endTime',150.0),\n", - " ('dT',1.0),\n", - " ('T0',0.0),\n", - " ('startX',-300.0),\n", - " ('endX',300.0),\n", - " ('dX',1.0),\n", - " ('X0',0.0)\n", + " (\"startTime\", -150.0),\n", + " (\"endTime\", 150.0),\n", + " (\"dT\", 
1.0),\n", + " (\"T0\", 0.0),\n", + " (\"startX\", -300.0),\n", + " (\"endX\", 300.0),\n", + " (\"dX\", 1.0),\n", + " (\"X0\", 0.0),\n", ")\n", "parameters = dict(params)\n", "\n", @@ -217,11 +221,13 @@ "sim = extreme.mler_simulation(parameters=parameters)\n", "\n", "# generate wave number k\n", - "k = resource.wave_number(wave_freq,70)\n", + "k = resource.wave_number(wave_freq, 70)\n", "k = k.fillna(0)\n", "\n", - "peakHeightDesired = Hs/2 * 1.9\n", - "mler_norm = extreme.mler_wave_amp_normalize(peakHeightDesired, mler_data, sim, k.k.values)" + "peakHeightDesired = Hs / 2 * 1.9\n", + "mler_norm = extreme.mler_wave_amp_normalize(\n", + " peakHeightDesired, mler_data, sim, k.k.values\n", + ")" ] }, { @@ -260,8 +266,8 @@ } ], "source": [ - "mler_ts = extreme.mler_export_time_series(RAO.values,mler_norm,sim,k.k.values)\n", - "mler_ts.plot(xlabel='Time (s)',ylabel='[m] / [*]',xlim=[-100,100],grid=True)" + "mler_ts = extreme.mler_export_time_series(RAO.values, mler_norm, sim, k.k.values)\n", + "mler_ts.plot(xlabel=\"Time (s)\", ylabel=\"[m] / [*]\", xlim=[-100, 100], grid=True)" ] }, { diff --git a/examples/extreme_response_contour_example.ipynb b/examples/extreme_response_contour_example.ipynb index 9fe687e0d..a716aa102 100644 --- a/examples/extreme_response_contour_example.ipynb +++ b/examples/extreme_response_contour_example.ipynb @@ -49,13 +49,13 @@ "metadata": {}, "outputs": [], "source": [ - "parameter = 'swden'\n", - "buoy_number = '46022'\n", + "parameter = \"swden\"\n", + "buoy_number = \"46022\"\n", "ndbc_available_data = ndbc.available_data(parameter, buoy_number)\n", "\n", "years_of_interest = ndbc_available_data[ndbc_available_data.year < 2013]\n", "\n", - "filenames = years_of_interest['filename']\n", + "filenames = years_of_interest[\"filename\"]\n", "ndbc_requested_data = ndbc.request_data(parameter, filenames)\n", "\n", "ndbc_data = {}\n", @@ -87,7 +87,7 @@ "Hm0 = Hm0_Te_clean.Hm0.values\n", "Te = Hm0_Te_clean.Te.values\n", "\n", - "dt = 
(Hm0_Te_clean.index[2]-Hm0_Te_clean.index[1]).seconds" + "dt = (Hm0_Te_clean.index[2] - Hm0_Te_clean.index[1]).seconds" ] }, { @@ -109,11 +109,11 @@ "source": [ "# 100 year contour\n", "period = 100.0\n", - "copula = contours.environmental_contours(Hm0, Te, dt, period, 'PCA')\n", - "hs_contour = copula['PCA_x1']\n", - "te_contour = copula['PCA_x2']\n", + "copula = contours.environmental_contours(Hm0, Te, dt, period, \"PCA\")\n", + "hs_contour = copula[\"PCA_x1\"]\n", + "te_contour = copula[\"PCA_x2\"]\n", "\n", - "# 5 samples \n", + "# 5 samples\n", "te_samples = np.linspace(15, 22, 5)\n", "hs_samples = contours.samples_contour(te_samples, te_contour, hs_contour);" ] @@ -157,11 +157,17 @@ "# plot\n", "fig, ax = plt.subplots(figsize=(8, 4))\n", "ax = graphics.plot_environmental_contour(\n", - " Te, Hm0, te_contour, hs_contour,\n", - " data_label='bouy data', contour_label='100-year contour',\n", - " x_label='Energy Period, $Te$ [s]',\n", - " y_label='Sig. wave height, $Hm0$ [m]', ax=ax)\n", - "ax.plot(te_samples, hs_samples, 'ro', label='samples')\n", + " Te,\n", + " Hm0,\n", + " te_contour,\n", + " hs_contour,\n", + " data_label=\"bouy data\",\n", + " contour_label=\"100-year contour\",\n", + " x_label=\"Energy Period, $Te$ [s]\",\n", + " y_label=\"Sig. wave height, $Hm0$ [m]\",\n", + " ax=ax,\n", + ")\n", + "ax.plot(te_samples, hs_samples, \"ro\", label=\"samples\")\n", "plt.legend()" ] }, @@ -205,29 +211,29 @@ "source": [ "# create the short-term extreme distribution for each sample sea state\n", "t_st = 3.0 * 60.0 * 60.0\n", - "gamma = 3.3 \n", + "gamma = 3.3\n", "t_sim = 1.0 * 60.0 * 60.0\n", "\n", "ste_all = []\n", "i = 0\n", "n = len(hs_samples)\n", "for hs, te in zip(hs_samples, te_samples):\n", - " tp = te / (0.8255 + 0.03852*gamma - 0.005537*gamma**2 + 0.0003154*gamma**3)\n", + " tp = te / (0.8255 + 0.03852 * gamma - 0.005537 * gamma**2 + 0.0003154 * gamma**3)\n", " i += 1\n", " print(f\"Sea state {i}/{n}. (Hs, Te) = ({hs} m, {te} s). 
Tp = {tp} s\")\n", " # time & frequency arrays\n", - " df = 1.0/t_sim\n", - " T_min = tp/10.0 # s\n", - " f_max = 1.0/T_min\n", - " Nf = int(f_max/df) + 1\n", - " time = np.linspace(0, t_sim, 2*Nf+1)\n", + " df = 1.0 / t_sim\n", + " T_min = tp / 10.0 # s\n", + " f_max = 1.0 / T_min\n", + " Nf = int(f_max / df) + 1\n", + " time = np.linspace(0, t_sim, 2 * Nf + 1)\n", " f = np.linspace(0.0, f_max, Nf)\n", " # spectrum\n", " S = resource.jonswap_spectrum(f, tp, hs, gamma)\n", " # 1-hour elevation time-series\n", " data = resource.surface_elevation(S, time).values.squeeze()\n", " # 3-hour extreme distribution\n", - " ste = extreme.short_term_extreme(time, data, t_st, 'peaks_weibull_tail_fit')\n", + " ste = extreme.short_term_extreme(time, data, t_st, \"peaks_weibull_tail_fit\")\n", " ste_all.append(ste)" ] }, @@ -271,7 +277,7 @@ "\n", "hs_design = hs_samples[max_ind]\n", "te_design = te_samples[max_ind]\n", - "print(f\"Design sea state (Hs, Te): ({hs_design} m, {te_design} s)\")\n" + "print(f\"Design sea state (Hs, Te): ({hs_design} m, {te_design} s)\")" ] }, { diff --git a/examples/extreme_response_full_sea_state_example.ipynb b/examples/extreme_response_full_sea_state_example.ipynb index 258a3fcb2..28cf6c745 100644 --- a/examples/extreme_response_full_sea_state_example.ipynb +++ b/examples/extreme_response_full_sea_state_example.ipynb @@ -52,13 +52,13 @@ "metadata": {}, "outputs": [], "source": [ - "parameter = 'swden'\n", - "buoy_number = '46022'\n", + "parameter = \"swden\"\n", + "buoy_number = \"46022\"\n", "ndbc_available_data = ndbc.available_data(parameter, buoy_number)\n", "\n", "years_of_interest = ndbc_available_data[ndbc_available_data.year < 2013]\n", "\n", - "filenames = years_of_interest['filename']\n", + "filenames = years_of_interest[\"filename\"]\n", "ndbc_requested_data = ndbc.request_data(parameter, filenames)\n", "\n", "ndbc_data = {}\n", @@ -90,7 +90,7 @@ "Hm0 = Hm0_Te_clean.Hm0.values\n", "Te = Hm0_Te_clean.Te.values\n", "\n", - "dt = 
(Hm0_Te_clean.index[2]-Hm0_Te_clean.index[1]).seconds" + "dt = (Hm0_Te_clean.index[2] - Hm0_Te_clean.index[1]).seconds" ] }, { @@ -122,7 +122,8 @@ "\n", "# Create samples\n", "sample_hs, sample_te, sample_weights = contours.samples_full_seastate(\n", - " Hm0, Te, npoints, levels, dt)" + " Hm0, Te, npoints, levels, dt\n", + ")" ] }, { @@ -160,9 +161,10 @@ "\n", "for period in levels:\n", " copula = contours.environmental_contours(\n", - " Hm0, Te, dt, period, 'PCA', return_PCA=True)\n", - " Hm0_contours.append(copula['PCA_x1'])\n", - " Te_contours.append(copula['PCA_x2'])\n", + " Hm0, Te, dt, period, \"PCA\", return_PCA=True\n", + " )\n", + " Hm0_contours.append(copula[\"PCA_x1\"])\n", + " Te_contours.append(copula[\"PCA_x2\"])\n", "\n", "# plot\n", "fig, ax = plt.subplots(figsize=(8, 4))\n", @@ -170,10 +172,16 @@ "labels = [f\"{period}-year Contour\" for period in levels]\n", "\n", "ax = graphics.plot_environmental_contour(\n", - " sample_te, sample_hs, Te_contours, Hm0_contours,\n", - " data_label='Samples', contour_label=labels,\n", - " x_label='Energy Period, $Te$ [s]',\n", - " y_label='Sig. wave height, $Hm0$ [m]', ax=ax)\n" + " sample_te,\n", + " sample_hs,\n", + " Te_contours,\n", + " Hm0_contours,\n", + " data_label=\"Samples\",\n", + " contour_label=labels,\n", + " x_label=\"Energy Period, $Te$ [s]\",\n", + " y_label=\"Sig. wave height, $Hm0$ [m]\",\n", + " ax=ax,\n", + ")" ] }, { @@ -423,29 +431,29 @@ "source": [ "# create the short-term extreme distribution for each sample sea state\n", "t_st = 3.0 * 60.0 * 60.0\n", - "gamma = 3.3 \n", + "gamma = 3.3\n", "t_sim = 1.0 * 60.0 * 60.0\n", "\n", "ste_all = []\n", "i = 0\n", "n = len(sample_hs)\n", "for hs, te in zip(sample_hs, sample_te):\n", - " tp = te / (0.8255 + 0.03852*gamma - 0.005537*gamma**2 + 0.0003154*gamma**3)\n", + " tp = te / (0.8255 + 0.03852 * gamma - 0.005537 * gamma**2 + 0.0003154 * gamma**3)\n", " i += 1\n", " print(f\"Sea state {i}/{n}. (Hs, Te) = ({hs} m, {te} s). 
Tp = {tp} s\")\n", " # time & frequency arrays\n", - " df = 1.0/t_sim\n", - " T_min = tp/10.0 # s\n", - " f_max = 1.0/T_min\n", - " Nf = int(f_max/df) + 1\n", - " time = np.linspace(0, t_sim, 2*Nf+1)\n", + " df = 1.0 / t_sim\n", + " T_min = tp / 10.0 # s\n", + " f_max = 1.0 / T_min\n", + " Nf = int(f_max / df) + 1\n", + " time = np.linspace(0, t_sim, 2 * Nf + 1)\n", " f = np.linspace(0.0, f_max, Nf)\n", " # spectrum\n", " S = resource.jonswap_spectrum(f, tp, hs, gamma)\n", " # 1-hour elevation time-series\n", " data = resource.surface_elevation(S, time).values.squeeze()\n", " # 3-hour extreme distribution\n", - " ste = extreme.short_term_extreme(time, data, t_st, 'peaks_weibull_tail_fit')\n", + " ste = extreme.short_term_extreme(time, data, t_st, \"peaks_weibull_tail_fit\")\n", " ste_all.append(ste)" ] }, @@ -494,7 +502,7 @@ } ], "source": [ - "t_st_hr = t_st/(60.0*60.0)\n", + "t_st_hr = t_st / (60.0 * 60.0)\n", "t_return_yr = 100.0\n", "x_t = extreme.return_year_value(lte.ppf, t_return_yr, t_st_hr)\n", "\n", @@ -547,11 +555,11 @@ "# format plot\n", "plt.grid(True, which=\"major\", linestyle=\":\")\n", "ax.tick_params(axis=\"both\", which=\"major\", direction=\"in\")\n", - "ax.xaxis.set_ticks_position('both')\n", - "ax.yaxis.set_ticks_position('both') \n", + "ax.xaxis.set_ticks_position(\"both\")\n", + "ax.yaxis.set_ticks_position(\"both\")\n", "plt.minorticks_off()\n", "ax.set_xticks([0, 5, 10, 15, 20])\n", - "ax.set_yticks(1.0*10.0**(-1*np.arange(11)))\n", + "ax.set_yticks(1.0 * 10.0 ** (-1 * np.arange(11)))\n", "ax.set_xlabel(\"elevation [m]\")\n", "ax.set_ylabel(\"survival function (1-cdf)\")\n", "ax.set_xlim([0, x[-1]])\n", @@ -560,8 +568,8 @@ "\n", "# 100-year return level\n", "s_t = lte.sf(x_t)\n", - "ax.plot([0, x[-1]], [s_t, s_t], '--', color=\"0.5\", linewidth=1)\n", - "ax.plot([x_t, x_t], ylim, '--', color=\"0.5\", linewidth=1)\n" + "ax.plot([0, x[-1]], [s_t, s_t], \"--\", color=\"0.5\", linewidth=1)\n", + "ax.plot([x_t, x_t], ylim, \"--\", 
color=\"0.5\", linewidth=1)" ] } ], diff --git a/examples/loads_example.ipynb b/examples/loads_example.ipynb index 978b13e8f..50335034b 100644 --- a/examples/loads_example.ipynb +++ b/examples/loads_example.ipynb @@ -16,11 +16,11 @@ "metadata": {}, "outputs": [], "source": [ - "import pandas as pd \n", - "import numpy as np \n", + "import pandas as pd\n", + "import numpy as np\n", "from mhkit import utils\n", - "from mhkit import loads \n", - "import matplotlib.pyplot as plt " + "from mhkit import loads\n", + "import matplotlib.pyplot as plt" ] }, { @@ -238,7 +238,7 @@ } ], "source": [ - "loads_data_file = './data/loads/data_loads_example.csv'\n", + "loads_data_file = \"./data/loads/data_loads_example.csv\"\n", "\n", "# Import csv data file\n", "raw_loads_data = pd.read_csv(loads_data_file)\n", @@ -488,16 +488,16 @@ ], "source": [ "# Use the datetime conversion from the utils module\n", - "datetime = utils.excel_to_datetime(raw_loads_data['Timestamp'])\n", + "datetime = utils.excel_to_datetime(raw_loads_data[\"Timestamp\"])\n", "\n", "# Replace the 'Timestamp' column with our newly formatted datetime\n", - "raw_loads_data['Timestamp'] = datetime \n", + "raw_loads_data[\"Timestamp\"] = datetime\n", "\n", "# Set this as our index for our DataFrame\n", - "loads_data = raw_loads_data.set_index('Timestamp')\n", + "loads_data = raw_loads_data.set_index(\"Timestamp\")\n", "\n", "# Remove the 'time' column since it will not be used\n", - "loads_data.drop(columns='Time',inplace=True)\n", + "loads_data.drop(columns=\"Time\", inplace=True)\n", "loads_data.head()" ] }, @@ -532,12 +532,14 @@ ], "source": [ "# Calculate the damage equivalent load for blade 1 root momement and tower base moment\n", - "DEL_tower = loads.general.damage_equivalent_load(loads_data['TB_ForeAft'],4,\n", - " bin_num=100,data_length=600)\n", - "DEL_blade = loads.general.damage_equivalent_load(loads_data['BL1_FlapMom'],10,\n", - " bin_num=100,data_length=600)\n", - "print('DEL TB_ForeAft: '+ 
str(DEL_tower))\n", - "print('DEL BL1_FlapMom: '+ str(DEL_blade))" + "DEL_tower = loads.general.damage_equivalent_load(\n", + " loads_data[\"TB_ForeAft\"], 4, bin_num=100, data_length=600\n", + ")\n", + "DEL_blade = loads.general.damage_equivalent_load(\n", + " loads_data[\"BL1_FlapMom\"], 10, bin_num=100, data_length=600\n", + ")\n", + "print(\"DEL TB_ForeAft: \" + str(DEL_tower))\n", + "print(\"DEL BL1_FlapMom: \" + str(DEL_blade))" ] }, { @@ -647,7 +649,7 @@ ], "source": [ "# Calculate the means, maxs, mins, and stdevs for all data signals in the loads data file\n", - "means,maxs,mins,stdevs = utils.get_statistics(loads_data,50,period=600)\n", + "means, maxs, mins, stdevs = utils.get_statistics(loads_data, 50, period=600)\n", "\n", "# Display the results, indexed by the first timestamp of the corresponding statistical window\n", "means" @@ -874,10 +876,10 @@ ], "source": [ "# Load DataFrames containing load statistics\n", - "means = pd.read_csv('./data/loads/data_loads_means.csv')\n", - "maxs = pd.read_csv('./data/loads/data_loads_maxs.csv')\n", - "mins = pd.read_csv('./data/loads/data_loads_mins.csv')\n", - "std = pd.read_csv('./data/loads/data_loads_std.csv')\n", + "means = pd.read_csv(\"./data/loads/data_loads_means.csv\")\n", + "maxs = pd.read_csv(\"./data/loads/data_loads_maxs.csv\")\n", + "mins = pd.read_csv(\"./data/loads/data_loads_mins.csv\")\n", + "std = pd.read_csv(\"./data/loads/data_loads_std.csv\")\n", "\n", "means.head()" ] @@ -932,23 +934,27 @@ } ], "source": [ - "loads.graphics.plot_statistics(means['uWind_80m'],\n", - " means['BL1_FlapMom'],\n", - " maxs['BL1_FlapMom'],\n", - " mins['BL1_FlapMom'],\n", - " y_stdev=std['BL1_FlapMom'],\n", - " xlabel='Wind Speed [m/s]',\n", - " ylabel='Blade Flap Moment [kNm]',\n", - " title = 'Blade Flap Moment Load Statistics')\n", + "loads.graphics.plot_statistics(\n", + " means[\"uWind_80m\"],\n", + " means[\"BL1_FlapMom\"],\n", + " maxs[\"BL1_FlapMom\"],\n", + " mins[\"BL1_FlapMom\"],\n", + " 
y_stdev=std[\"BL1_FlapMom\"],\n", + " xlabel=\"Wind Speed [m/s]\",\n", + " ylabel=\"Blade Flap Moment [kNm]\",\n", + " title=\"Blade Flap Moment Load Statistics\",\n", + ")\n", "\n", - "loads.graphics.plot_statistics(means['uWind_80m'],\n", - " means['TB_ForeAft'],\n", - " maxs['TB_ForeAft'],\n", - " mins['TB_ForeAft'],\n", - " y_stdev=std['TB_ForeAft'],\n", - " xlabel='Wind Speed [m/s]',\n", - " ylabel='Tower Base Moment [kNm]',\n", - " title = 'Tower Base Moment Load Statistics')" + "loads.graphics.plot_statistics(\n", + " means[\"uWind_80m\"],\n", + " means[\"TB_ForeAft\"],\n", + " maxs[\"TB_ForeAft\"],\n", + " mins[\"TB_ForeAft\"],\n", + " y_stdev=std[\"TB_ForeAft\"],\n", + " xlabel=\"Wind Speed [m/s]\",\n", + " ylabel=\"Tower Base Moment [kNm]\",\n", + " title=\"Tower Base Moment Load Statistics\",\n", + ")" ] }, { @@ -1587,13 +1593,13 @@ ], "source": [ "# Create array containing wind speeds to use as bin edges\n", - "bin_edges = np.arange(3,26,1)\n", - "bin_against = means['uWind_80m']\n", + "bin_edges = np.arange(3, 26, 1)\n", + "bin_against = means[\"uWind_80m\"]\n", "\n", - "# Apply function for means, maxs, and mins \n", - "[bin_means, bin_means_std] = loads.general.bin_statistics(means,bin_against,bin_edges)\n", - "[bin_maxs, bin_maxs_std] = loads.general.bin_statistics(maxs,bin_against,bin_edges)\n", - "[bin_mins, bin_mins_std] = loads.general.bin_statistics(mins,bin_against,bin_edges)\n", + "# Apply function for means, maxs, and mins\n", + "[bin_means, bin_means_std] = loads.general.bin_statistics(means, bin_against, bin_edges)\n", + "[bin_maxs, bin_maxs_std] = loads.general.bin_statistics(maxs, bin_against, bin_edges)\n", + "[bin_mins, bin_mins_std] = loads.general.bin_statistics(mins, bin_against, bin_edges)\n", "\n", "bin_means" ] @@ -1637,8 +1643,8 @@ ], "source": [ "# Specify center of each wind speed bin, and signal name for analysis\n", - "bin_centers = np.arange(3.5,25.5,step=1) \n", - "signal_name = 'TB_ForeAft' \n", + "bin_centers = 
np.arange(3.5, 25.5, step=1)\n", + "signal_name = \"TB_ForeAft\"\n", "\n", "# Specify inputs to be used in plotting\n", "bin_mean = bin_means[signal_name]\n", @@ -1649,11 +1655,18 @@ "bin_min_std = bin_mins_std[signal_name]\n", "\n", "# Plot binned statistics\n", - "loads.graphics.plot_bin_statistics(bin_centers,bin_mean,bin_max,bin_min,\n", - " bin_mean_std,bin_max_std,bin_min_std,\n", - " xlabel='Wind Speed [m/s]',\n", - " ylabel=signal_name,\n", - " title='Binned Statistics')\n" + "loads.graphics.plot_bin_statistics(\n", + " bin_centers,\n", + " bin_mean,\n", + " bin_max,\n", + " bin_min,\n", + " bin_mean_std,\n", + " bin_max_std,\n", + " bin_min_std,\n", + " xlabel=\"Wind Speed [m/s]\",\n", + " ylabel=signal_name,\n", + " title=\"Binned Statistics\",\n", + ")" ] } ], diff --git a/examples/metocean_example.ipynb b/examples/metocean_example.ipynb index cc94569d7..c8675ac75 100644 --- a/examples/metocean_example.ipynb +++ b/examples/metocean_example.ipynb @@ -262,8 +262,8 @@ ], "source": [ "# Specify the parameter as continuous wind speeds and the buoy number to be 46022\n", - "ndbc_dict = {'parameter':'cwind','buoy_number':'46022'} \n", - "available_data = ndbc.available_data(ndbc_dict['parameter'], ndbc_dict['buoy_number'])\n", + "ndbc_dict = {\"parameter\": \"cwind\", \"buoy_number\": \"46022\"}\n", + "available_data = ndbc.available_data(ndbc_dict[\"parameter\"], ndbc_dict[\"buoy_number\"])\n", "available_data" ] }, @@ -333,7 +333,7 @@ "source": [ "# Slice the available data to only include 2018 and more recent\n", "years_of_interest = available_data[available_data.year == 2018]\n", - "years_of_interest\n" + "years_of_interest" ] }, { @@ -376,8 +376,8 @@ ], "source": [ "# Get dictionary of parameter data by year\n", - "ndbc_dict['filenames'] = years_of_interest['filename']\n", - "requested_data = ndbc.request_data(ndbc_dict['parameter'], ndbc_dict['filenames'])\n", + "ndbc_dict[\"filenames\"] = years_of_interest[\"filename\"]\n", + "requested_data = 
ndbc.request_data(ndbc_dict[\"parameter\"], ndbc_dict[\"filenames\"])\n", "requested_data" ] }, @@ -554,13 +554,15 @@ ], "source": [ "# Convert the header dates to a Datetime Index and remove NOAA date columns for each year\n", - "ndbc_dict['2018'] = ndbc.to_datetime_index(ndbc_dict['parameter'], requested_data['2018'])\n", + "ndbc_dict[\"2018\"] = ndbc.to_datetime_index(\n", + " ndbc_dict[\"parameter\"], requested_data[\"2018\"]\n", + ")\n", "\n", "# Replace 99, 999, 9999 with NaN\n", - "ndbc_dict['2018'] = ndbc_dict['2018'].replace({99.0:np.NaN, 999:np.NaN, 9999:np.NaN})\n", + "ndbc_dict[\"2018\"] = ndbc_dict[\"2018\"].replace({99.0: np.NaN, 999: np.NaN, 9999: np.NaN})\n", "\n", "# Display DataFrame of 46022 data from 2018\n", - "ndbc_dict['2018']" + "ndbc_dict[\"2018\"]" ] }, { @@ -648,7 +650,9 @@ ], "source": [ "# Input parameters for site of interest\n", - "temperatures = wind_toolkit.elevation_to_string('temperature',[2, 20, 40, 60, 80, 100, 120, 140, 160])\n", + "temperatures = wind_toolkit.elevation_to_string(\n", + " \"temperature\", [2, 20, 40, 60, 80, 100, 120, 140, 160]\n", + ")\n", "temperatures" ] }, @@ -658,11 +662,13 @@ "metadata": {}, "outputs": [], "source": [ - "wtk_inputs = {'time_interval':'1-hour',\n", - " 'wind_parameters':['windspeed_10m','winddirection_10m'],\n", - " 'temp_parameters':temperatures,\n", - " 'year':[2018],\n", - " 'lat_lon':(40.748, -124.527)}" + "wtk_inputs = {\n", + " \"time_interval\": \"1-hour\",\n", + " \"wind_parameters\": [\"windspeed_10m\", \"winddirection_10m\"],\n", + " \"temp_parameters\": temperatures,\n", + " \"year\": [2018],\n", + " \"lat_lon\": (40.748, -124.527),\n", + "}" ] }, { @@ -692,7 +698,7 @@ } ], "source": [ - "requested_region = wind_toolkit.region_selection(wtk_inputs['lat_lon'])\n", + "requested_region = wind_toolkit.region_selection(wtk_inputs[\"lat_lon\"])\n", "requested_region" ] }, @@ -725,7 +731,7 @@ } ], "source": [ - "wind_toolkit.plot_region(requested_region,lat_lon=wtk_inputs['lat_lon'])" 
+ "wind_toolkit.plot_region(requested_region, lat_lon=wtk_inputs[\"lat_lon\"])" ] }, { @@ -859,8 +865,11 @@ ], "source": [ "wtk_wind, wtk_metadata = wind_toolkit.request_wtk_point_data(\n", - " wtk_inputs['time_interval'],wtk_inputs['wind_parameters'],\n", - " wtk_inputs['lat_lon'],wtk_inputs['year'])\n", + " wtk_inputs[\"time_interval\"],\n", + " wtk_inputs[\"wind_parameters\"],\n", + " wtk_inputs[\"lat_lon\"],\n", + " wtk_inputs[\"year\"],\n", + ")\n", "wtk_wind" ] }, @@ -908,21 +917,31 @@ ], "source": [ "# Get WIND Toolkit and NDBC wind data for 2018-01-11\n", - "ndbc_hourly_data = ndbc_dict['2018']['2018-01-11'].resample('h').nearest()\n", - "wtk_hourly_wind = wtk_wind['2018-01-11']\n", + "ndbc_hourly_data = ndbc_dict[\"2018\"][\"2018-01-11\"].resample(\"h\").nearest()\n", + "wtk_hourly_wind = wtk_wind[\"2018-01-11\"]\n", "\n", "# Plot the timeseries\n", "fig = plt.figure()\n", "ax = fig.add_subplot(111)\n", - "ax.set_xlabel('Time, UTC (h)')\n", - "ax.set_ylabel('Speed (m/s)')\n", - "ax.set_title('Hourly mean wind speeds on January 11, 2018')\n", + "ax.set_xlabel(\"Time, UTC (h)\")\n", + "ax.set_ylabel(\"Speed (m/s)\")\n", + "ax.set_title(\"Hourly mean wind speeds on January 11, 2018\")\n", "ax.grid()\n", "ax.set_ylim([5, 14])\n", "ax.set_xlim([0, 24])\n", - "line1 = ax.plot(ndbc_hourly_data.index.hour,ndbc_hourly_data['WSPD'].values,'o',label='NDBC 4m wind speed')\n", - "line2 = ax.plot(wtk_hourly_wind.index.hour,wtk_hourly_wind['windspeed_10m_0'].values,'x',label='WIND Toolkit 10m wind speed')\n", - "ax.legend()\n" + "line1 = ax.plot(\n", + " ndbc_hourly_data.index.hour,\n", + " ndbc_hourly_data[\"WSPD\"].values,\n", + " \"o\",\n", + " label=\"NDBC 4m wind speed\",\n", + ")\n", + "line2 = ax.plot(\n", + " wtk_hourly_wind.index.hour,\n", + " wtk_hourly_wind[\"windspeed_10m_0\"].values,\n", + " \"x\",\n", + " label=\"WIND Toolkit 10m wind speed\",\n", + ")\n", + "ax.legend()" ] }, { @@ -955,12 +974,13 @@ ], "source": [ "# Set the rose bin widths\n", - 
"width_direction = 10 # in degrees\n", - "width_velocity = 1 # in m/s\n", + "width_direction = 10 # in degrees\n", + "width_velocity = 1 # in m/s\n", "\n", "# Plot the wind rose\n", - "ax = plot_rose(ndbc_hourly_data['WDIR'],ndbc_hourly_data['WSPD'],\n", - " width_direction,width_velocity)\n" + "ax = plot_rose(\n", + " ndbc_hourly_data[\"WDIR\"], ndbc_hourly_data[\"WSPD\"], width_direction, width_velocity\n", + ")" ] }, { @@ -984,8 +1004,12 @@ } ], "source": [ - "ax2 = plot_rose(wtk_hourly_wind['winddirection_10m_0'],wtk_hourly_wind['windspeed_10m_0'],\n", - " width_direction,width_velocity)" + "ax2 = plot_rose(\n", + " wtk_hourly_wind[\"winddirection_10m_0\"],\n", + " wtk_hourly_wind[\"windspeed_10m_0\"],\n", + " width_direction,\n", + " width_velocity,\n", + ")" ] }, { @@ -1026,31 +1050,34 @@ ], "source": [ "wtk_temp, wtk_metadata = wind_toolkit.request_wtk_point_data(\n", - " wtk_inputs['time_interval'],wtk_inputs['temp_parameters'],\n", - " wtk_inputs['lat_lon'],wtk_inputs['year'])\n", + " wtk_inputs[\"time_interval\"],\n", + " wtk_inputs[\"temp_parameters\"],\n", + " wtk_inputs[\"lat_lon\"],\n", + " wtk_inputs[\"year\"],\n", + ")\n", "# wtk_temp = wtk_temp.shift(-7) # optionally UTC to local time\n", "\n", - "# Pick times corresponding to stable and unstable temperature profiles \n", - "stable_temp = wtk_temp.at_time('2018-01-11 03:00:00').values[0]\n", - "unstable_temp = wtk_temp.at_time('2018-01-11 15:00:00').values[0]\n", + "# Pick times corresponding to stable and unstable temperature profiles\n", + "stable_temp = wtk_temp.at_time(\"2018-01-11 03:00:00\").values[0]\n", + "unstable_temp = wtk_temp.at_time(\"2018-01-11 15:00:00\").values[0]\n", "\n", "# Find heights from temperature DataFrame columns\n", "heights = []\n", "for s in wtk_temp.keys():\n", - " s = s.removeprefix('temperature_')\n", - " s = s.removesuffix('m_0')\n", + " s = s.removeprefix(\"temperature_\")\n", + " s = s.removesuffix(\"m_0\")\n", " heights.append(float(s))\n", "heights = 
np.array(heights)\n", "\n", "# Plot the profiles\n", "fig = plt.figure()\n", "ax = fig.add_subplot(111)\n", - "ax.set_xlabel('Temperature (C)')\n", - "ax.set_ylabel('Height (m)')\n", - "ax.set_title('Temperature profiles from January 11, 2018')\n", + "ax.set_xlabel(\"Temperature (C)\")\n", + "ax.set_ylabel(\"Height (m)\")\n", + "ax.set_title(\"Temperature profiles from January 11, 2018\")\n", "ax.grid()\n", - "line1 = ax.plot(stable_temp,heights,'o-',label='time=03:00:00 UTC')\n", - "line2 = ax.plot(unstable_temp,heights,'x-',label='time=15:00:00 UTC')\n", + "line1 = ax.plot(stable_temp, heights, \"o-\", label=\"time=03:00:00 UTC\")\n", + "line2 = ax.plot(unstable_temp, heights, \"x-\", label=\"time=15:00:00 UTC\")\n", "ax.legend()" ] } diff --git a/examples/mooring_example.ipynb b/examples/mooring_example.ipynb index 1f0dd5e33..6340c190b 100644 --- a/examples/mooring_example.ipynb +++ b/examples/mooring_example.ipynb @@ -473,8 +473,8 @@ } ], "source": [ - "fpath = '.\\data\\mooring\\line1_test.out'\n", - "inputfile = '.\\data\\mooring\\TestInput.MD.dat'\n", + "fpath = \".\\data\\mooring\\line1_test.out\"\n", + "inputfile = \".\\data\\mooring\\TestInput.MD.dat\"\n", "\n", "ds = mooring.io.read_moordyn(fpath, input_file=inputfile)\n", "ds" @@ -917,7 +917,11 @@ } ], "source": [ - "print('The average lay length of the mooring line is: ' + str(laylength.mean().values.round()) + ' meters')" + "print(\n", + " \"The average lay length of the mooring line is: \"\n", + " + str(laylength.mean().values.round())\n", + " + \" meters\"\n", + ")" ] }, { @@ -273117,9 +273121,18 @@ "%matplotlib agg\n", "from IPython.display import HTML\n", "\n", - "dsani = ds.sel(Time=slice(0,10))\n", + "dsani = ds.sel(Time=slice(0, 10))\n", "\n", - "ani = mooring.graphics.animate(dsani, dimension='3d', interval=10, repeat=True, xlabel='X-axis',ylabel='Y-axis',zlabel='Depth [m]', title='Mooring Line Example')\n", + "ani = mooring.graphics.animate(\n", + " dsani,\n", + " dimension=\"3d\",\n", + " 
interval=10,\n", + " repeat=True,\n", + " xlabel=\"X-axis\",\n", + " ylabel=\"Y-axis\",\n", + " zlabel=\"Depth [m]\",\n", + " title=\"Mooring Line Example\",\n", + ")\n", "HTML(ani.to_jshtml())" ] }, @@ -391699,8 +391712,16 @@ ], "source": [ "%matplotlib agg\n", - "ani2d = mooring.graphics.animate(dsani, dimension='2d', xaxis='x',yaxis='z', repeat=True, \n", - " xlabel='X-axis',ylabel='Depth [m]', title='Mooring Line Example')\n", + "ani2d = mooring.graphics.animate(\n", + " dsani,\n", + " dimension=\"2d\",\n", + " xaxis=\"x\",\n", + " yaxis=\"z\",\n", + " repeat=True,\n", + " xlabel=\"X-axis\",\n", + " ylabel=\"Depth [m]\",\n", + " title=\"Mooring Line Example\",\n", + ")\n", "\n", "HTML(ani2d.to_jshtml())" ] diff --git a/examples/power_example.ipynb b/examples/power_example.ipynb index 3362958b8..8997df4ab 100644 --- a/examples/power_example.ipynb +++ b/examples/power_example.ipynb @@ -13,7 +13,9 @@ { "cell_type": "code", "execution_count": 1, - "metadata": {}, + "metadata": { + "scrolled": false + }, "outputs": [], "source": [ "import numpy as np\n", @@ -149,9 +151,13 @@ ], "source": [ "# Read in time-series data of voltage (V) and current (I)\n", - "power_data = pd.read_csv('data/power/2020224_181521_PowRaw.csv',skip_blank_lines=True,index_col='Time_UTC') \n", - "# Convert the time index to type \"datetime\" \n", - "power_data.index=pd.to_datetime(power_data.index)\n", + "power_data = pd.read_csv(\n", + " \"data/power/2020224_181521_PowRaw.csv\", skip_blank_lines=True, index_col=\"Time_UTC\"\n", + ")\n", + "\n", + "# Convert the time index to type \"datetime\"\n", + "power_data.index = pd.to_datetime(power_data.index)\n", + "\n", "# Display the data\n", "power_data.head()" ] @@ -174,29 +180,29 @@ "outputs": [ { "data": { - "image/png": "\n", + "image/png": "", "text/plain": [ - "
" + "
" ] }, - "metadata": { - "needs_background": "light" - }, + "metadata": {}, "output_type": "display_data" } ], "source": [ "# First seperate the voltage and current time-series into seperate dataFrames\n", - "voltage = power_data[['MODAQ_Va_V', 'MODAQ_Vb_V', 'MODAQ_Vc_V']]\n", - "current = power_data[['MODAQ_Ia_I','MODAQ_Ib_I','MODAQ_Ic_I']]\n", + "voltage = power_data[[\"MODAQ_Va_V\", \"MODAQ_Vb_V\", \"MODAQ_Vc_V\"]]\n", + "current = power_data[[\"MODAQ_Ia_I\", \"MODAQ_Ib_I\", \"MODAQ_Ic_I\"]]\n", "\n", "# Set the power factor for the system\n", - "power_factor = 0.96 \n", + "power_factor = 0.96\n", "\n", "# Compute the instantaneous AC power in watts\n", - "ac_power = power.characteristics.ac_power_three_phase(voltage, current, power_factor) \n", + "ac_power = power.characteristics.ac_power_three_phase(voltage, current, power_factor)\n", "# Display the result\n", - "ac_power.Power.plot(figsize=(15,5),title='AC Power').set(xlabel='Time',ylabel='Power [W]');" + "ac_power.Power.plot(figsize=(15, 5), title=\"AC Power\").set(\n", + " xlabel=\"Time\", ylabel=\"Power [W]\"\n", + ");" ] }, { @@ -211,7 +217,9 @@ { "cell_type": "code", "execution_count": 4, - "metadata": {}, + "metadata": { + "scrolled": true + }, "outputs": [ { "data": { @@ -238,49 +246,56 @@ " MODAQ_Vb_V\n", " MODAQ_Vc_V\n", " \n", + " \n", + " Time_UTC\n", + " \n", + " \n", + " \n", + " \n", " \n", " \n", " \n", - " 1\n", + " 2020-02-24 18:15:21.499998208\n", " 902.215367\n", " 1218.092331\n", " 433.063162\n", " \n", " \n", - " 2\n", - " 8.499136\n", - " 12.753006\n", - " 28.996487\n", + " 2020-02-24 18:15:21.500018208\n", + " 8.397956\n", + " 12.601184\n", + " 28.651291\n", " \n", " \n", - " 3\n", + " 2020-02-24 18:15:21.500038209\n", " 509.904722\n", " 671.800108\n", " 268.237845\n", " \n", " \n", - " 4\n", + " 2020-02-24 18:15:21.500058210\n", " 10.176332\n", " 15.101179\n", " 26.504936\n", " \n", " \n", - " 5\n", - " 399.622022\n", - " 524.697779\n", - " 217.596577\n", + " 2020-02-24 
18:15:21.500078210\n", + " 404.436745\n", + " 531.019439\n", + " 220.218222\n", " \n", " \n", "\n", "" ], "text/plain": [ - " MODAQ_Va_V MODAQ_Vb_V MODAQ_Vc_V\n", - "1 902.215367 1218.092331 433.063162\n", - "2 8.499136 12.753006 28.996487\n", - "3 509.904722 671.800108 268.237845\n", - "4 10.176332 15.101179 26.504936\n", - "5 399.622022 524.697779 217.596577" + " MODAQ_Va_V MODAQ_Vb_V MODAQ_Vc_V\n", + "Time_UTC \n", + "2020-02-24 18:15:21.499998208 902.215367 1218.092331 433.063162\n", + "2020-02-24 18:15:21.500018208 8.397956 12.601184 28.651291\n", + "2020-02-24 18:15:21.500038209 509.904722 671.800108 268.237845\n", + "2020-02-24 18:15:21.500058210 10.176332 15.101179 26.504936\n", + "2020-02-24 18:15:21.500078210 404.436745 531.019439 220.218222" ] }, "execution_count": 4, @@ -289,25 +304,23 @@ }, { "data": { - "image/png": "\n", + "image/png": "", "text/plain": [ - "
" + "
" ] }, - "metadata": { - "needs_background": "light" - }, + "metadata": {}, "output_type": "display_data" } ], "source": [ "# Compute the instantaneous frequency\n", - "inst_freq = power.characteristics.instantaneous_frequency(voltage) \n", + "inst_freq = power.characteristics.instantaneous_frequency(voltage)\n", "\n", "# Display the result\n", - "inst_freq.plot(figsize=(15,5), ylim=(0,100),\n", - " title='Instantaneous Frequency').set(xlabel='Time [s]',\n", - " ylabel='Frequency [Hz]');\n", + "inst_freq.plot(figsize=(15, 5), ylim=(0, 100), title=\"Instantaneous Frequency\").set(\n", + " xlabel=\"Time [s]\", ylabel=\"Frequency [Hz]\"\n", + ")\n", "inst_freq.head()" ] }, @@ -316,7 +329,7 @@ "metadata": {}, "source": [ "## Power Quality\n", - "The `power.quality` module can be used to compute harmonics of current. and voltage and current distortions following IEC/TS 62600-30 and IEC/TS 61000-4-7. Harmonics and harmonic distortion are required as part of a power quality assessment and characterize the stability of the produced power. " + "The `power.quality` module can be used to compute current or voltage harmonics and current distortions following IEC/TS 62600-30 and IEC/TS 61000-4-7. Harmonics and harmonic distortion are required as part of a power quality assessment and characterize the stability of the produced power. " ] }, { @@ -328,23 +341,21 @@ "outputs": [ { "data": { - "image/png": "\n", + "image/png": "", "text/plain": [ - "
" + "
" ] }, - "metadata": { - "needs_background": "light" - }, + "metadata": {}, "output_type": "display_data" } ], "source": [ "# Set the nominal sampling frequency\n", - "sample_freq = 50000 #[Hz]\n", + "sample_freq = 50000 # [Hz]\n", "\n", "# Set the frequency of the grid the device would be conected to\n", - "grid_freq = 60 #[Hz] \n", + "grid_freq = 60 # [Hz]\n", "\n", "# Set the rated current of the device\n", "rated_current = 18.8 # [Amps]\n", @@ -353,9 +364,9 @@ "harmonics = power.quality.harmonics(current, sample_freq, grid_freq)\n", "\n", "# Plot the results\n", - "harmonics.plot(figsize=(15,5),xlim=(0,900),\n", - " title='Current Harmonics').set(ylabel='Harmonic Amplitude',\n", - " xlabel='Frequency [Hz]');" + "harmonics.plot(figsize=(15, 5), xlim=(0, 900), title=\"Current Harmonics\").set(\n", + " ylabel=\"Harmonic Amplitude\", xlabel=\"Frequency [Hz]\"\n", + ");" ] }, { @@ -396,6 +407,12 @@ " MODAQ_Ib_I\n", " MODAQ_Ic_I\n", " \n", + " \n", + " frequency\n", + " \n", + " \n", + " \n", + " \n", " \n", " \n", " \n", @@ -433,12 +450,13 @@ "" ], "text/plain": [ - " MODAQ_Ia_I MODAQ_Ib_I MODAQ_Ic_I\n", - "0 0.247401 1.948879 1.991755\n", - "60 29.761108 29.305038 29.127020\n", - "120 1.870176 1.291483 1.206478\n", - "180 1.007562 0.648012 0.535090\n", - "240 0.727466 0.437456 0.370414" + " MODAQ_Ia_I MODAQ_Ib_I MODAQ_Ic_I\n", + "frequency \n", + "0 0.247401 1.948879 1.991755\n", + "60 29.761108 29.305038 29.127020\n", + "120 1.870176 1.291483 1.206478\n", + "180 1.007562 0.648012 0.535090\n", + "240 0.727466 0.437456 0.370414" ] }, "execution_count": 6, @@ -448,7 +466,7 @@ ], "source": [ "# Calcualte Harmonic Subgroups\n", - "h_s = power.quality.harmonic_subgroups(harmonics,grid_freq) \n", + "h_s = power.quality.harmonic_subgroups(harmonics, grid_freq)\n", "# Display the results\n", "h_s.head()" ] @@ -469,44 +487,11 @@ "outputs": [ { "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
MODAQ_Ia_IMODAQ_Ib_IMODAQ_Ic_I
THCD8.9725116.0966175.929491
\n", - "
" - ], "text/plain": [ - " MODAQ_Ia_I MODAQ_Ib_I MODAQ_Ic_I\n", - "THCD 8.972511 6.096617 5.929491" + "MODAQ_Ia_I 8.972511\n", + "MODAQ_Ib_I 6.096617\n", + "MODAQ_Ic_I 5.929491\n", + "dtype: float64" ] }, "execution_count": 7, @@ -515,15 +500,15 @@ } ], "source": [ - "#Finally we can compute the total harmonic current distortion as a percentage \n", - "THCD=power.quality.total_harmonic_current_distortion(h_s,rated_current) \n", + "# Finally we can compute the total harmonic current distortion as a percentage\n", + "THCD = power.quality.total_harmonic_current_distortion(h_s)\n", "THCD" ] } ], "metadata": { "kernelspec": { - "display_name": "Python 3", + "display_name": "Python 3 (ipykernel)", "language": "python", "name": "python3" }, @@ -537,7 +522,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.8.5" + "version": "3.9.17" } }, "nbformat": 4, diff --git a/examples/qc_example.ipynb b/examples/qc_example.ipynb index d0afc5370..d1b25ad52 100644 --- a/examples/qc_example.ipynb +++ b/examples/qc_example.ipynb @@ -71,13 +71,13 @@ ], "source": [ "# Load data from the csv file into a DataFrame\n", - "data = pd.read_csv('data/qc/wave_elevation_data.csv', index_col='Time') \n", + "data = pd.read_csv(\"data/qc/wave_elevation_data.csv\", index_col=\"Time\")\n", "\n", "# Plot the data\n", - "data.plot(figsize=(15,5), ylim=(-60,60)) \n", + "data.plot(figsize=(15, 5), ylim=(-60, 60))\n", "\n", "# Print the first 5 rows of data\n", - "print(data.head()) " + "print(data.head())" ] }, { @@ -110,7 +110,7 @@ ], "source": [ "# Convert the index to datetime\n", - "data.index = utils.index_to_datetime(data.index, origin='2019-05-20') \n", + "data.index = utils.index_to_datetime(data.index, origin=\"2019-05-20\")\n", "\n", "# Print the first 5 rows of data\n", "print(data.head())" @@ -151,10 +151,10 @@ "outputs": [], "source": [ "# Define expected frequency of the data, in seconds\n", - "frequency = 0.002 \n", + "frequency = 0.002\n", 
"\n", "# Run the timestamp quality control test\n", - "results = qc.check_timestamp(data, frequency) " + "results = qc.check_timestamp(data, frequency)" ] }, { @@ -196,10 +196,10 @@ ], "source": [ "# Plot cleaned data\n", - "results['cleaned_data'].plot(figsize=(15,5), ylim=(-60,60)) \n", + "results[\"cleaned_data\"].plot(figsize=(15, 5), ylim=(-60, 60))\n", "\n", "# Print the first 5 rows of the cleaned data\n", - "print(results['cleaned_data'].head()) " + "print(results[\"cleaned_data\"].head())" ] }, { @@ -222,7 +222,7 @@ ], "source": [ "# Print the first 5 rows of the mask\n", - "print(results['mask'].head()) " + "print(results[\"mask\"].head())" ] }, { @@ -253,7 +253,7 @@ "source": [ "# Print the test results summary\n", "# The summary is transposed (using .T) so that it is easier to read.\n", - "print(results['test_results'].T) " + "print(results[\"test_results\"].T)" ] }, { @@ -300,16 +300,16 @@ ], "source": [ "# Define corrupt values\n", - "corrupt_values = [-999] \n", + "corrupt_values = [-999]\n", "\n", "# Run the corrupt data quality control test\n", - "results = qc.check_corrupt(results['cleaned_data'], corrupt_values) \n", + "results = qc.check_corrupt(results[\"cleaned_data\"], corrupt_values)\n", "\n", "# Plot cleaned data\n", - "results['cleaned_data'].plot(figsize=(15,5), ylim=(-60,60)) \n", + "results[\"cleaned_data\"].plot(figsize=(15, 5), ylim=(-60, 60))\n", "\n", "# Print test results summary\n", - "print(results['test_results'].T)" + "print(results[\"test_results\"].T)" ] }, { @@ -359,16 +359,16 @@ ], "source": [ "# Define expected lower and upper bound ([lower bound, upper bound])\n", - "expected_bounds = [-50, 50] \n", + "expected_bounds = [-50, 50]\n", "\n", "# Run expected range quality control test\n", - "results = qc.check_range(results['cleaned_data'], expected_bounds) \n", + "results = qc.check_range(results[\"cleaned_data\"], expected_bounds)\n", "\n", "# Plot cleaned data\n", - "results['cleaned_data'].plot(figsize=(15,5), 
ylim=(-60,60)) \n", + "results[\"cleaned_data\"].plot(figsize=(15, 5), ylim=(-60, 60))\n", "\n", "# Print test results summary\n", - "print(results['test_results'].T) " + "print(results[\"test_results\"].T)" ] }, { @@ -411,19 +411,19 @@ ], "source": [ "# Define expected lower bound (no upper bound is specified in this example)\n", - "expected_bound = [0.001, None] \n", + "expected_bound = [0.001, None]\n", "\n", "# Define the moving window, in seconds\n", - "window = 0.02 \n", + "window = 0.02\n", "\n", "# Run the delta quality control test\n", - "results = qc.check_delta(results['cleaned_data'], expected_bound, window) \n", + "results = qc.check_delta(results[\"cleaned_data\"], expected_bound, window)\n", "\n", "# Plot cleaned data\n", - "results['cleaned_data'].plot(figsize=(15,5), ylim=(-60,60))\n", + "results[\"cleaned_data\"].plot(figsize=(15, 5), ylim=(-60, 60))\n", "\n", "# Print test results summary\n", - "print(results['test_results'].T) " + "print(results[\"test_results\"].T)" ] }, { @@ -442,7 +442,7 @@ "outputs": [], "source": [ "# Extract final cleaned data for MHKiT analysis\n", - "cleaned_data = results['cleaned_data'] " + "cleaned_data = results[\"cleaned_data\"]" ] } ], diff --git a/examples/river_example.ipynb b/examples/river_example.ipynb index c03959924..aadc547fc 100644 --- a/examples/river_example.ipynb +++ b/examples/river_example.ipynb @@ -73,11 +73,13 @@ ], "source": [ "# Use the requests method to obtain 10 years of daily discharge data\n", - "data = river.io.usgs.request_usgs_data(station=\"15515500\",\n", - " parameter='00060',\n", - " start_date='2009-08-01',\n", - " end_date='2019-08-01',\n", - " data_type='Daily')\n", + "data = river.io.usgs.request_usgs_data(\n", + " station=\"15515500\",\n", + " parameter=\"00060\",\n", + " start_date=\"2009-08-01\",\n", + " end_date=\"2019-08-01\",\n", + " data_type=\"Daily\",\n", + ")\n", "\n", "# Print data\n", "print(data)" @@ -113,12 +115,12 @@ "column_name = data.columns[0]\n", "\n", "# Rename 
to a shorter key name e.g. 'Q'\n", - "data = data.rename(columns={column_name: 'Q'})\n", + "data = data.rename(columns={column_name: \"Q\"})\n", "\n", "# Convert to discharge data from ft3/s to m3/s\n", - "data.Q = data.Q / (3.28084)**3\n", + "data.Q = data.Q / (3.28084) ** 3\n", "\n", - "# Plot the daily discharge \n", + "# Plot the daily discharge\n", "ax = river.graphics.plot_discharge_timeseries(data.Q)" ] }, @@ -155,7 +157,7 @@ ], "source": [ "# Calculate exceedence probability\n", - "data['F'] = river.resource.exceedance_probability(data.Q)\n", + "data[\"F\"] = river.resource.exceedance_probability(data.Q)\n", "\n", "# Plot the flow duration curve (FDC)\n", "ax = river.graphics.plot_flow_duration_curve(data.Q, data.F)" @@ -199,7 +201,7 @@ ], "source": [ "# Load discharge to velocity curve at turbine location\n", - "DV_curve = pd.read_csv('data/river/tanana_DV_curve.csv')\n", + "DV_curve = pd.read_csv(\"data/river/tanana_DV_curve.csv\")\n", "\n", "# Create a polynomial fit of order 2 from the discharge to velocity curve.\n", "# Return the polynomial fit and and R squared value\n", @@ -241,10 +243,10 @@ ], "source": [ "# Use polynomial fit from DV curve to calculate velocity ('V') from discharge at turbine location\n", - "data['V'] = river.resource.discharge_to_velocity(data.Q, p)\n", + "data[\"V\"] = river.resource.discharge_to_velocity(data.Q, p)\n", "\n", - "# Plot the velocity duration curve (VDC) \n", - "ax = river.graphics.plot_velocity_duration_curve(data.V, data.F )" + "# Plot the velocity duration curve (VDC)\n", + "ax = river.graphics.plot_velocity_duration_curve(data.V, data.F)" ] }, { @@ -282,7 +284,7 @@ ], "source": [ "# Calculate the power produced from turbine velocity to power curve\n", - "VP_curve = pd.read_csv('data/river/tanana_VP_curve.csv')\n", + "VP_curve = pd.read_csv(\"data/river/tanana_VP_curve.csv\")\n", "\n", "# Calculate the polynomial fit for the VP curve\n", "p2, r_squared_2 = river.resource.polynomial_fit(VP_curve.V, VP_curve.P, 
2)\n", @@ -321,10 +323,12 @@ ], "source": [ "# Calculate power from velocity at the turbine location\n", - "data['P'] = river.resource.velocity_to_power(data.V, \n", - " polynomial_coefficients=p2,\n", - " cut_in=VP_curve.V.min(), \n", - " cut_out=VP_curve.V.max())\n", + "data[\"P\"] = river.resource.velocity_to_power(\n", + " data.V,\n", + " polynomial_coefficients=p2,\n", + " cut_in=VP_curve.V.min(),\n", + " cut_out=VP_curve.V.max(),\n", + ")\n", "# Plot the power duration curve\n", "ax = river.graphics.plot_power_duration_curve(data.P, data.F)" ] @@ -356,7 +360,7 @@ ], "source": [ "# Calculate the Annual Energy produced\n", - "s = 365. * 24 * 3600 # Seconds in a year\n", + "s = 365.0 * 24 * 3600 # Seconds in a year\n", "AEP = river.resource.energy_produced(data.P, s)\n", "\n", "print(f\"Annual Energy Produced: {AEP/3600000:.2f} kWh\")" diff --git a/examples/short_term_extremes_example.ipynb b/examples/short_term_extremes_example.ipynb index 05cf9f8dc..193252ffe 100644 --- a/examples/short_term_extremes_example.ipynb +++ b/examples/short_term_extremes_example.ipynb @@ -39,7 +39,7 @@ "import numpy as np\n", "import matplotlib.pyplot as plt\n", "\n", - "from mhkit.loads import extreme \n", + "from mhkit.loads import extreme\n", "from mhkit.wave.resource import jonswap_spectrum, surface_elevation" ] }, @@ -57,7 +57,7 @@ "outputs": [], "source": [ "# short-term period in seconds\n", - "t_st = 3.0 * 60.0 * 60.0 " + "t_st = 3.0 * 60.0 * 60.0" ] }, { @@ -86,19 +86,18 @@ "T_min = 1 # s\n", "Tp = 8 # s\n", "Hs = 1.5 # m\n", - "df = 1/t_st\n", - "f_max = 1/T_min\n", - "Nf = int(f_max/df) + 1\n", + "df = 1 / t_st\n", + "f_max = 1 / T_min\n", + "Nf = int(f_max / df) + 1\n", "f = np.linspace(0.0, f_max, Nf)\n", "S = jonswap_spectrum(f, Tp, Hs)\n", "\n", "# time in seconds\n", - "time = np.linspace(0, t_st, 2*Nf+1)\n", + "time = np.linspace(0, t_st, 2 * Nf + 1)\n", "\n", "# 10 distinct time-series\n", "N = 10\n", - "qoi_timeseries = [surface_elevation(\n", - " S, 
time).values.squeeze() for i in range(N)]" + "qoi_timeseries = [surface_elevation(S, time).values.squeeze() for i in range(N)]" ] }, { @@ -145,15 +144,15 @@ "timeseries = qoi_timeseries[i]\n", "plt.plot(time, timeseries)\n", "plt.title(\"Full 3 hours\")\n", - "plt.xlabel('time [s]')\n", - "plt.ylabel('elevation [m]')\n", + "plt.xlabel(\"time [s]\")\n", + "plt.ylabel(\"elevation [m]\")\n", "\n", "plt.figure()\n", "timeseries = qoi_timeseries[i]\n", "plt.plot(time[time <= 120], timeseries[time <= 120])\n", "plt.title(\"First 2 minutes\")\n", - "plt.xlabel('time [s]')\n", - "plt.ylabel('elevation [m]');" + "plt.xlabel(\"time [s]\")\n", + "plt.ylabel(\"elevation [m]\");" ] }, { @@ -225,11 +224,16 @@ "i = 0 # select: 0-9\n", "\n", "plt.figure()\n", - "line, = plt.plot(time, qoi_timeseries[i], alpha=0.5, label='time-series')\n", - "plt.plot(time[np.argmax(qoi_timeseries[i])], block_maxima[i],\n", - " 'o', color=line.get_color(), label='maximum')\n", - "plt.xlabel('time [s]')\n", - "plt.ylabel('elevation [m]')\n", + "(line,) = plt.plot(time, qoi_timeseries[i], alpha=0.5, label=\"time-series\")\n", + "plt.plot(\n", + " time[np.argmax(qoi_timeseries[i])],\n", + " block_maxima[i],\n", + " \"o\",\n", + " color=line.get_color(),\n", + " label=\"maximum\",\n", + ")\n", + "plt.xlabel(\"time [s]\")\n", + "plt.ylabel(\"elevation [m]\")\n", "plt.legend();" ] }, @@ -260,11 +264,11 @@ ], "source": [ "plt.figure()\n", - "plt.plot(block_maxima, 'o')\n", + "plt.plot(block_maxima, \"o\")\n", "plt.title(\"Block maxima\")\n", - "plt.xlabel('time series')\n", - "plt.ylabel('maximum elevation [m]')\n", - "plt.ylim([0, np.max(block_maxima*1.1)]);" + "plt.xlabel(\"time series\")\n", + "plt.ylabel(\"maximum elevation [m]\")\n", + "plt.ylim([0, np.max(block_maxima * 1.1)]);" ] }, { @@ -328,22 +332,26 @@ ], "source": [ "# print distribution statistics\n", - "print(f'GEV:\\n Expected value: {ste_gev.expect()} m\\n 95% interval: ({ste_gev.ppf(0.025)} m, {ste_gev.ppf(0.975)} m)')\n", - 
"print(f'Gumbel:\\n Expected value: {ste_gum.expect()} m\\n 95% interval: ({ste_gum.ppf(0.025)} m, {ste_gum.ppf(0.975)} m)')\n", + "print(\n", + " f\"GEV:\\n Expected value: {ste_gev.expect()} m\\n 95% interval: ({ste_gev.ppf(0.025)} m, {ste_gev.ppf(0.975)} m)\"\n", + ")\n", + "print(\n", + " f\"Gumbel:\\n Expected value: {ste_gum.expect()} m\\n 95% interval: ({ste_gum.ppf(0.025)} m, {ste_gum.ppf(0.975)} m)\"\n", + ")\n", "\n", "# plot CDF and PDF\n", "x = np.linspace(0, 3, 1000)\n", - "fig, axs = plt.subplots(1,2)\n", + "fig, axs = plt.subplots(1, 2)\n", "axs[0].plot(x, ste_gev.pdf(x))\n", "axs[0].plot(x, ste_gum.pdf(x))\n", - "axs[0].plot(block_maxima, np.zeros(N), 'k.')\n", - "axs[1].plot(x, ste_gev.cdf(x), label='GEV')\n", - "axs[1].plot(x, ste_gum.cdf(x), label='Gumbel')\n", - "axs[0].set_ylabel('PDF')\n", - "axs[1].set_ylabel('CDF')\n", + "axs[0].plot(block_maxima, np.zeros(N), \"k.\")\n", + "axs[1].plot(x, ste_gev.cdf(x), label=\"GEV\")\n", + "axs[1].plot(x, ste_gum.cdf(x), label=\"Gumbel\")\n", + "axs[0].set_ylabel(\"PDF\")\n", + "axs[1].set_ylabel(\"CDF\")\n", "axs[1].legend()\n", - "axs[0].set_xlabel('elevation [m]')\n", - "axs[1].set_xlabel('elevation [m]');" + "axs[0].set_xlabel(\"elevation [m]\")\n", + "axs[1].set_xlabel(\"elevation [m]\");" ] }, { @@ -366,7 +374,7 @@ "outputs": [], "source": [ "t_end = 1.0 * 60.0 * 60.0\n", - "timeseries_1hr = qoi_timeseries[0][time" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], - "source": [ - "ax = tidal.graphics.plot_current_timeseries(data.d, data.s, flood)" - ] - }, + "name": "stderr", + "output_type": "stream", + "text": [ + "c:\\Users\\mcve343\\Anaconda3\\lib\\site-packages\\xarray\\backends\\cfgrib_.py:29: UserWarning: Failed to load cfgrib - most likely there is a problem accessing the ecCodes library. 
Try `import cfgrib` to get the full error message\n", + " warnings.warn(\n" + ] + } + ], + "source": [ + "import matplotlib.pyplot as plt\n", + "from mhkit import tidal" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Loading Data from NOAA-Currents\n", + " \n", + "This example uses 1 year of data from the NOAA-Currents sites. A map of available currents stations is available at https://tidesandcurrents.noaa.gov/map/. The tidal io module includes two functions to import data: `request_noaa_data` which pulls data from the website, and `read_noaa_json` which loads a JSON file. The request function can save the JSON file for later use. \n", + "\n", + "For simplicity, this example loads data from a JSON file into a pandas DataFrame. This data contains 1 year of 6 minute averaged data from the Southampton Shoal Channel LB 6 (Station Number: s08010) in San Francisco Bay. The data includes 6 minute averaged direction [degrees] and speed [cm/s] indexed by time. The DataFrame key names returned by NOAA are 'd' for direction and 's' for speed. Since MHKIT uses SI units, speed is converted to m/s. " + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": {}, + "outputs": [ { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "The plot above shows missing data for most of early and mid-2017. The IEC standard recommends a minimum of 1 year of 10 minute averaged data (See IEC 201 for full description). For the demonstration, this dataset is sufficient. To look at a specific month we can slice the dataset before passing to the plotting function." - ] - }, + "name": "stdout", + "output_type": "stream", + "text": [ + " s d b\n", + "2016-11-08 12:04:00 0.673 358 4\n", + "2016-11-08 12:34:00 0.689 360 4\n", + "2016-11-08 12:46:00 0.738 356 4\n", + "2016-11-08 12:58:00 0.744 359 4\n", + "2016-11-08 13:10:00 0.648 358 4\n", + "... ... ... 
..\n", + "2018-04-01 22:02:00 0.089 296 4\n", + "2018-04-01 22:14:00 0.102 356 4\n", + "2018-04-01 22:26:00 0.011 3 4\n", + "2018-04-01 22:38:00 0.060 193 4\n", + "2018-04-01 23:20:00 0.439 165 4\n", + "\n", + "[18890 rows x 3 columns]\n" + ] + } + ], + "source": [ + "# Load tidal data, Southampton Shoal Channel LB 6\n", + "data, metadata = tidal.io.noaa.read_noaa_json(\"data/tidal/s08010.json\")\n", + "\n", + "# Convert speed data from cm/s to m/s\n", + "data.s = data.s / 100\n", + "\n", + "# Print data\n", + "print(data)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "The data can also be obtained using the function `request_noaa_data` in the tidal IO module. \n", + "To use this function, we need a station number, parameter type, start date, and end date.\n", + "The station number can be found on the NOAA tides and currents website linked above. \n", + "The IEC standard recommends 1 year of 10-minute direction and velocity data. The request function allows users to easily pull any timeframe of data although NOAA limits any one pull to 30 days.\n", + "\n", + "The following code, which has been commented out for this demonstration, can be used to pull data from the NOAA website. This function can be used to save data to a JSON for later use." + ] + }, + { + "cell_type": "code", + "execution_count": 14, + "metadata": {}, + "outputs": [ { - "cell_type": "code", - "execution_count": 7, - "metadata": {}, - "outputs": [ - { - "data": { - "image/png": "", - "text/plain": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], - "source": [ - "# Slice December of 2017 out of the full dataset\n", - "dec17_data = data.loc['2017-12-01':'2017-12-31']\n", - "\n", - "# Plot December of 2017 as current timeseries\n", - "ax = tidal.graphics.plot_current_timeseries(dec17_data.d, dec17_data.s, flood)" - ] - }, + "name": "stdout", + "output_type": "stream", + "text": [ + "Data request URL: https://tidesandcurrents.noaa.gov/api/datagetter?begin_date=20161101&end_date=20161201&station=s08010&product=currents&units=metric&time_zone=gmt&application=web_services&format=xml\n", + "Data request URL: https://tidesandcurrents.noaa.gov/api/datagetter?begin_date=20161201&end_date=20161231&station=s08010&product=currents&units=metric&time_zone=gmt&application=web_services&format=xml\n", + "Data request URL: https://tidesandcurrents.noaa.gov/api/datagetter?begin_date=20161231&end_date=20170130&station=s08010&product=currents&units=metric&time_zone=gmt&application=web_services&format=xml\n", + "Data request URL: https://tidesandcurrents.noaa.gov/api/datagetter?begin_date=20170130&end_date=20170301&station=s08010&product=currents&units=metric&time_zone=gmt&application=web_services&format=xml\n", + "Data request URL: https://tidesandcurrents.noaa.gov/api/datagetter?begin_date=20170301&end_date=20170331&station=s08010&product=currents&units=metric&time_zone=gmt&application=web_services&format=xml\n", + "Data request URL: https://tidesandcurrents.noaa.gov/api/datagetter?begin_date=20170331&end_date=20170430&station=s08010&product=currents&units=metric&time_zone=gmt&application=web_services&format=xml\n", + "Data request URL: https://tidesandcurrents.noaa.gov/api/datagetter?begin_date=20170430&end_date=20170530&station=s08010&product=currents&units=metric&time_zone=gmt&application=web_services&format=xml\n", + "Data request URL: 
https://tidesandcurrents.noaa.gov/api/datagetter?begin_date=20170530&end_date=20170629&station=s08010&product=currents&units=metric&time_zone=gmt&application=web_services&format=xml\n", + "Data request URL: https://tidesandcurrents.noaa.gov/api/datagetter?begin_date=20170629&end_date=20170729&station=s08010&product=currents&units=metric&time_zone=gmt&application=web_services&format=xml\n", + "Data request URL: https://tidesandcurrents.noaa.gov/api/datagetter?begin_date=20170729&end_date=20170828&station=s08010&product=currents&units=metric&time_zone=gmt&application=web_services&format=xml\n", + "Data request URL: https://tidesandcurrents.noaa.gov/api/datagetter?begin_date=20170828&end_date=20170927&station=s08010&product=currents&units=metric&time_zone=gmt&application=web_services&format=xml\n", + "Data request URL: https://tidesandcurrents.noaa.gov/api/datagetter?begin_date=20170927&end_date=20171027&station=s08010&product=currents&units=metric&time_zone=gmt&application=web_services&format=xml\n", + "Data request URL: https://tidesandcurrents.noaa.gov/api/datagetter?begin_date=20171027&end_date=20171126&station=s08010&product=currents&units=metric&time_zone=gmt&application=web_services&format=xml\n", + "Data request URL: https://tidesandcurrents.noaa.gov/api/datagetter?begin_date=20171126&end_date=20171226&station=s08010&product=currents&units=metric&time_zone=gmt&application=web_services&format=xml\n", + "Data request URL: https://tidesandcurrents.noaa.gov/api/datagetter?begin_date=20171226&end_date=20180125&station=s08010&product=currents&units=metric&time_zone=gmt&application=web_services&format=xml\n", + "Data request URL: https://tidesandcurrents.noaa.gov/api/datagetter?begin_date=20180125&end_date=20180224&station=s08010&product=currents&units=metric&time_zone=gmt&application=web_services&format=xml\n", + "Data request URL: 
https://tidesandcurrents.noaa.gov/api/datagetter?begin_date=20180224&end_date=20180326&station=s08010&product=currents&units=metric&time_zone=gmt&application=web_services&format=xml\n", + "Data request URL: https://tidesandcurrents.noaa.gov/api/datagetter?begin_date=20180326&end_date=20180401&station=s08010&product=currents&units=metric&time_zone=gmt&application=web_services&format=xml\n" + ] + } + ], + "source": [ + "# data, metadata = tidal.io.noaa.request_noaa_data(station='s08010', parameter='currents',\n", + "# start_date='20161101', end_date='20180401',\n", + "# proxy=None, write_json='data/s08010.json')" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Principal Flow Directions\n", + "As an initial check on the data, a velocity plot can be created to identify data gaps. To consider the velocity in one of the principal flow directions we apply the `principal_flow_directions` function. This function returns 2 directions (in degrees) corresponding to the flood and ebb directions of the tidal site. Principal flow directions are calculated based on the highest frequency directions. These directions are often close to 180 degrees apart but are not required to be.\n", + "\n", + "The `plot_current_timeseries` function plots velocity in either direction using the speed timeseries. 
" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": {}, + "outputs": [], + "source": [ + "# Specify histogram bin width for directions to calculate the principal flow directions\n", + "width_direction = 1 # in degrees\n", + "\n", + "# Compute two principal flow directions\n", + "direction1, direction2 = tidal.resource.principal_flow_directions(\n", + " data.d, width_direction\n", + ")\n", + "\n", + "# Set flood and ebb directions based on site knowledge\n", + "flood = direction1 # Flow into\n", + "ebb = direction2 # Flow out" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "The time series of current data can be plotted using the `plot_current_timeseries` function, which can include either the flood or ebb directions." + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": {}, + "outputs": [ { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "## Joint Probability Distribution\n", - "\n", - "Direction and velocity can be viewed as a joint probability distribution on a polar plot. This plot helps visually show the flood and ebb directions and the frequency of particular directional velocities. " + "data": { + "image/png": "", + "text/plain": [ + "
" ] - }, + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "ax = tidal.graphics.plot_current_timeseries(data.d, data.s, flood)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "The plot above shows missing data for most of early and mid-2017. The IEC standard recommends a minimum of 1 year of 10 minute averaged data (See IEC 201 for full description). For the demonstration, this dataset is sufficient. To look at a specific month we can slice the dataset before passing to the plotting function." + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "metadata": {}, + "outputs": [ { - "cell_type": "code", - "execution_count": 8, - "metadata": {}, - "outputs": [ - { - "data": { - "image/png": "", - "text/plain": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], - "source": [ - "# Set the joint probability bin widths\n", - "width_direction = 1 # in degrees\n", - "width_velocity = 0.1 # in m/s\n", - "\n", - "# Plot the joint probability distribution\n", - "ax = tidal.graphics.plot_joint_probability_distribution(data.d, data.s, \\\n", - " width_direction, width_velocity, metadata=metadata, flood=flood, ebb=ebb)" + "data": { + "image/png": "", + "text/plain": [ + "
" ] - }, + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "# Slice December of 2017 out of the full dataset\n", + "dec17_data = data.loc[\"2017-12-01\":\"2017-12-31\"]\n", + "\n", + "# Plot December of 2017 as current timeseries\n", + "ax = tidal.graphics.plot_current_timeseries(dec17_data.d, dec17_data.s, flood)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Joint Probability Distribution\n", + "\n", + "Direction and velocity can be viewed as a joint probability distribution on a polar plot. This plot helps visually show the flood and ebb directions and the frequency of particular directional velocities. " + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "metadata": {}, + "outputs": [ { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "## Rose plot\n", - "\n", - "A rose plot shows the same information as the joint probability distribution but the probability is now the r-axis, and the velocity is the contour value. As compared to a joint probability distribution plot, a rose plot can be more readable when using larger bins sizes." + "data": { + "image/png": "", + "text/plain": [ + "
" ] - }, + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "# Set the joint probability bin widths\n", + "width_direction = 1 # in degrees\n", + "width_velocity = 0.1 # in m/s\n", + "\n", + "# Plot the joint probability distribution\n", + "ax = tidal.graphics.plot_joint_probability_distribution(\n", + " data.d,\n", + " data.s,\n", + " width_direction,\n", + " width_velocity,\n", + " metadata=metadata,\n", + " flood=flood,\n", + " ebb=ebb,\n", + ")" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Rose plot\n", + "\n", + "A rose plot shows the same information as the joint probability distribution but the probability is now the r-axis, and the velocity is the contour value. As compared to a joint probability distribution plot, a rose plot can be more readable when using larger bin sizes." + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "metadata": {}, + "outputs": [ { - "cell_type": "code", - "execution_count": 9, - "metadata": {}, - "outputs": [ - { - "data": { - "image/png": "", - "text/plain": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], - "source": [ - "# Define bin sizes\n", - "width_direction = 10 # in degrees\n", - "width_velocity = 0.25 # in m/s\n", - "\n", - "# Create a rose plot\n", - "ax = tidal.graphics.plot_rose(data.d, data.s, width_direction, \\\n", - " width_velocity, metadata=metadata, flood=flood, ebb=ebb)" + "data": { + "image/png": "", + "text/plain": [ + "
" ] - }, + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "# Define bin sizes\n", + "width_direction = 10 # in degrees\n", + "width_velocity = 0.25 # in m/s\n", + "\n", + "# Create a rose plot\n", + "ax = tidal.graphics.plot_rose(\n", + " data.d,\n", + " data.s,\n", + " width_direction,\n", + " width_velocity,\n", + " metadata=metadata,\n", + " flood=flood,\n", + " ebb=ebb,\n", + ")" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Velocity Duration Curve\n", + "\n", + "The velocity duration curve shows the probability of achieving a particular velocity value. After computing the exceedance probability, the rank order of velocity values can be plotted as follows." + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "metadata": {}, + "outputs": [ { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "## Velocity Duration Curve\n", - "\n", - "The velocity duration curve shows the probability of achieving a particular velocity value. After computing the exceedance probability, the rank order of velocity values can be plotted as follows." + "data": { + "image/png": "", + "text/plain": [ + "
" ] - }, + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "# Calculate exceedance probability of data\n", + "data[\"F\"] = tidal.resource.exceedance_probability(data.s)\n", + "\n", + "# Plot the velocity duration curve (VDC)\n", + "ax = tidal.graphics.plot_velocity_duration_curve(data.s, data.F)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Plot by phase direction\n", + "\n", + "MHKiT can produce plots of velocity by probability and exceedance probability for each tidal phase. Using the ebb and flood direction calculated earlier we can simply pass our directions, velocities, ebb, and flood direction to create the following plots:" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "metadata": {}, + "outputs": [ { - "cell_type": "code", - "execution_count": 10, - "metadata": {}, - "outputs": [ - { - "data": { - "image/png": "", - "text/plain": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], - "source": [ - "# Calculate exceedance probability of data\n", - "data['F'] = tidal.resource.exceedance_probability(data.s)\n", - "\n", - "# Plot the velocity duration curve (VDC)\n", - "ax = tidal.graphics.plot_velocity_duration_curve(data.s, data.F)" + "data": { + "text/plain": [ + "" ] + }, + "execution_count": 11, + "metadata": {}, + "output_type": "execute_result" }, { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "## Plot by phase direction\n", - "\n", - "MHKiT can produce plots of velocity by probability and exceedance probability for each tidal phase. Using the ebb and flood direction calculated earlier we can simply pass our directions, velocities, ebb, and flood direction to createthe following plots:" + "data": { + "image/png": "", + "text/plain": [ + "
" ] - }, + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "tidal.graphics.tidal_phase_probability(data.d, data.s, flood, ebb)" + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "metadata": {}, + "outputs": [ { - "cell_type": "code", - "execution_count": 11, - "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "" - ] - }, - "execution_count": 11, - "metadata": {}, - "output_type": "execute_result" - }, - { - "data": { - "image/png": "iVBORw0KGgoAAAANSUhEUgAAA/gAAAK4CAYAAADA9FZPAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjUuMywgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/NK7nSAAAACXBIWXMAAA9hAAAPYQGoP6dpAADTT0lEQVR4nOzde3yU5Z3//9d9mMwMiByLYkRAxEi/FIEUaYNQpApdbBF3cSvKt1XQ3a5a1HapuLYCrfVEt7au2N1VpNuyYlu/rdhKS4poOcRF5CA/uohIQTBiMUgAYSYz9+H3R8iYyDEkcCf39X4+Hj68yAyTz8X1nuuea+5r7rHCMAwRERERERERkVbNjroAEREREREREWk6LfBFREREREREYkALfBEREREREZEY0AJfREREREREJAa0wBcRERERERGJAS3wRURERERERGJAC3wRERERERGRGNACX0RERERERCQGtMAXERERERERiQEt8EVERERERERioEUu8J999lm+/vWvM2zYMM4880wsy2LixIkn9VjvvPMOkyZN4pxzziGZTNKzZ0/uuOMO9uzZ08xVi4iIiIiIiETHjbqAI7nvvvt4/fXXOeOMMzj33HN54403TupxtmzZQllZGbt27eKqq67ioosu4tVXX+XHP/4xf/jDH1ixYgWdO3du5upFRERERERETr8WeQb/kUce4c0332Tfvn385Cc/OenHueWWW9i1axePPvoozz33HA8++CBLlizhzjvvZNOmTdxzzz3NWLWIiIiIiIhIdKwwDMOoiziWl19+mcsuu4zrr7+eefPmnfDf27JlCxdccAG9evXirbfewrY/ei9j//79dOvWjSAI2LVrF2ecccapKF1ERERERETktGmRZ/Cbw0svvQTAqFGjGizuAdq1a8fQoUPJZDKsXLkyivJEREREREREmlWL/Ax+c9i0aRMAffr0OeLtffr0oby8nDfffJPPf/7zR7xPTU0NNTU1hT8HQcAHH3xA586dsSyr+YsWERERERERqScMQ/bv388555xz2Mnrj4vtAn/v3r0AtG/f/oi31/28urr6qI/xwAMPMHPmzGavTURERERERKQxduzYwbnnnnvM+8R2gX88dZceONaZ+LvvvptvfOMbhT/v3buX8847j23bttGxY0d83wfAcZwGbc/zsCyr0LZtG9u2j9rO5/M4jlNou66LZVmFNoDneQ3aiUSCMAwLPz948CBFRUUkEgmCICAIAlzXPWrb933CMCy0j9SPKPtU1w/f99WnE+hTGIaFOmzbjkWf4jhOp6pPYRhy4MAB2rZti2VZsehTHMfpVPbJcRwOHjxIMpk8Zv9aU5/iOE6nsk+2bZPL5XAch0QiEYs+xXGcTmWffN/H8zyKiooa9KM19ymO43Qq+5TP58nlcrRp0wbf92PRpziO08n06eDBg5x33nm0a9eO44ntAr/uDH3dmfyP27dvX4P7HUkymSSZTB72844dO3LmmWc2Q5XNIwx
D2rRpUwiBmKf+mz3KgHnCMKRt27Yaf4PpOCA6DogyIMpAfCUSCeDYJ6frxPYieyUlJQC8+eabR7x98+bNAFx44YWnraZTxfM8Fi5ciOd5UZciEVEGzKbxF2VAlAFRBkQZEDDga/J69uzJli1bjvo1ee+//z5t27Y9ocfct28f7du3Z+/evS3uDL7erTObMmA2jb8oA6IMiDIgykB8NWYd2urP4Ofzed544w22bNnS4Oe9e/dm1KhRbNu2jdmzZze4bfr06Rw4cICvfOUrJ7y4b+n0Tp0oA2bT+IsyIMqAKAOiDEiLXOA/99xz3HDDDdxwww08+OCDALzyyiuFn/3zP/9z4b6VlZX07dv3iF919/jjj9O1a1emTJnCuHHjuPvuuxk5ciSPPPIIF154Id///vdPW59OJc/zKC8v1xPaYMqA2TT+ogyIMiDKgCgDAi10i/6MGTOO+fV0PXr0YNu2bQBs27aNXr16NfhZfTt27ODee+/lD3/4A7t376Zbt26MGzeO6dOn06lTp0bV1VK36IuIiIiIiEg8NWYd2iIX+C1VS13gh2HI/v37adeunT5vYyhlwGwaf1EGRBkQZUCUgfhqzDo0tl+TZxLP81i2bBmjRo0qfIWCmEUZMJvGX5QBUQZEGYiXfD5f+E71xvydiooKhg4dqgy0cI7jnLIx0hn8RmipZ/BFRERERKT127dvH1VVVdTU1ERdipxiyWSSLl26nNC6UmfwDRMEAdXV1XTo0KHB1wGKOZQBs2n8RRkQZUCUgdZv3759VFZWcsYZZ9ClSxcSiUSjttqHYYjv+ziOoy36LVgYhuTzefbu3UtlZSVAs5481gI/BnzfZ9WqVYwcOVITuqGUAbNp/EUZEGVAlIHWr6qqijPOOINzzz33pBboQRCwf/9+2rRpowy0cOl0mnbt2vHOO+9QVVXVrAt8bdFvBG3RFxERERGR5pbP53nrrbcoLi7WOsMgdbs2LrjggmN+Jr8x61C9tRMDQRCwa9cugiCIuhSJiDJgNo2/KAOiDIgy0LrVXVCvKRdeq9v6rfO3rUfdeDf2gorHogV+DARBwIYNGzShG0wZMJvGX5QBUQZEGYiHpn52PpPJNFMlcjqcimslaIt+I2iLvoiIiIiINLdsNsvWrVvp1asXqVQq6nLkNDnRcdcWfcMEQUBlZaXesTWYMmA2jb8oA6IMiDIgYRiSy+W0Rd9wuop+DARBwJYtWzjrrLN0xUxDKQNm0/iLMiDKgCgD8bd9+3aqqqqOensYhhw8eJA2bdpE8jV5Xbp04bzzzjvtv3fGjBnMnDmTl156iREjRpzQ3xkxYgR/+tOfYvlmiBb4MeC6LsOHD4+6DImQMmA2jb8oA6IMiDIQb9u3b6ekpC/Z7MGoSzmqVKoNmzZtbPIi/0TenFi7di0DBgxo0u+JKy3wYyAIAnbs2EH37t31jq2hlAGzafxFGRBlQJSBeKuqqjq0uJ8H9I26nCPYSDY7kaqqqmY7iz99+vSj3nb22Wc3y++IIy3wY6DuM1fFxcWa0A2lDJhN4y/KgCgDogyYoi8wKOoiTosZM2ZEXUKrpGd/DLiuS1lZGa6r92tMpQyYTeMvyoAoA6IMiMB//dd/MXDgQNLpNF27dmXSpEm89957R71/TU0N3/72t+nVqxfJZJLevXszc+ZMcrncaay6eWmBHwO+7/PWW2/h+37UpUhElAGzafxFGRBlQJQBMd0jjzzC1772NS6++GLuuOMOSkpKmDt3LmVlZbz//vtH/Dt///d/z1NPPcWXvvQlbrvtNizLYsaMGfzd3/1dq70An97ii4EwDNmzZw89e/aMuhSJiDJgNo2/KAOiDIgyIHFztC36qVSKadOmHfbz3//+96xcuZKBAwcWfnbnnXfyox/9iGnTpjFnzpzD/s7GjRv585//TMeOHQH4/ve/z2WXXcbvfvc75s2bx//9v/+3eTpzGllha31rIgL79u2jffv27N27lzPPPDPqckRERER
EJAay2Sxbt26lV69epFKpw25fs2YNpaWlwGpa5mfw1wClrF69mkGDmlbf8a6i3759e6qrqwt/rvuavEmTJh22iN+7dy89evSgpqaG6upqkskk8NHX5P3sZz87bBH/8ssvc9lllzFixAheeumlJvXleI437nUasw7VFv0Y8H2fN954Q1uyDKYMmE3jL8qAKAOiDEjchGF4xP/qL+7r+9znPnfYz9q3b8+AAQPIZrNs3LjxhP7OsGHDcF2XtWvXNrkPUdACPyYymUzUJUjElAGzafxFGRBlQJQBMdlZZ511xJ/XfaXe3r17T+jvOI5D586d2bdvX/MWeJpogR8DjuMwcOBAHMeJuhSJiDJgNo2/KAOiDIgyIKb761//esSf111Fv3379if0d3zfZ/fu3a32I9la4MeA7/ts2LBBW7IMpgyYTeMvyoAoA6IMiOn+9Kc/HfazvXv3sm7dOlKpFH379j2hv7Ns2TI8z2twsb7WRAt8ERERERERadV+/vOfH/a5+RkzZrB3714mTJhQuMBefd/73vfYs2dP4c/ZbJa7774bgBtvvPHUFnyK6GvyYsBxHPr16xd1GRIhZcBsGn9RBkQZEGVA4uZoX5MHMG7cOAYMGNDgZ2PGjGHo0KH8/d//Pd26dWP58uUsX76cnj178uCDDx7xcT75yU/yf/7P/2H8+PEkEgkWLFjAli1buPLKK1vlV+SBFvix4Ps+69evp3///vrclaGUAbNp/EUZEGVAlAFTHH4l+Jah+euaOXPmUW/r2bPnYQv8O+64g6uvvppHHnmEX/ziF5xxxhnccMMN3H///XTt2vWIj/OLX/yC733ve/z3f/837777LsXFxcyYMYNp06Yd9+v6Wiot8GMinU5HXYJETBkwm8ZflAFRBkQZiK8uXbqQSrUhm50YdSlHlUq1oUuXLk1+nDAMG3X/GTNmNDjb/9WvfvW4f+fll18utO+77z7uu+++Rv3OlswKG/svaLB9+/bRvn179u7d22qvqigiIiIiIi1LNptl69at9OrVi1QqdcT7bN++naqqqtNc2Ynr0qUL5513XtRltConMu7QuHWozuDHgOd5rF27loEDB+K6GlITKQNm0/iLMiDKgCgD8XfeeecdcwEdhiEHDx6kTZs2rXZ7uTSdrqIfA5Zl0bFjRz2RDaYMmE3jL8qAKAOiDAig6y+IzuDHgeM4XHDBBVGXIRFSBsym8RdlQJQBUQbEsqxjbvMWM+gMfgx4nkdFRQWe50VdikREGTCbxl+UAVEGRBmQMAz58MMPG32ROokXLfBjwLZtiouLsW0Np6mUAbNp/EUZEGVAlAEBSCQSUZcgEdMW/RiwbZsePXpEXYZESBkwm8ZflAFRBkQZEMuySCaTUZchEdNbfDHgeR5Lly7VliyDKQNm0/iLMiDKgCgDEoYh+/fv1xZ9w2mBHwO2bdO7d29tyTKYMmA2jb8oA6IMiDIggM7gi7box0HdZ67EXMqA2TT+ogyIMiDKgFiWRVFRUdRlSMT0Fl8MeJ7HkiVLtCXLYMqA2TT+ogyIMiDKgIRhyL59+7RF33Ba4MeAbdv069dPW7IMpgyYTeMvyoAoA6IMCEA6nY66BImYtujHgG3bdO3aNeoyJELKgNk0/qIMiDIgyoBYlqWvyRMt8OMgn8+zZMkSRo4cqSe1oZQBs2n8RRkQZUCUgfjbvn07VVVVR709CAIOHDhA27ZtI9nJ0aVLF84777zT/nulIS3wY8BxHAYPHozjOFGXIhFRBsym8RdlQJQBUQbibfv27fS9qISDmWzUpRxVm3SKjW9sOq2L/BtuuIH/+q//YuvWrfTs2fO0/d5j+elPf8qNN97I3LlzueGGG07779cCPwZs26ZTp05RlyERUgbMpvEXZUCUAVEG4q2qqoqDmSzzboG+50RdzeE2vgsTH89SVVXV5AW+ZVnHvD2qhXNroQV+DOTzecrLyxk1apS2ZBlKGTCbxl+UAVEGRBkwQ99zYFCvqKs
4PaZPn37Enw8YMOD0FtLKaIEfA67rMmzYMFxXw2kqZcBsGn9RBkQZEGVA4mbGjBlRl9Aq6Xs0YsCyLM4888zjbmeR+FIGzKbxF2VAlAFRBkQa+sUvfsGwYcNo37496XSafv36cf/995PNHvk6Bq+99hp/+7d/S9euXUkmk/To0YN/+qd/4t133z3i/d966y2uueYaOnbsSNu2bSkrK+N3v/vdqezSCdECPwby+TwLFiwgn89HXYpERBkwm8ZflAFRBkQZEPnIXXfdxbXXXsumTZu4/vrrue222wjDkHvuuYdRo0aRy+Ua3H/BggWUlZXxwgsvcMUVV/CNb3yDCy+8kH//93/n05/+NH/5y18a3H/z5s185jOf4dlnn+Wzn/0st99+O+eeey7jxo3j17/+9ens6mG0hycGXNdl1KhR2pJlMGXAbBp/UQZEGRBlQOLmSFv0e/bsedwL7K1YsYKHH36YHj168Oqrr9K1a1cAHnjgAa666ioWLlzIrFmzuOeeewD48MMPmTRpEkEQsHTpUsrKygqP9cADD/Av//Iv/OM//iN//OMfCz+/9dZb2b17Nz/60Y+4/fbbCz9fsGAB48aNO/lONwPNADGhyVyUAbNp/EUZEGVAlAGJk5kzZx72s8997nPHXeDPnTsXgG9/+9uFxT3UPj9++MMf8oc//IE5c+YUFvjPPfccH3zwAddff32DxT3AP//zP/Mf//EfLF68mLfffpsePXrwzjvv8Mc//pFevXpx2223Nbj/VVddxec+9zn+9Kc/nUyXm4W26MeA53ksXLgQz/OiLkUiogyYTeMvyoAoA6IMSNyEYXjYfy+//PJx/97atWsBuOyyyw67raSkhHPPPZetW7dSXV193PsnEgk+97nPNbhf3f8vvfRSHMc57O+MGDHiuDWeSlrgx4DruowZM0bv2hpMGTCbxl+UAVEGRBkQqbV3714Azj777CPe3q1btwb3O9n7n3XWWUe8/9Ee53TRAj8m9G6tKANm0/iLMiDKgCgDItC+fXsA3nvvvSPevnPnzgb3O9n7//Wvfz3i/Y/2OKeLFvgx4Hke5eXlmtQNpgyYTeMvyoAoA6IMiNQaOHAgwBG387/11lu888479OrViw4dOhz3/p7nsXz5cgAGDRrU4P7Lly/H9/3D/s6JfIzgVNICPwYSiQRXXXUViUQi6lIkIsqA2TT+ogyIMiDKgEitSZMmAXDffffx/vvvF37u+z7//M//TBAETJ48ufDzcePG0alTJ+bPn8///M//NHisH/3oR/zlL3/h8ssv57zzzgPg3HPP5YorrmDr1q089thjDe6/YMGCSC+wB7qKfiyEYcj+/ftp164dlmVFXY5EQBkwm8ZflAFRBkQZMMPGd6Ou4MhaUl1lZWV861vf4uGHH6Zfv36MHz+etm3b8vvf/54NGzZw6aWXMnXq1ML9zzjjDJ566imuueYaPve5z3HNNddw3nnnsXr1asrLyzn77LP5j//4jwa/Y/bs2Xz2s5/ljjvuoLy8nIsvvpi33nqL3/zmN3zpS1/it7/97enudoEW+DHgeR7Lli1j1KhRetfWUMqA2TT+ogyIMiDKQLx16dKFNukUEx/PRl3KUbVJp+jSpUvUZQDw0EMPMXDgQB577DF+9rOfkc/n6d27N/fddx/f/OY3KSoqanD/q666ihUrVnD//fezaNEi9u7dy9lnn83XvvY1vvOd73DOOec0uH+fPn34n//5H6ZNm8bixYt5+eWX6d+/P8899xzvv/9+pAt8KwzDMLLf3srs27eP9u3bs3fvXs4888yoyxERERERkRjIZrNs3bqVXr16kUqljnif7du3U1VVdZorO3FdunQpbGOXE3Mi4w6NW4fqDH4MBEFAdXU1HTp0wLZ1WQUTKQNm0/iLMiDKgCgD8XfeeecdcwEdhiG+7+M4jj6mYTA9+2PA931WrVp1xKs4ihmUAbNp/EUZEGVAlAEJw5ADBw6gDdpm0xb9RtAWfRE
RERERaW4nulVb4uVUbNHXGfwYCIKAXbt2EQRB1KVIRJQBs2n8RRkQZUCUAQnDkHw+rzP4htMCPwaCIGDDhg2a0A2mDJhN4y/KgCgDogwIQCaTiboEiZi26DeCtuiLiIiIiEhz0xZ9M2mLvhxREARUVlbqHVuDKQNm0/iLMiDKgCgD8dCUc69hGJLL5bRFvxU5FWOlBX4MBEHAli1bNKEbTBkwm8ZflAFRBkQZaN0cxwEgn8836XFqamqaoxw5TerGu278m4O26DeCtuiLiIiIiMip8Je//IVEIsG5556r77E3QBiGvPPOO+Tzec4///xj3rcx61C3OYuUaARBwI4dO+jevTu2rU0ZJlIGzKbxF2VAlAFRBlq/Ll26UFlZyTvvvEP79u1JJBKNWujXXUW/sX9PTq+6cdq7dy8ffvghxcXFzfr4WuDHQN1nroqLizWhG0oZMJvGX5QBUQZEGWj96s7MVlVVUVlZ2ei/X/cZ/KKiIi3wW4FkMklxcXGz7wzXFv1G0BZ9ERERERE51fL5PL7vR12GnCKO45BIJE74/tqibxjf9wtfr9CcF2iQ1kMZMJvGX5QBUQZEGYiXRCLRqAUgKANSS/t3YiAMQ/bs2aOvxDCYMmA2jb8oA6IMiDIgyoCAtug3irboi4iIiIiIyOnUmHWozuDHgO/7vPHGG/qcjsGUAbNp/EUZEGVAlAFRBgS0wI+NTCYTdQkSMWXAbBp/UQZEGRBlQJQB0Rb9RtAWfRERERERETmdtEXfML7vs2HDBm3HMZgyYDaNvygDogyIMiDKgIAW+CIiIiIiIiKxoC36jaAt+iIiIiIiInI6aYu+YXzfZ+3atdqOYzBlwGwaf1EGRBkQZUCUAQEt8GMjnU5HXYJETBkwm8ZflAFRBkQZEGVAtEW/EbRFX0RERERERE4nbdE3jOd5rFq1Cs/zoi5FIqIMmE3jL8qAKAOiDIgyIKAFfixYlkXHjh2xLCvqUiQiyoDZNP6iDIgyIMqAKAMC2qLfKNqiLyIiIiIiIqeTtugbxvM8KioqtB3HYMqA2TT+ogyIMiDKgCgDAlrgx4Jt2xQXF2PbGk5TKQNm0/iLMiDKgCgDogwIaIt+o2iLvoiIiIiIiJxO2qJvGM/zWLp0qbbjGEwZMJvGX5QBUQZEGRBlQEAL/FiwbZvevXtrO47BlAGzafxFGRBlQJQBUQYEtEW/UbRFX0RERERERE4nbdE3jOd5LFmyRNtxDKYMmE3jL8qAKAOiDIgyIKAFfizYtk2/fv20HcdgyoDZNP6iDIgyIMqAKAMC2qLfKNqiLyIiIiIiIqeTtugbJp/Ps2jRIvL5fNSlSESUAbNp/EUZEGVAlAFRBgR0Br9RWuoZ/CAIqK6upkOHDtqSYyhlwGwaf1EGRBkQZUCUgfhqzDpUC/xGaKkLfBEREREREYknbdE3TD6f54UXXtB2HIMpA2bT+IsyIMqAKAOiDAjoDH6jtNQz+GEYsn//ftq1a4dlWVGXIxFQBsym8RdlQJQBUQZEGYivxqxD3dNUk5xClmW1qDcc5PRTBsym8RdlQJQBUQZEGRDQFv1YyOfzLFiwQNtxDKYMmE3jL8qAKAOiDIgyIKAt+o3SkrfoZ7NZUqmUtuMYShkwm8ZflAFRBkQZEGUgvnSRPQO5rj5tYTplwGwaf1EGRBkQZUCUAdECPwY8z2PhwoV4nhd1KRIRZcBsGn9RBkQZEGVAlAEBbdFvlJa8Rd/zPFzX1XYcQykDZtP4izIgyoAoA6IMxJe26BtI79SJMmA2jb8oA6IMiDIgyoBogR8DnudRXl6uJ7TBlAGzafxFGRBlQJQBUQYEtEW/UVrqFn0RERERERGJJ23RN0wYhuzbtw+9V2MuZcBsGn9RBkQZEGVAlAEBLfBjwfM8li1bpu04BlMGzKbxF2VAlAFRBkQZENAW/UbRFn0RERERERE5nWKxRf+dd95h0qRJnHPOOSSTSXr27Mkdd9zBnj17GvU4zz//PJd
ffjnnnnsu6XSa888/n2uuuYZXXnnlFFV++gVBwAcffEAQBFGXIhFRBsym8RdlQJQBUQZEGRBooQv8LVu2UFpayty5c7nkkku48847Of/88/nxj3/MZz/7WXbv3n1Cj/PP//zPXHXVVaxbt44vfOEL3H777QwaNIgFCxYwdOhQfvazn53inpwevu+zatUqfN+PuhSJiDJgNo2/KAOiDIgyIMqAQAvdoj969GjKy8t59NFH+frXv174+Te+8Q0eeeQR/vEf/5F///d/P+ZjvPfeexQXF/OJT3yC9evX07Vr18JtL730EiNHjqRnz55s3br1hOvSFn0RERERERE5nVr1Fv0tW7ZQXl5Or169uPXWWxvcNnPmTNq2bcvPfvYzPvzww2M+zttvv00QBAwZMqTB4h7gsssuo127dlRVVTV7/VEIgoBdu3ZpO47BlAGzafxFGRBlQJQBUQYEWuAC/6WXXgJg1KhR2HbD8tq1a8fQoUPJZDKsXLnymI/Tp08fkskkK1euZNeuXYf9jv3793PFFVc0b/ERCYKADRs26MlsMGXAbBp/UQZEGRBlQJQBgRa4wN+0aRNQu0A/krqfv/nmm8d8nE6dOjFr1izef/99PvnJT3LzzTdz9913c8011/CFL3yBUaNGHXebf01NDfv27WvwH1D4XIvv+0dse57XoF33JDtaO5/PN2jXfWqirh2G4WFtoNB2XZcRI0YU/l4QBIWvxzha2/f9Bu2W1qe6euu31aej98myLEaOHFn4cxz6FMdxOlV9chyHYcOG4ThObPoUx3E6lX1yXZfPfe5zWJYVmz7FcZxOZZ9s22bkyJGFuuPQpziO06nsE8DIkSOxbTs2fYrjOJ3KPgGMGDEC13Vj06c4jtPJ9ulEtbgF/t69ewFo3779EW+v+3l1dfVxH+vrX/86v/nNbwiCgCeffJIHH3yQZ599lvPOO4+vfvWrh23d/7gHHniA9u3bF/7r3r07ABs2bABg48aNbNy4EYD169ezefNmANauXVv4bP+rr77Kjh07AKioqGDnzp0ALF26tPARgSVLlhT6U15ezv79+wFYuHAh2WwWz/NYuHAhnueRzWZZuHAhAPv376e8vJwgCNi8eTNLliwBoKqqiqVLlwKwc+dOKioqANixYwevvvoqAFu3bmXt2rUAbN68mfXr17eoPkHtGKtPJ9anN998k8rKStasWRObPsVxnE5Vn3K5HAsXLiSXy8WmT3Ecp1PZpyAIWL16daz6FMdxOpV9+uCDD6isrIxVn+I4Tqe6T5WVlbz99tux6lMcx+lU9unPf/4zQRDEqk9xHKeT6dMJC1uYm2++OQTCJ5544oi333333SEQPvDAA8d9rPvvvz+0bTu88847wy1btoQHDhwIV69eHY4aNSoEwqlTpx7z72ez2XDv3r2F/3bs2BEC4QcffBCGYRh6nhd6nndYO5/PN2j7vn/Mdi6Xa9AOgqBBOwiCw9phGBba+Xw+fPnll8NMJhOGYRj6vh/m8/ljtj3Pa9A+Uj+i7FNdvfXb6tPR+5TNZsM//elPYTabjU2f4jhOp6pPuVwufPnllxv8ubX3KY7jdCr7VHccyGazselTHMfpVPappqYm/NOf/hQePHgwNn2K4zidyj5lMpnwT3/6U1hTUxObPsVxnE5lnzKZTPjyyy8Xjgtx6FMcx+lk+lRdXR0C4d69e8PjaXFX0Z86dSo/+MEP+MEPfsA3v/nNw26/7bbbmD17No8//jj/9E//dNTHWbJkCZ///Oe5+uqr+fWvf93gtoMHD3LhhReyc+dO3nzzTXr37n1Ctekq+iIiIiIiInI6teqr6JeUlABH/4x93ZaHCy+88JiP88ILLwC1V8z/uDZt2nDJJZcQBEFhm0VrFgRB4VsDxEzKgNk0/qIMiDIgyoAoAwItcIFftyCv+2x5ffv372fFihWk02k+85nPHPNxcrkcAO+///4Rb6/7eTKZbGrJkQuCgMrKSj2ZDaYMmE3jL8q
AKAOiDIgyINACF/i9e/dm1KhRbNu2jdmzZze4bfr06Rw4cICvfOUrtG3bFqi9quAbb7zBli1bGtx32LBhAPznf/4nlZWVDW77/e9/z4oVK0ilUpSVlZ3C3pwerutSVlaG67pRlyIRUQbMpvEXZUCUAVEGRBkQgBb3GXyALVu2UFZWxq5du7jqqqvo27cvK1eu5KWXXuLCCy+koqKCzp07A7Bt2zZ69epFjx492LZtW+ExgiBg9OjRLF68mHbt2nH11Vdz9tlns3HjRn73u98RhiE/+tGPuP3220+4rpb6GXzf99m6dSu9evXCcZyoy5EIKANm0/iLMiDKgCgDogzEV6v+DD7UnsV/7bXXuOGGG1i5ciX/+q//ypYtW5gyZQqvvPJKYXF/LLZts3DhQh555BE++clP8pvf/IZ//dd/5X/+538YM2YMixYtatTiviULw5A9e/Y06vsRJV6UAbNp/EUZEGVAlAFRBgRa6Bn8lqqlnsEXERERERGReGr1Z/ClcXzf54033sD3/ahLkYgoA2bT+IsyIMqAKAOiDAhogR8bmUwm6hIkYsqA2TT+ogyIMiDKgCgDoi36jaAt+iIiIiIiInI6aYu+YXzfZ8OGDdqOYzBlwGwaf1EGRBkQZUCUAQEt8EVERERERERiQVv0G0Fb9EVEREREROR00hZ9w/i+z9q1a7Udx2DKgNk0/qIMiDIgyoAoAwJa4MdGOp2OugSJmDJgNo2/KAOiDIgyIMqAaIt+I2iLvoiIiIiIiJxO2qJvGM/zWLVqFZ7nRV2KREQZMJvGX5QBUQZEGRBlQEAL/FiwLIuOHTtiWVbUpUhElAGzafxFGRBlQJQBUQYEtEW/UbRFX0RERERERE4nbdE3jOd5VFRUaDuOwZQBs2n8RRkQZUCUAVEGBLTAjwXbtikuLsa2NZymUgbMpvEXZUCUAVEGRBkQ0Bb9RtEWfRERERERETmdtEXfMJ7nsXTpUm3HMZgyYDaNvygDogyIMiDKgIAW+LFg2za9e/fWdhyDKQNm0/iLMiDKgCgDogwIaIt+o2iLvoiIiIiIiJxO2qJvGM/zWLJkibbjGEwZMJvGX5QBUQZEGRBlQEAL/FiwbZt+/fppO47BlAGzafxFGRBlQJQBUQYEtEW/UbRFX0RERERERE4nbdE3TD6fZ9GiReTz+ahLkYgoA2bT+IsyIMqAKAOiDAjoDH6jtNQz+EEQUF1dTYcOHbQlx1DKgNk0/qIMiDIgyoAoA/HVmHWoFviN0FIX+CIiIiIiIhJP2qJvmHw+zwsvvKDtOAZTBsym8RdlQJQBUQZEGRDQGfxGaaln8MMwZP/+/bRr1w7LsqIuRyKgDJhN4y/KgCgDogyIMhBfjVmHuqepJjmFLMtqUW84yOmnDJhN4y/KgCgDogyIMiCgLfqxkM/nWbBggbbjGEwZMJvGX5QBUQZEGRBlQEBb9BulJW/Rz2azpFIpbccxlDJgNo2/KAOiDIgyIMpAfOkiewZyXX3awnTKgNk0/qIMiDIgyoAoA6IFfgx4nsfChQvxPC/qUiQiyoDZNP6iDIgyIMqAKAMC2qLfKC15i77nebiuq+04hlIGzKbxF2VAlAFRBkQZiC9t0TeQ3qkTZcBsGn9RBkQZEGVAlAHRAj8GPM+jvLxcT2iDKQNm0/iLMiDKgCgDogwIaIt+o7TULfoiIiIiIiIST9qib5gwDNm3bx96r8ZcyoDZNP6iDIgyIMqAKAMCWuDHgud5LFu2TNtxDKYMmE3jL8qAKAOiDIgyIKAt+o3Smrbob9++naqqqqjLOC26dOnCeeedF3UZIiIiIiIiza4x61D3NNUkp1AQBFRXV9OhQwds22b79u30vaiEg5ls1KWdFm3SKTa+scnoRf7HMyBm0fiLMiDKgCgDogwIaIEfC77vs2rVKkaOHIlt21RVVXEwk2XeLdD3nKirO7U2vgsTH89SVVVl9AL/4xkQs2j8RRkQZUCUAVEGBLRFv1Fayxb9NWv
WUFpayur7YFCvqKs5tdZshdJvw+rVqxk0aFDU5YiIiIiIiDQrXUXfMEEQsGvXLoIgiLoUiYgyYDaNvygDogyIMiDKgIAW+LEQBAEbNmzQk9lgyoDZNP6iDIgyIMqAKAMC+gx+LLiuy8iRI6MuQyKkDJhN4y/KgCgDogyIMiCgM/ixEAQBlZWVerfOYMqA2TT+ogyIMiDKgCgDAlrgx0IQBGzZskVPZoMpA2bT+IsyIMqAKAOiDAhoi34suK7L8OHDoy6jRdq+fTtVVVVRl3Fa9OzZE9fVU9pEmgNEGRBlQJQBUQYEtMCPhSAI2LFjB927d9d3Xtazfft2+l5UwsFMNupSTjnXdRk16gpmz36cnj17Rl2OnGaaA0QZEGVAlAFRBgS0wI+Fus/bFBcX68lcT1VVFQczWebdAn3PibqaU2vjXx02d7qEqqoqLfANpDlAlAFRBkQZEGVAQAv8WHBdl7KysqjLaLH6ngODekVdxalWw8Rvz2Ts2LFRFyIR0BwgyoAoA6IMiDIgoIvsxYLv+7z11lv4vh91KRKR0HIZO3YsYRhGXYpEQHOAKAOiDIgyIMqAgBb4sRCGIXv27NHizmAhNiUlJcqAoTQHiDIgyoAoA6IMCGiBHwuu6zJ48GBdQd1gdphj1qxZ+ryVoTQHiDIgyoAoA6IMCGiBHwu+7/PGG29oO47BQsvl2muv1Tu2htIcIMqAKAOiDIgyIKAFfmxkMpmoS5AIhdh07txZC3yDaQ4QZUCUAVEGRBkQLfBjwHEcBg4ciOM4UZciEbHDHLNnz9YWfUNpDhBlQJQBUQZEGRDQAj8WfN9nw4YN2o5jsNBKcOONN+oMvqE0B4gyIMqAKAOiDAhogS8iIiIiIiISC1rgx4DjOPTr10/bcQxmhXnmzp2LZVlRlyIR0BwgyoAoA6IMiDIgoAV+LPi+z9q1a7Udx2CBVcStt95KEARRlyIR0BwgyoAoA6IMiDIgoAV+bKTT6ahLkAhZBOzevVtn8A2mOUCUAVEGRBkQZUC0wI8Bx3G46KKLtB3HYFbo8cwzz2iBbyjNAaIMiDIgyoAoAwJa4MeC53msWrUKz/OiLkUiElhFTJ06VVv0DaU5QJQBUQZEGRBlQEAL/FiwLIuOHTvq7K3BLAI2bdqkDBhKc4AoA6IMiDIgyoCAFvix4DgOF1xwgbbjGMwKPZ5//nlN6IbSHCDKgCgDogyIMiCgBX4seJ5HRUWFtuMYLLCSTJ8+XVv0DaU5QJQBUQZEGRBlQEAL/FiwbZvi4mJsW8NpKgufFStW6Ay+oTQHiDIgyoAoA6IMCIAbdQHSdLZt06NHj6jLkAhZocfixYu1wDeU5gBRBkQZEGVAlAEBncGPBc/zWLp0qbbjGCywkjz44IPaom8ozQGiDIgyIMqAKAMCWuDHgm3b9O7dW9txDKaL7JlNc4AoA6IMiDIgyoCAtujHQt3nbcRcFj4VFRVa4BtKc4AoA6IMiDIgyoCAzuDHgud5LFmyRNtxDBbYKR599FFt0TeU5gBRBkQZEGVAlAEBncGPBdu26devn7bjGMwKcjz11FOUlZUddtv27dupqqqKoKrTr0uXLpx33nlRl3HaaQ4QZUCUAVEGRBkQ0AI/FmzbpmvXrlGXIRGyCFi3bt1hW/S3b99O34tKOJjJRlTZ6dUmnWLjG5uMW+RrDhBlQJQBUQZEGRDQAj8W8vk8S5YsYeTIkSQSiajLkQgEdoonn3zssC36VVVVHMxkmXcL9D0nouJOk43vwsTHs1RVVRm3wNccIMqAKAOiDIgyIKAFfiw4jsPgwYNxHCfqUiQiVpBj1qxZ/Pd///cRb+97DgzqdZqLktNGc4AoA6IMiDIgyoCAFvixYNs2nTp1iroMiZBFwKZNm3QVfUNpDhBlQJQBUQZEGRDQVfRjIZ/P88ILL5DP56MuRSIS2GmefvppXUXfUJoDRBkQZUCUAVEGBLTAjwXXdRk2bBiuqw0ZprKCGu666y6dwTeU5gB
RBkQZEGVAlAEBbdGPBcuyOPPMM6MuQyJkEbBjxw4t8A2lOUCUAVEGRBkQZUBAZ/BjIZ/Ps2DBAm3HMVhgp3nuuee0Rd9QmgNEGRBlQJQBUQYEdAY/FlzXZdSoUdqOYzAryDJ58mQWLVoUdSkSAc0BogycnO3bt1NVVRV1Gc0iDEO6devG+vXrj7ibq0uXLsZ9hahpNA+IMiCgBX5s6IlsupCDBw9GXYRESHOAKAONs337dkpK+pLNxmfuTKfTZDKZI96WSrVh06aNWuTHnOYBUQZECYgBz/NYuHAhY8aMIZFIRF2ORCC008yfP58wDKMuRSKgOUCUgcarqqo6tLifB/SNupwmS6cD5s+vZMKEYjKZj38CcyPZ7ESqqqq0wI8xzQOiDAhogR8LrusyZswYvWNnMCvIMGHCBJYtWxZ1KRIBzQGiDDRFX2BQ1EU0WSYTMmHCxWQyLqALrppI84AoAwK6yF5seJ4XdQkSKYs2bdpEXYRESHOAKANmsyxo08ZDX6ZiNs0DogyIFvgx4Hke5eXlekIbLLRTzJkzR1v0DaU5QJQBSaU85swpJ5VSBkyleUCUAQFt0Y+FRCLBVVddFXUZEiE7yDBu3DhWr14ddSkSAc0BogxIJpNg3LiTy0Ccvk3geOL8bQKaB0QZENACPxbCMGT//v20a9fuiF+NI/EXYtO9e7HO4BtKc4AoA2LbIcXF+6msbEcQnHgG4vhtAscS528T0DwgyoCAFvix4Hkey5YtY9SoUbpipqFCO8lDDz2kBb6hNAeIMiDJpMdDDy1j8uRRZDInnoG4fZvAscX72wQ0D4gyIKAFfiwkEgmuvPLKqMuQCNlBhuuuu05b9A2lOUCUAclkElx3XVMyEI9vEzCZ5gFRBgR0kb1YCIKADz74gCAIoi5FIhJiU1JSojP4htIcIMqA2HZASckH2LYyYCrNA6IMCGiBHwu+77Nq1Sp834+6FIlIaBcxdepULfANpTlAlAEpKvKZOnUVRUXKgKk0D4gyIKAFfiwkEglGjx6tz9oYzA6y3HTTTdi2ntIm0hwgyoBkswluumk02awyYCrNA6IMCGiBHwtBELBr1y5txzFYiM2AAQN0Bt9QmgNEGRDbDhgwYJe26BtM84AoAwK6yF4sBEHAhg0bGD58uM7gGiq0i5g0aZIW+IbSHCDKgBQVBUyatIFvfWs42awy0Fjbt2+nqqoq6jKaJAgC/vrXv3LWWWcdcx7o0qVLLL9FQHQskFpa4MeA67qMHDky6jIkQnaQZcqUKbqKvqE0B4gyINmsy5QpysDJ2L59OyUlfQ99XWD8pVJt2LRpoxb5MaRjgYAW+LEQBAE7d+6kW7duerfOUCEOZWVDdAbfUJoDRBkQxwkYMmQnK1d2w/eVgcaoqqo6tLifR+3XBbZOjhMyZEiGlSvT+L51lHttJJudSFVVlRb4MaRjgYAW+LEQBAFbtmw57pYsia/Qchk7dqwW+IbSHCDKgLhuwNixW1i9+iwt8E9aX2BQ1EWcNNf1GDu2gtWrL8b39RLfRDoWCOgie7Hgui7Dhw/HdTWZm8oOa5g2bZomc0NpDhBlQGpqXKZNG05NjTJgKmVAdCwQ0AI/FoIg4O2339YVMw0WWi6XX365zuAbSnOAKAPiugGXX/42rqsMmEoZEB0LBLTAj4UgCKisrNST2WAhDkOHDtUC31CaA0QZEMcJGDq0EsdRBkylDIiOBQJa4MeC67qUlZVpO47B7LCGmTNnaou+oTQHiDIgNTUuM2eWaXu2wZQB0bFAQAv8WPB9n7feegvf96MuRSKii+yZTXOAKAPiuj5jx76F6yoDplIGRMcCAS3wYyEMQ/bs2aPFncFCbEpKSpQBQ2kOEGVAbDukpGQPtq0MmEoZEB0LBPQ1ebHgui6DBw+OugyJkB3mmDVrFtdee23UpUgENAfIyWRg+/btVFVVnaKKWpYuXbrE/ju/czmXWbM0D5hMGRC9HhDQAj8WfN9n8+bN9OnTB8d
xoi5HIhBaLtdeO17v2BpKc4A0NgPbt2+npKQv2ezB01Bd9FKpNmzatDHWi3zX9Rk/fjPPPtsHz9M8YCJlQPR6QEAL/NjIZDJRlyARCrHp3LmzFvgG0xwgjclAVVXVocX9PKDvKaupZdhINjuRqqqqWC/wbRs6d86ga62aSxkQ0OsBacEL/HfeeYd7772XP/zhD+zevZtu3boxbtw4pk+fTseOHRv1WMuWLeNHP/oRFRUVfPDBB3Tq1IlPfepT3HHHHYwZM+YU9eD0cRyHgQMHRl2GRMgOc8yePZtJkyZFXYpEQHOAnHwG+gKDmrsciUAu5zB7tuYBkykDotcDAi30IntbtmyhtLSUuXPncskll3DnnXdy/vnn8+Mf/5jPfvaz7N69+4Qf67777mP48OEsXbqUL3zhC3zzm9/kS1/6Env27OHll18+dZ04jXzfZ8OGDbpipsFCK8GNN96oM/iG0hwgyoAkEj433riBREIZMJUyIDoWCLTQM/i33HILu3bt4tFHH+XrX/964eff+MY3eOSRR7jnnnv493//9+M+zi9/+Uu+853vcPnll/PrX/+adu3aNbg9n883e+0iIiIiIiIiUWhxZ/C3bNlCeXk5vXr14tZbb21w28yZM2nbti0/+9nP+PDDD4/5OEEQcNddd5FOp3n66acPW9wDJBKJZq09Ko7j0K9fP11Mw2BWmGfu3LlYlhV1KRIBzQGiDEg+7zB3bj/yeWXAVMqA6Fgg0ALP4L/00ksAjBo1CvtjVwlp164dQ4cOpby8nJUrV/L5z3/+qI9TUVHBtm3bGD9+PB07duSFF15gw4YNpFIpLrnkEj772c+e0n6cTr7vs379evr3768ntKECq4hbb72ZIAiiLqXFivNXggVBQHV1NR06dMC2bSO+Ekwa0nFAiop8br55PU880Z9cThkwkTIgOhYItMAF/qZNmwDo06fPEW/v06cP5eXlvPnmm8dc4K9atQqAs88+m9LSUtavX9/g9uHDh/Pss8/yiU984qiPUVNTQ01NTeHP+/btAyh8rqXu/47jNGh7nodlWYW2bdvYtn3Udj6fx3GcQtt1XSzLKrQBPM9r0E4kEoRhWHicVCqF53k4jkMYhqRSKSBLgEOAi0sNAS4BDi41+LiE2Ljk8HEBG4ccPrW7Ghzy+BQBAQ4eHkVYhXYSGx+70Paw8fFIYZPDJiBPCqfQTuNSg1VoZ4EQjzQuGcDCI0WCDCE2HkkSZAiw8SkiQZYAm4Ai3I/1KbRckkmnMB5hGOK6Lr7vFxa7oZXAb0V9Oqlxsmx2795NGIb4vl/IXt1n8gMrSdDa+tTIcQrJAQFBUPtf/efTjh07GDRwAB/sqSYMQ9LpNJlMBsuySKVSZDIZbNsmmUwW2kVFRWSz2QZtx3FwXZeamhpc18VxnELbtm1yuVyDdt0uoXw+T1FREUEQ4Hleg3YymcT3/ULb8zx83yeVSpHL5QiCoEE7nU5TU1NTaNfVde211/LMM8/g+z6dOnZgzdp1dO/evTBfBEGA7/uFdhAEuK571PbHn09HmuuinPfUp4Z9siyrkKUT6RNw6P4hngfJpIfn2fi+TSrlkcvZBIFNKpUnl3MIApt0Ok9NjUsQWKTTebJZlzCEdNojk3GxLEilPDKZBLYdkkzWtQOKinyy2bp2QDbr4jgBrhtQU+PiugGOU9f2se2QXK6uXXvxsLrPFefzDkVFPkEAnudQVOQRBBae55BMevi+jefZ9foEqVSqMB/WjRNw6PkUEgS0sj4dPk5BALt3p0km83ie/bFxqp33wjBskLcwDAvHStsOKSrKt6g+nZrsUfg3qP98AnDdENv2WmGfascpkfDYvTuNbQckk+FRxikgl6PB64XWOu/FcS5vjj7VrgFocp927tzJ+++/TxiG2LZdmD+aow1gWRZBEGBZ1ilpA4XjY137aHV17dqVc889t0VnrzHX2WpxW/T37t0LQPv27Y94e93Pq6urj/k4u3btAuAnP/k
JmUyGJUuWsH//fjZs2MDo0aNZunQp11xzzTEf44EHHqB9+/aF/7p37w7Ahg0bANi4cSMbN24EYP369WzevBmAtWvXsnXrVgBeffVVduzYAdTuKti5cycAS5cuLZxNXLJkSaE/5eXl7N+/H4CFCxeSzWbxPI+FCxfieR7ZbJaFCxcCsH//fsrLy3Ech7POOqtw0cBsNsvDDz8MwE5nCBWpmQDscEfwanIaAFvdMaxN3g7A5sR41hfdXNunoolsLJpY26eim9mcGF/bp+TtbHVrv3Hg1eQ0drgjavuUmslOZ0htn9IPU+X0r+1T+jGq7do3acrbzGG/VVzbp7bzyVqd8EizsO18PNJkrU4sbDu/tk9WMeVt5gBQbfdhSfoxAKqc/ixNH96nAx1GMG3aoT5t3cratWtr+7R5c+HftPqs1tWnkxmn/V3G8cwzz7Bnz54G2Ttw4AAA7/dqfX1q7Dhlz6jt03vvvXfY86mqqoo5T81l3h2dWHV/mvnz57Pq/jT/80An5s+fz+r7oOKhYp6ZN4fV98HyWX341c8fY/V9sPSH/Xn2pw+z+j54+ZEh/GbuTFbfBy/+eAQLnpzG6vtg8b+N4bdP3M7q+6D88fG88O83s/o++P1PJvL7n0xk9X3wwr/fTPnj41l9H/z2idtZ/G9jWH0fLHhyGi/+eASr74PfzJ3Jy48MYfV98OxPH2bpD/uz+j741c8fY/msPqy+D56ZN4eKh4pZfR/Mnz+f/3mgE698N8H48eN55bsJ5t3RiTlPzaWqqqowR0DtnLlkyZLacaqqYunSpbXjtHMnFRUVteO0Ywevvvpq7Th97PlU9yZpS5n31KeGfap7QfDnP//5hPs0bdo0RoyonSNmzqxgyJDaPj388FL696/t02OPLaFPn9o+zZlTTnFxbZ/mz19Ip05Z0mmP+fMXkk57dOqUZf782j4VF+9nzpzaPvXpU81jj9X2qX//Kh5+uLZPQ4bsZObM2j6NGLGDadNq+zRmzFZuv712nMaP38zNN9eO08SJG5k4sbZPN9+8nvHja/t0++1rGTOmrk+vMmLEjiP06WGy2exh4zRnzhyKi71W2qeG49Sr136eeeYi/uM/XjzCOIXMnz+fMAwPy9677757qE+5Ften5s/eX4HarxGr/3yqu3jzmDEftsI+fTRO3/nOSp555iIuvfTdY4xT7e+vrq5u9fMexG8ub2qfVq5cyZlnnonjOE3uU0lJX66++mo2b95MaWkp119/Pa+//jqlpaXcdNNNvPLKK5SWljJlyhRefPFFSktLmTZtGr/73e8oLS3lu9/9Lr/85S8pLS3lBz/4AT/96U8pLS1l9uzZzJ49m9LSUn7605/ygx/8gNLSUn75y1/y3e9+l9LSUn73u98xbdo0SktLefHFF5kyZQqlpaW88sor3HTTTZSWlvL6669z/fXXU1payubNm7n66qspLS2lsrKS0aNHM2zYMCorKxk2bBijR4+msrKS0tLSI/appKQv//u//9vis3eirLCFXXb7H/7hH3jiiSd44oknuOmmmw67/V/+5V944IEHeOCBBwoLuyP51re+xaxZs7Btm3Xr1vGpT32qcFsmk+HCCy/knXfeoaKi4qjb9Y90Br979+588MEHdOzYscW8U2hZFmvWrKF///6kUilWr17NpZdeyopvZxnQK95n8Fdvcxn6XYeKigouvvjiBu+qrV27lsGDB/Pa9xMM6Nl6+nQy47TmbZdf7bmV8ePHU1paWsje66+/zqc//WlWfT/JoJ6tq0+NHafXt+b49LcDVq1axaBBgxo8n9auXcull17KsnuyDOrVevp0ouPkkWBN8hsMqvkh67fmGfb9FMuXL2fgwIEt4mxCHM+QtLQ+AaxZs4aLL764cCb/WH16/fXXKSsrw/dX4HmlMT+Dv45UaijLly+ntLS0ME7r1q3j0ksvpaZmGUFQ2sr6dPg4QcjXv/46//mf/di/P/WxcVpDOj2MZcuWMWjQoAb
ZW716NYMHD8a2X6OoqH+L6lPzZ28N2exgXnvtNS6++OLC82nNmjUMHjwY130N2764lfXpo3Fq0ybH1772//HYYxcTBPZRxmktuVztv8GAAQNa9bwXx7m8qX3KZrOsX7+eQYNqv/70ZPv00bwwj2SyhEzGPrTLJySbbdh2nBDXDampsXHdEMf5qF2bvYbtRKJuN5VFUVFw6DnUsJ1MBvj+R23Ps/B9i1QqIJezCIKG7XQ6oKbmo3Y2ax16PoVkMtah51NY6EcyGdbr0xtksxMPmxdaWvYOHjxIhw4d2Lt3L2eeeSbH0uK26Nedoa87k/9xddvkj3aGv07Hjh0BOP/88xss7qF2S97o0aOZM2cOr7766lEX+MlkkmQyedjP67b21f9sS/123ZPjRNv1L/bXmLZlWSQSidotuZ06Nfh53bs8tQsH/1Dbw6b2TIVz6P+Ht/P12rmP6m3QrjlK+6N3lhIN2pnjtMNC2yIotG0CbLJHaH/UJyv0qKk51KePjUfdNRysME/dLa2hTyczTnYYsGnTJhzHKfw71E0KAHZYU9iu01r6VOdEx6nu8oJ1kyQ0fN5kMhkswGpFfapzvHGyCejs/y82ARYhmcyhPh2aIz7+73Ii7aPNby1l3lOfGvap7jhQV8+J9Kn2DWzrUPujn2ez9dv1n0PHbofhR+0gsOq1bbJZ+7C279cugAA8r3ZhVNv+qN767foXDqv/+eJcrn6fjtzOZrOF+fDj80Ldv0Hr61PDcXJdn02bOnLgQBFB8PE+WYWPJdXPm2VZhSwFgVUY75bSpzrNnT3LsgrPhfrPJ8+zqHtp3Nr65Ps2mUyCTZs6ks87hfoPH6eP/g2O9Hq2Nc17J9o2qU+JRIJOnTo1GN+T6dNH80JfMplBh9pQdxK5ftv3a/8D8Lza/+radeq363+JWS535Ha986sN2vVPYtdvZzLHbtc+nz6qvX47m62dL482L7SU7DXmQtotbot+SUkJAG+++eYRb6/b8nDhhRee0ON06NDhiLfXvQGQqZ+CVspxHC644IIGgRKzWKHH888/r6voG8rB4wLv+QZvLohZdBwQz3N4/vkLGizoxCzKgOhYINACF/iXXXYZUPu5g49fEXz//v2sWLGCdDrNZz7zmWM+zvDhw3Fdl7feeotc/beEDqn7HH3Pnj2bp/AIeZ5HRUUFnqcX96YKrCTTp08/7DkjZvBIUpGcjsfhO47EDDoOSDLpMX16BcmkMmAqZUB0LBBogQv83r17M2rUKLZt28bs2bMb3DZ9+nQOHDjAV77yFdq2bQvUXg33jTfeYMuWLQ3u26VLF7785S9TXV3N/fff3+C2P/7xjyxatIj27dvzhS984dR26DSwbZvi4uLC9hExj4XPihUrdAbfUDY+xf6KwscHxDw6Dojv26xYUVzYTi/mUQZExwKBFvgZfIDHH3+csrKywlUZ+/bty8qVK3nppZe48MIL+f73v1+4b2VlJX379qVHjx5s27atweP88Ic/ZOXKlcycOZOXXnqJwYMH8/bbb/Ob3/wGx3F44oknjrqFvzWxbZsePXpEXYZEyAo9Fi9erAW+oWw8eniLoy5DIqTjgHiezeLFyoDJlAHRsUCgBZ7Bh9qz+K+99ho33HADK1eu5F//9V/ZsmULU6ZM4ZVXXqFz584n9Dhdu3Zl5cqV3HnnnWzfvp1HH32UJUuWcOWVV7Js2bLjfk1ea+F5HkuXLtV2HIMFVpIHH3xQW/QN5ZFkaepBbdE3mI4Dkkx6PPjgUm3PNpgyIDoWCLTQM/gA3bt3Z+7cuce9X8+ePTnWN/116tSJH/7wh/zwhz9szvJaFNu26d27t7bjGKzuInuXX3551KVIBGw8euefL1zVX8yj44B4ns3zz/cuXOVezKMMiI4FAi14gS8nru7zNmIuC5+Kigpt0TdU7WfwK6IuQyKk44D4vk1FhTJgMmVAdCwQaKFb9KVxPM9jyZIl2o5jsMBO8eijj2qLvqE8UixJP4p
HKupSJCI6Dkgq5fHoo0tIpZQBUykDomOBgBb4sWDbNv369dN2HINZQY6nnnpKZ/ANZZOjX+4pbA7/SlAxg44DksvZPPVUP3I5ZcBUyoDoWCDQxAX+rl27mqsOaQLbtunatauezAazCFi3bp0W+IayCejqr8NGOzhMpeOABIHNunVdCQJlwFTKgOhYINDEBX737t358pe/zJIlS5qrHjkJ+XyeRYsWkc/noy5FIhLYKZ588klt0TdUnhSL0k+S1xZ9Y+k4IKlUniefXEQqpQyYShkQHQsEmrjAv/DCC/nVr37FFVdcwYUXXsi//uu/snv37uaqTU6Q4zgMHjwYx3GiLkUiYgU5Zs2apTP4hnLIMbhmFo626BtLxwHJ5RxmzRpMLqcMmEoZEB0LBJq4wP///r//j2XLlnH99dfzzjvvMHXqVM4991wmTpzIsmXLmqtGOQ7btunUqZO24xjMImDTpk1a4BvKJqBTsElb9A2m44AEgc2mTZ20PdtgyoDoWCDQDBfZGzp0KD/72c949913+eEPf0ivXr14+umnGTFiBJ/85Cd59NFHqa6uboZS5Wjy+TwvvPCCtuMYLLDTPP3009qib6g8aV5o8zR50lGXIhHRcUDS6TxPP/0C6bQyYCplQHQsEGjGq+h36NCBO+64g//93//l5ZdfZsKECWzdupU777yT4uJibrzxRl577bXm+nVSj+u6DBs2DNd1oy5FImIFNdx11106g28olxqGZe7CpSbqUiQiOg5ITY3LXXcNo6ZGGTCVMiA6Fgicoq/J69atG2effTZt27YlDENqamr4r//6L4YMGcLf/d3f6Yx+M7MsizPPPFOLO4NZBOzYsUMZMJRFwJnhDixt0TeWjgMSBBY7dpxJECgDplIGRMcCgWZc4OfzeX7xi1/w+c9/nosuuogf/vCHfOITn+CRRx6hqqqKxYsXc8UVV/Cb3/yGW2+9tbl+rVD7b79gwQJtxzFYYKd57rnntEXfUHnSLGj7nLboG0zHAUmn8zz33AJtzzaYMiA6FghAk/dvvPXWW/znf/4n//Vf/0VVVRWO43D11Vdzyy23MHLkyML9Ro4cyciRIxk3bhwLFy5s6q+VelzXZdSoUdqOYzAryDJ58mQWLVoUdSkSAZcsow5OxiUbdSkSER0HJJt1mTx5FNmsMmAqZUB0LBBo4gL/8ssv56WXXiIMQ8455xzuvfdebr75Zs4555yj/p3S0lJ++9vfNuXXyhHoiWy6kIMHD0ZdhEQmxA0PAmHUhUiEdBwwWxjCwYMuoaYBYykDAjoWSBO36C9ZsoQRI0bwq1/9irfffpvp06cfc3EPMG7cOJ566qmm/Fr5GM/zWLhwIZ7nRV2KRCS008yfP59QR3UjeaRZ2HY+nrboG0vHAUmnPebPX0g6rQyYShkQHQsEmngGf+PGjZSUlDTq73zqU5/iU5/6VFN+rXyM67qMGTNG79gZzAoyTJgwgWXLlkVdikTAJcOYAxNwyURdikRExwHJZFwmTBhDJqMMmEoZEB0LBJp4Bv8Xv/gFS5cuPeZ9li1bxne/+92m/Bo5AXqnznQWbdq0iboIiYyFZ7UBdNVck+k4YDbLgjZtPHTxbHMpAwI6FkgTF/gzZszg5ZdfPuZ9li5dysyZM5vya+Q4PM+jvLxcT2iDhXaKOXPmaIu+oTxSlLeZg0cq6lIkIjoOSCrlMWdOOamUMmAqZUB0LBBoxq/JOxrP87DtU/5rjJZIJLjqqqtIJBJRlyIRsYMM48aN03PNUAkyXHVgHAlt0TeWjgOSySQYN+4qMhllwFTKgOhYIHAaFvhr166lS5cup/rXGC0MQ/bt26eztwYLsenevbsyYKgQm31Wd8JTP6VLC6XjgNh2SPfu+7BtZcBUyoDoWCBwEhfZq//d9gA//elPj7hN3/d9duzYwdtvv82ECRNOukA5Ps/zWLZsGaNGjdI7doYK7SQPPfSQJnRDeSRZln6IUQcng87iG0nHAUkmPR5
6aBmTJ4/SGVxDKQOiY4HASSzw6y/mLcti27ZtbNu27bD72bZN586d+fKXv8wjjzzSlBrlOBKJBFdeeWXUZUiE7CDDddddx+rVq6MuRSKQIMOVB6+LugyJkI4DkskkuO46ZcBkzZGB7du3U1VV1UwVtWxdunThvPPOi7qMZqVjgcBJLPCDICi0bdtmxowZ3Hvvvc1alDROEARUV1fToUMHfQbbUCE2JSV9dAbfUAE21XYfOgSbgeC495f40XFAbDugT59qNm/uQBAoAyZqaga2b99OSUlfstmDp6C6lieVasOmTRtjtcjXsUDgJBb49c2dO5eBAwc2Vy1yknzfZ9WqVYwcOVJPZkOFdhFTp07VAt9QPkWsSk5lZOY2IBt1ORIBHQekqMhn6tRV3HbbSLJZZcBETc1AVVXVocX9PKBvs9fXsmwkm51IVVVVrBb4OhYINHGB/9WvfrW56pAmSCQSjB49OuoyJEJ2kOWmm27SFn1DJcgyOnNT1GVIhHQckGw2wU03KQMma74M9AUGNcPjyOmmY4FAIxf4S5cuBeCSSy4hlUoV/nwihg8f3rjK5IQFQUBVVRVdunTRu3WGCrEZMKC/zuAbKsCmyulPF3892qJvJh0HxLYD+vevYv36LtqibyhlQHQsEGjkAn/EiBFYlsXGjRu58MILC38+Eb7vn1SBcnxBELBhwwaGDx+uJ7OhQruISZMmaYFvqIAiNhRNYnjmW2iLvpl0HJCiooBJkzbwrW8N1xZ9QykDzaM1X2gwCAL++te/ctZZZ53QsSCOFxqURi7w7733XizLKnyvfd2fJVqu6x729YViFjvIMmXKFG3RN5RLlpGZKVGXIRHScUCyWZcpU5QBkykDTacLDUocNGqBP2PGjGP+WaIRBAE7d+6kW7duOnNjqBCHsrIhOoNvqACHnc4QuvkrAe2WMpGOA+I4AUOG7GTlym74vjJgImWg6Vr7hQYdJ2TIkAwrV6bx/eOdhI3nhQaliRfZk5YhCAK2bNlywttxJH5Cy2Xs2LFa4BsqwGVLYixn+avRAt9MOg6I6waMHbuF1avP0uLOUMpAc2qdFxp0XY+xYytYvfpifF/LPFPp2R8DrusyfPhwXFdPZFPZYQ3Tpk3TC3tDudQwPDsNl5qoS5GI6DggNTUu06YNp6ZGGTCVMiDKgEAjz+Cf7Of7LMvixRdfPKm/K8cXBAE7duyge/fuWuAZKrRcLr98hM7gGyrAZYc7gu7ey4AXdTkSAR0HxHUDRozYwcsvd8fzlAETKQOiDAg0coH/8ssvn9Qv0YX4Tq0gCKisrKS4uFgv7AwV4jB06FAt8A0V4FDpDKXYW4YW+GbScUAcJ2Do0EqWLSvWC3tDKQOiDAg0cot+EAQn9Z++Iu/Ucl2XsrIybc00mB3WMHPmTL2wN5RLDWU1M7VF32A6DkhNjcvMmWXammswZUCUAQF9Bj8WfN/nrbfe0hspBtNF9szm4/KWOxZf1001lo4D4ro+Y8e+hesqA6ZSBkQZENACPxbCMGTPnj1a3BksxKakpEQZMFSIzR6nhFBTurF0HBDbDikp2YNtKwOmUgZEGRBo5Gfwly5dCsAll1xCKpUq/PlEDB8+vHGVyQlzXZfBgwdHXYZEyA5zzJo1i2uvvTbqUiQCLjkG18w67v22b99OVVXVaagoel26dDnq9/rG9d/BcRzWr1/f4GfH+neQeMnlXGbN0msBkykDogwINHKBP2LECCzLYuPGjVx44YWFP58IbRs8dXzfZ/PmzfTp0wfHcaIuRyIQWi7XXjteZ+8M5eOyOTGePvlnOdpF9rZv307fi0o4mMme3uIi0iadYuMbmw5b3G7fvp2Skr5kswcjquzUcF2X8ePH8+yzz+J5H2UglWrDpk0btcg3gOv6jB+/mWef7YPn6bWAiZQBUQYEGrnAv/fee7Esiy5dujT4s0Qvk8lEXYJEKMSmc+fOWuAbyyZjdeZYn7qqqqriYCbLvFug7zmnr7IobHw
XJj6epaqq6rCFbVVV1aHF/TygbyT1nQq2HdC5czW2/U0+ysFGstmJR/x3kPixbejcOYOutWouZUCUAYFGLvBnzJhxzD9LNBzHYeDAgVGXIRGywxyzZ89m0qRJUZciEXDIMTA3+4Tu2/ccGNTrFBfUKvQFBkVdRLPJ5WD2iUVAYiqXc5g9W68FTKYMiDIgoIvsxYLv+2zYsEEfgzBYaCW48cYbdQbfUD4JNhTdiE8i6lIkIomEz403biCR0HHAVMqAKAOiDAg08gz+sSxbtoy1a9eyd+9e2rdvz8CBAxk2bFhzPbyIiIiIiIiIHEOTF/grVqxg0qRJvPXWW0DtV/XUfS6/T58+zJkzh6FDhzb118gxOI5Dv379oi5DImSFeebOncttt90WdSkSAYc8/XJzoy5DIpTPO8ydq+OAyZQBUQZEGRBo4hb91atXc8UVV7B582aGDx/Ovffey09+8hPuvfdehg0bxptvvsmoUaNYs2ZNc9UrR+D7PmvXrtUWfYMFVhG33norQRBEXYpEwKeItUW34lMUdSkSkaIin1tvXUtRkY4DplIGRBkQZUCgiWfw77nnHjzPY8GCBXzpS19qcNv06dNZsGAB48eP55577uH3v/99kwqVY0un01GXIBGyCNi9e7e+1cJYAelwN6A3eEwVBLB7dxq9x2cuZUCUAVEGBJp4Br+iooK//du/PWxxX+eqq67i6quvpqKioim/Ro7DcRwuuugiHEffd2kqK/R45plntMA3lIPHRflncPCOf2eJJc9zeOaZi/S9xwZTBkQZEGVAoIkLfNu2ueCCC455nz59+mjRcYp5nseqVavwPL24N1VgFTF16lRt0TeURxGrklPxtEXfWEVFHlOnrqKoSMcBUykDogyIMiDQxAX+pz/9aV5//fVj3uf111/nkksuacqvkeOwLIuOHTvqjRSDWQRs2rRJGTCURUBHfxOWtugbKwgsNm3qSBBoDjCVMiDKgCgDAk1c4N9333388Y9/5Cc/+ckRb589ezYvvvgi3/ve95rya+Q4HMfhggsu0BZ9g1mhx/PPP68FvqEcPC7wntcWfYN5nsPzz1+gbZkGUwZEGRBlQKCRF9n77ne/e9jPRo4cyW233caPfvQjhg0bxllnncVf//pXli9fzubNm/nCF75AeXk5Q4YMabaipSHP83j11Ve55JJLcN0mf/OhtEKBlWT69Gnaom8ojySvJqdxSc2DQE3U5UgEkkmPadNe5cEHL6GmRscBEykDogyIMiDQyAX+jBkzjnrb5s2b2bx582E///3vf88f/vAHvvOd7zS6ODkxtm1TXFyMbTdpQ4a0YhY+K1asOOoFLyXebHyK/RXY6GtxTOX7NitWFOP7Og6YShkQZUCUAYFGLvBfeumlU1WHNIFt2/To0SPqMiRCVuixePFibdE3lI1HD29x1GVIhDzPZvFiHQdMpgyIMiDKgEAjF/if+9znTlUd0gSe51FRUUFZWZm26BsqsJI8+OBMbdE3lEeSitRMyrLT0RZ9MyWTHjNnVjB9epm2ZRpKGRBlQJQBgSZeZE9aBtu26d27t7boG0wX2TObjUfv/PPYusiesTzP5vnne+N5Og6YShkQZUCUAYFGnsGXlqnuM/hiLgufiooKLfANVfsZ/Iqoy5AI+b5NRYWOAyZTBkQZEGVAoBnO4L/77rvccsstXHDBBaTTaRzHOew/bRs/tTzPY8mSJXiezt6ZKrBTPProo9qibyiPFEvSj+KRiroUiUgq5fHoo0tIpXQcMJUyIMqAKAMCTTyDv2PHDi655BLef/99PvnJT1JTU0OPHj1IJpP85S9/wfM8BgwYQPv27ZurXjkC27bp16+ftugbzApyPPXUU5SVlUVdikTAJke/3FPY5KIuRSKSy9k89VQ/cjkdB0ylDIgyIMqAQBPP4H/ve99j165dvPDCC6xfvx6AG2+8kTfeeIO//OUvjB49mkwmw69//etmKVaOzLZtunbtqgW+wSwC1q1
bpy36hrIJ6Oqvw0Y7OEwVBDbr1nUlCHQcMJUyIMqAKAMCTVzgl5eXM3r0aEaPHn3Ybeeeey6/+tWvyGQyTJ8+vSm/Ro4jn8+zaNEi8vl81KVIRAI7xZNPPqkt+obKk2JR+kny2qJvrFQqz5NPLiKV0nHAVMqAKAOiDAg0cYH/3nvv0a9fv8KfHcchk8kU/nzGGWdwxRVXsGDBgqb8GjkOx3EYPHgwjuNEXYpExApyzJo1S2fwDeWQY3DNLBxt0TdWLucwa9ZgcjkdB0ylDIgyIMqAQBM/g3/mmWeSy330grJjx45UVlY2uE/79u15//33m/Jr5Dhs26ZTp05RlyERsgjYtGmTFviGsgnoFGyKugyJUBDYbNqk44DJlAFRBkQZEGjiGfwePXqwY8eOwp8vvvhilixZwsGDBwEIgoDy8nLOPffcplUpx5TP53nhhRe0Rd9ggZ3m6aef1hZ9Q+VJ80Kbp8mTjroUiUg6nefpp18gndZxwFTKgCgDogwINHGB//nPf56XXnqpsLD86le/yrvvvktZWRlTp05l6NCh/PnPf+bLX/5ysxQrR+a6LsOGDdPXERrMCmq46667dAbfUC41DMvchUtN1KVIRGpqXO66axg1NToOmEoZEGVAlAGBJm7Rnzx5Mh07dqSqqopu3boxceJEVq9ezb/9278Vrqp/7bXXcs899zRLsXJklmVx5plnRl2GRMgiYMeOHVrgG8oi4Mxwx/HvKLEVBBY7dug4YDJlQJQBUQYEmngGv0+fPtx1111069at8LNHHnmEnTt38sorr7Bz506efvppUild2flUyufzLFiwQFv0DRbYaZ577jlt0TdUnjQL2j6nLfoGS6fzPPfcAm3LNJgyIMqAKAMCTVzgH80nPvEJhgwZwllnnXUqHl4+xnVdRo0apS36BrOCLJMnT9YZfEO5ZBl1cDIu2ahLkYhksy6TJ48im9VxwFTKgCgDogwINHGLfn07duxg7dq17N27l/bt2zNw4EC6d+/eXA8vx6HFvenCwsUtxUQhbngQCKMuRCIShnDwoEuoCBhLGRBlQJQBgWY4g79582auuOIKevbsydVXX80NN9zA1VdfTc+ePbniiit48803m6NOOQbP81i4cCGe50VdikQktNPMnz+fUDO6kTzSLGw7H09b9I2VTnvMn7+QdFrHAVMpA6IMiDIg0MQz+G+99RZlZWXs3r2b3r17c+mll3L22Wfz3nvvsXz5cl588UUuvfRSKioquOCCC5qrZvkY13UZM2aMzuIbzAoyTJgwgWXLlkVdikTAJcOYAxNwyURdikQkk3GZMGEMmYyOA6ZSBkQZEGVAoIkL/Lvvvpvdu3fz4x//mFtvvRXb/mhDQBAE/Nu//Rt33nkn//Iv/8Ivf/nLJhcrR+d5nhb4RrNo06ZN1EVIZCw8qw1umEXb9E/UxqgLaFaWFdKmjU826xCGddfiiFcf5dgsC9q08chmtT3XVMqAKAMCTVzgv/jii4wZM4avf/3rh91m2za333475eXlLF68uCm/Ro7D8zzKy8sZM2YMiUQi6nIkAqGdYs6cOdqibyiPFOVt5jDmwAQ4zln8je+enpqidKw+7ty5E9uCIJx4+go6DVKpNHPmzGfChAlkMh9lwLZq+yzxl0p5zJlTfujsnV4LmEgZEGVAoIkL/Fwux4ABA455nwEDBrB06dKm/Bo5jkQiwVVXXRV1GRIhO8gwbtw4Vq9eHXUpEoEEGa46MO6Y96ld5NlMfNyUr1K0j7iwra6uJghh3i3Q95wIyjplMrBhHMvv+egnG9+FiY/X9lniL5NJMG6cXguYTBkQZUCgiQv8iy++mLfeeuuY93nrrbfo379/U36NHEcYhuzfv5927drpa9IMFWLTvXuxzuAbKsRmv1VMu7ASOPICvnaRFwDzgL6nr7hIbAQmHnNh2/ccGNTrtBV0ytXPgHWUDEi82XZIcfF+KivbEQR6LWAiZUCUAYFm+Az+3/7t3/L73/+
ev/mbvzns9hdeeIHf/OY3LFiwoCm/Ro7D8zyWLVvGqFGjtEXfUKGd5KGHHtIC31AeSZalH2LUwckcb4t+7eJ+0GmoSk6n+hlI6GKLRkomPR56aBmTJ4/S1lxDKQOiDAg0coH/s5/97LCf/c3f/A1f/OIX+fznP8/w4cM566yz+Otf/8qf/vQnlixZwtixY3n//febrWA5XCKR4Morr4y6DImQHWS47rrrtEXfUAkyXHnwuqjLkAgpA5LJJLjuOr0WMJkyIMqAQCMX+DfccMNhW8DrzhguXrz4iBfTW7BgAc8//zxf+cpXmlCmHEsQBFRXV9OhQ4cG32Qg5gixKSnpozP4hgqwqbb70CHYzNG26Eu81c+ArQwYybYD+vSpZvPmDgSBXguYSBkQZUCgkQv8uXPnnqo6pAl832fVqlWMHDlSC3xDhXYRU6dO1QLfUD5FrEpOZWTmNiAbdTkSgfoZsJUBIxUV+UyduorbbhtJNqvXAiZSBkQZEGjkAv+rX/3qqapDmiCRSDB69Oioy5AI2UGWm266SVv0DZUgy+jMTVGXIRFSBiSbTXDTTXotYDJlQJQBAdBbOzEQBAG7du0iCLQt01QhNgMGDNAZfEMF2OxyBhBoSjeWMiC2HTBgwC5sW68FTKUMiDIg0EwL/AMHDjBv3jy+8Y1vMHnyZL7xjW8wb948Dhw40BwPL8cRBAEbNmzQAt9goV3EpEmTtMA3VEARG4omEVAUdSkSEWVAiooCJk3aQFGRXguYShkQZUCgiV+TB/Db3/6WG2+8kT179jRYXFiWxZ133sncuXP54he/2NRfI8fgui4jR46MugyJkB1kmTJlirboG8oly8jMlKjLkAgpA5LNukyZotcCJlMGmtPGqAs4KdksTJnSAVh/AvdunX2U42vSAv+1115j/Pjx+L7PhAkTuPzyy+nWrRs7d+5kyZIlzJ8/n/Hjx7NixQpKS0ubq2b5mCAI2LlzJ926ddNF9gwV4lBWNkRn8A0V4LDTGUI3fyXgR12ORKB+BmxlwEiOEzBkyE5WruyG7+u1gImUgabbuXMntgVBODHqUk6K4zgMGTKElStX4vvHPxbYVm2fJV6atMC///77sW2bl156ibKysga33XDDDdx6662MGDGC+++/n//3//5fkwqVowuCgC1btnDWWWdpgW+o0HIZO3asFviGCnDZkhjLWf5qtMA3U/0MaIFvJtcNGDt2C6tXn6XFnaGUgaarrq4mCGHeLdD3nKirabzAcnm/11g+ceVq7PDYx4KN78LEx2v7LPHSpAX+8uXLueaaaw5b3NcZMmQI48ePZ9GiRU35NXIcrusyfPjwqMuQCNlhDdOmTdMWfUO51DA8Oy3qMiRCyoDU1LhMm6bXAiZTBppP33NgUK+oqzgZNRBOg55R1yFRatICf+/evXTv3v2Y9znvvPPYt29fU36NHEcQBOzYsYPu3bvrDL6hQsvl8stH6Ay+oQJcdrgj6O69DHhRlyMRqJ8BWxkwkusGjBixg5df7o7n6bWAiZovAyZ8NjuefdSxQKCJC/xzzjmHVatWHfM+r732Gt26dWvKr5HjCIKAyspKiouLtcA3VIjD0KFDtcA3VIBDpTOUYm8ZWuCbqX4G9KLOTI4TMHRoJcuWFWuBb6imZqC1f/68seL4+XMdCwSauMD/m7/5G/7jP/6DH/zgB3zjG99osLgMgoBHHnmExYsX87Wvfa3JhcrRua571I9JiBnssIaZM2cyduzYqEuRCLjUUFYzM+oyJELKgNTUuMycqdcCJmtqBlr7588bI66fP9exQKCJC/zvfOc7PPfcc9x11108/vjjDBs2jLPPPpv33nuP5cuXs23bNs4++2y+/e1vN1e9cgS+77N161Z69eqF4zhRlyMRqL3I3hidwTeUj8tWdwy9vIXoDL6Z6mfAUQaM5Lo+Y8ZsZeHCXnieXguYqLky0Ho/fy46FghAk/ZwdevWjeXLl/P5z3+ebdu28fOf/5xZs2b
x85//nK1bt3L55ZezfPlybdE/xcIwZM+ePVrcGSzEpqSkRBkwVIjNHqeEsGlTurRiyoDYdkhJyR5sW8cBUykDomOBQBPP4AOcf/75lJeXU1lZydq1a9m7dy/t27dn4MCBFBcXN0eNchyu6zJ48OCoy5AI2WGOWbNmce2110ZdikTAJcfgmllRlyERUgYkl3OZNUuvBUymDIiOBQJNPIN//vnn80//9E8AFBcX88UvfpHrr7+eL37xi1rcn0a+7/PGG2/g+/ruY1OFlsu1116rM/iG8nF5I3EtftPfs5VWShkQ1/W59to3cF29FjCVMiA6Fgg0cYG/a9cuOnTo0EylSFNkMpmoS5AIhdh07txZC3xj2WSszjRxSpdWTRkwnW1D584Z9GU65lIGRMcCgSaO/ic/+Un+8pe/NFctcpIcx2HgwIG6wJ7B7DDH7Nmz9TWJhnLIMTA3G4dc1KVIRJQByeUcZs8eSC6n1wKmUgZExwKBJi7wb7vtNn7729+yfv365qpHToLv+2zYsEFb9A0WWgluvPFGncE3lE+CDUU34pOIuhSJiDIgiYTPjTduIJHQawFTKQOiY4FAEy+y17NnTz7/+c8zdOhQ/uEf/oFLLrmEs88+G8uyDrvv8OHDm/KrREREREREROQYmrTAHzFiBJZlEYYhjzzyyBEX9nV0dvnUcRyHfv36RV2GRMgK88ydO5fbbrst6lIkAg55+uXmRl2GREgZkHzeYe5cvRYwmTIgOhYINHGBf++99x5zUS+nh+/7rF+/nv79++tz+IYKrCJuvfVmgiCIuhSJgE8R64tupn/uCdDn7oxUPwP67KWZiop8br55PU880V+fwTaUMiA6Fgg0cYE/Y8aMZipDmiqdTkddgkTIImD37t16w81YAelwN6A3eMylDJguCGD37jR6n9dcyoDoWCDQhIvs7dixg1//+tf8+te/Zvv27c1ZkzSS4zhcdNFFOntvMCv0eOaZZ7TAN5SDx0X5Z3Dwoi5FIqIMiOc5PPPMRXieXguYShkQHQsETnKBf9ddd3H++edzzTXXcM0113D++eczderU5q5NTpDneaxatQrP05PZVIFVxNSpU7VF31AeRaxKTsWjKOpSJCLKgBQVeUyduoqiIr0WMJUyIDoWCJzEAv8Xv/gFs2bNIggCLrroIkpKSgD44Q9/yPz585u9QDk+y7Lo2LGjzt4azCJg06ZNyoChLAI6+puwtCXPWMqABIHFpk0dCQIdB0ylDIiOBQInscB/4okncF2XxYsX8+c//5n//d//5Y9//COO4zBnzpxTUaMch+M4XHDBBdqibzAr9Hj++ee1wDeUg8cF3vPakmcwZUA8z+H55y/Q9myDKQOiY4HASSzwX3/9dcaNG8dll11W+Nlll13GVVddxbp165qzNjlBnudRUVGhLfoGC6wk06dP1xZ9Q3kkqUhOxyMZdSkSEWVAkkmP6dMrSCb1WsBUyoDoWCBwEgv8PXv2FLbl11dSUkJ1dXVz1CSNZNs2xcXF2PZJXzNRWjkLnxUrVugMvqFsfIr9Fdj4UZciEVEGxPdtVqwoxvf1WsBUyoDoWCBwEl+TFwQBiUTisJ8nEgnCMGyWoqRxbNumR48eUZchEbJCj8WLF2uBbygbjx7e4qjLkAgpA+J5NosX67WAyZQB0bFA4CSvoq9FRMvieR5Lly7VFn2DBVaSBx98UFv0DeWRZGnqQW3JM5gyIMmkx4MPLtX2bIMpA6JjgcBJLvBnzJiB4zgN/vvud78LcNjPHcfBdRu9UUAawbZtevfurS36BtNF9sxm49E7/zy2LqpjLGVAPM/m+ed743l6LWAqZUB0LBA4iS36QKO34mvr/qlV9xl8MZeFT0VFhRb4hqr9zF1F1GVIhJQB8X2bigq9FjCZMiA6FgicxBn8IAhO6j85dTzPY8mSJdqib7DATvHoo4/quWYojxRL0o/ikYq6FImIMiCplMejjy4hldJrAVMpA6JjgcBJbtGXlsW
2bfr166ct+gazghxPPfWUzuAbyiZHv9xT2OSiLkUiogxILmfz1FP9yOX0WsBUyoDoWCDQghf477zzDpMmTeKcc84hmUzSs2dP7rjjDvbs2XPSj/nzn/8cy7KwLIsnn3yyGauNlm3bdO3aVQt8g1kErFu3Tgt8Q9kEdPXXYaMdHKZSBiQIbNat60oQ6LWAqZQB0bFAoIUu8Lds2UJpaSlz587lkksu4c477+T888/nxz/+MZ/97GfZvXt3ox9zx44dfP3rX+eMM844BRVHK5/Ps2jRIvL5fNSlSEQCO8WTTz6pLfqGypNiUfpJ8tqSZyxlQFKpPE8+uYhUSq8FTKUMiI4FAi10gX/LLbewa9cuHn30UZ577jkefPBBlixZwp133smmTZu45557GvV4YRhy44030rlzZ772ta+doqqj4zgOgwcPxnGcqEuRiFhBjlmzZukMvqEccgyumYWjLXnGUgYkl3OYNWswuZxeC5hKGRAdCwRa4AJ/y5YtlJeX06tXL2699dYGt82cOZO2bdvys5/9jA8//PCEH/PRRx9lyZIlzJ07l7Zt2zZ3yZGzbZtOnTppi77BLAI2bdqkBb6hbAI6BZu0Jc9gyoAEgc2mTZ20PdtgyoDoWCDQAhf4L730EgCjRo06bMHarl07hg4dSiaTYeXKlSf0eBs3bmTatGncfvvtDB8+vFG11NTUsG/fvgb/Afi+X/j/kdqe5zVo122bPlo7n883aNd9rWBdOwzDw9pAoZ3P5/nd735HJpMp/DyVqt2aE+DgkTzUdgttHxePokLbL7QT+CQOtYvwD32TotegnSRo0HYOtVMEhyKVb9BOEzZoW4SFNoRY5EnX1o5daAfYhS1GAXbhiqD1+xRaLslksjAGdd8k4Pt+4d80tFpXn05qnJx2PP3004dlry5LgdUK+9TIcaqrvf43d9R/PqXTra9PJzpOOdL8rs3T5A79OZ0+1Kd68wVQmBdsOyhcZdlxApLJ2rbr1m/7FBXVb9fmKpHwSSRq20VFPq5b1/YK7WTSw3WDQttxgkO/38O269r5QjudzmPbYaFtWbWjk07na0fJqmuDbddvB4WtqA37FBbmhSAIGswLdUKr9c57R8pe/lAGspxZ6FNoJQr9PdLxKZlM4rphhON0OrOXanBsrZsj0ul0K+5Tw3Fq27aGp59+gU6dDh6lT+kjvo6o+7ew7bDF9an5sxcU+l03L9Q/Zrhu2Ar79NE4deiQ4emnX+CMM2qOMU4f/Rsc6TVsUVERodU65r269snO5XXHCWj4ujyVSn2sH62nTxk68Ls2T5MnfULj9PHXC3VzxEfzwkbS6deANdj2alKpw9uOs5pksrbtug3bRUWHtxOJ1SQSq4E1FBW9huse3k4mG7Ydp7adSr2GbR/eTqcbti1rNbD6UO2rsazVDfrRsE8bC/8G9eeFI7U/vtY43WvCE9XiFvibNm0CoE+fPke8ve7nb7755nEfy/M8/u///b+cd9553H///Y2u5YEHHqB9+/aF/7p37w7Ahg0bgNo3DzZurA3F+vXr2bx5MwBr165l69atALz66qvs2LEDgIqKCnbu3AnA0qVLqaqqAmDJkiVUV1cDUF5ezv79+wFYuHAh2WwWz/NYuHAhnueRzWZZuHAhAPv376e8vBzXdbn44otZunQpANlslocffhiAnc4QKlIzAdjhjuDV5DQAtrpjWJu8HYDNifGsL7q5tk9FE9lYNLG2T0U3szkxvrZPydvZ6o6p7VNyGjvcEbV9Ss1kpzOktk/ph6ly+tf2Kf0Y1XbtWJW3mcN+q/Z7WRe2nU/W6oRHmoVt5+ORJmt1YmHb+bV9soopbzMHgGq7D0vSjwFQ5fRnafrwPh3oMIJp0w71aetW1q5dW9unzZsL/6bVZ7WuPp3MOO3v/EXuuusuqqurG2TvwIEDALzfq/X1qbHjlD2jtk/vvffeEZ9P8+fPZ9PuTqx+u7ZPq99Os2pHbZ/WbIVX3y3m96k5rNk
KK9/rw6Kix1izFV55vz+LnIdZsxUqdg/hj9ZM1myF5dUjeDGYVtveN4Yl3u2s2QpLD4znpZqbWbMVXs5M5OXMRNZshZdqbmbpgfGs2QpLvNtZvm8Ma7bCi8E0llePYM1W+KM1k4rdQ1izFRY5D/PK+/1r20WPsfK9PqzZCr9PzeHVd4tZs7V2nFbt6MTrb9v4Vhtef9tm0+5OzJ9/aJwOzRFQu9Pnscdqx6l//yoefrh2vhgyZCczZ9Z+Z+6IETuYNu1VAMaM2crtt9c+n8aP38zNN68HYOLEjUycWDvv3XzzesaPr533br99LWPG1GZv2rRXGTGidt6bObOCIUNq572HH15K//61895jjy2hT5/acZozp5zi4rpxWkinTlnSaY/58xeSTnt06pRl/vzaea+4eD9z5tT2qU+fah57bMkR+pRh5sxD2duxg1dfre3T1q1bC29y7PtE6533jvR8cqmhu/cyG4u+UuhT9Vm1fUomk0c8Pk2bNo0RIw5EOE6nM3sPk81ma8ep3jF3zpw5FBd7rbRPDcepe/cPueuuYTz22EtHGKeQ+fPnE4bhYa8j3n333UN9yrW4PjV/9v4KQCaToaKitk87duwoXNtpzJgPW2GfPhqnu+9exV13DaOsbOcxxqn291dXVx/xNeztt9/Oh51ax7wHTXsdMXPmzMLHW+u/Ln/sscfIpVtnn1al7uai3Hxcak5onObPn49lWYetNSorK7EtKC6+mzlzNgOl9OlzPY899jpQSv/+N/Hww68ApQwZMoWZM18EShkxYhrTpv0OKGXMmO9y++2/BEoZP/4H3HzzT4FSJk6czcSJs4FSbr75p4wf/wOglNtv/yVjxnwXKGXatN8xYsQ0oJSZM19kyJApQCkPP/wK/fvfBJTy2GOv06fP9UApc+Zsprj4aqCU+fMr6dRpNOn0MObPrySdHkanTqOZP78SKKW4+OqP9SmLbcG7775bWEvt3LmzwRxR/3VE/bXG+vW1c8TpWhOeKCtszNsBp8E//MM/8MQTT/DEE09w0003HXb7Pffcw/3338/999/P3XfffczHuvfee/n+97/P8uXL+exnPwvAjBkzmDlz5lEfv76amhpqamoKf963bx/du3fngw8+oGPHjoV3ZBzHadD2PA/Lsgpt27axbfuo7Xw+j+M4hbbruliWVWhD7ZsV9duJRKLwTlMikSAIAnzfJ5FIsHr1ai699FJWfDvLgF4OAS4uNQS4BDi41ODjEmLjkjv0DqCNQ67wLqFD/tC7h7XvNXoUYRXaSWx87ELbw8bHI4VNDpuAPCmcQjuNSw1WoZ0FQjzSuGQAC48UCTKE2HgkSZAhwManiARZAmwCinDJEvBRn1Zvcxn6XYeKigouvvhiwjDEdV1832ft2rUMHjyY176fYEDP1tOnkxmnddsCPn2Px6pVqxg4cGAhe6+//jqf/vSnWfX9JIN6tq4+NXacXt+a49PfDli1ahWDBg1q8HxauHAh11zzZbLZg4Rh7ZmsTCaDZVmkUikymQy2bZNMJgvtoqIistlsg7bjOLiuS01NDa7r4jhOoW3bNrlcrkE7kajtUz6fp6ioqPAucP12MpksvCOcTCYL7/amUilyuRxBEDRop9NpampqCu1sNnuEPrXhV7/6BWPGjCnMEf/93//NTTfdRDa7AtseQFFRQDbr4jgBrhtQU+PiugGOU9f2se2QXK6uXfv5zrqzWPm8Q1GRTxCA5zkUFXkEgYXnOSSTHr5v43k2yaSH59n4vk0q5ZHL2QSBTSqVJ5dzCAKbdDpPTY1LEFik03myWZcwhHTaI5Nxsazas2CZTALbDkkm69oBRUU+2Wxdu65Pq3HdocyZM4cJEyYQBEFhXnjmmWeYOHEir33fZUDP1jnvnejzad02+PQ9eebNm8e1117b4Pj0+uuvU1ZWhu+vwPNKIxqn05W9daRSQ1m+fDmlpaWFY+66deu49NJLqalZRhCUtrI+NXac1pBOD2PZsmU
MGjSoweuI1atXM3jwYGz7NYqK+reiPp3MOK0hmx3Ma6+9xsUXX4zrugRBwJo1axg8eDCu+xq2fXEr61Njx2ktuVztv8GAAQMavIZ95plnmDRpEhXTA0p7ts5570Tn8nVbPcq+l2TOnDlcf/31hdfl8+fP56abbmL5t3OU9mpdfWrsOK3dGnDp99M88cQTXHfddQ3WGk8//TQTJ05k3i02JecmsYPa/oV2EXaQ/VjbIbRc7LCG0HIJceq1beww97F2bZ+sME9g1fbDCr2PtZNY+B+1Qw8Ln8BOYQU5LIKPtdNYQU29du04hXYaK6gdp9BO1evHR316469FTPy3LPPmzePLX/5yYV6oe+1Qv+37foO1xpHWgadqTXjw4EE6dOjA3r17OfPMM4+5hnWPeWsLVPd+xPE+a/zqq69y//33881vfrOwuG+sZDLZYPtOnbp3++pf1K5+u+7JcaLtukVAY9uWZZFIJMjn8yxcuJAxY8YUfl73Lk/tE94/1PawObSV69D/D2/n67U/ukCH26Bdc5T2R+8sJRq0M8dph4W2RVBo2wTYZI/Q/qhPVuhRU1O3Pa3heNR9xMMK89Td0hr6dDLjFFppnnvu2Qb/DnWTAoAd1hS267SWPtU50XGqmxHqJkn46LlSXV1NJnMAmAf05dCnWQhDCu0gaNiue6O0ftv3a/8D8Lza/+radeq363+xRS535Ha99xAbtOu/UVu/nckc3k6nA+bPr2TChGIymU1kMhOprq4uzBEfPU72UJ9ssln7UJ9qX4TW1l774rS2/dHzqX47n/+oXf9CTrncR3NaTc2R29ls/fZHdWUyx27XjlPiUO1WvfZH/WjYJwvfr/3HrJ+H+nOEFXr15oXWNe8d6fmUP3RGacyBCTiH+mTVe/u+/rxQp/YNbOtQO4pxOp3Zyxbmw/rPidqPtlmttE8NxymdzjN//m+ZMGEMQfDxPlmFNwDrzwuWZRWeH0FgFca7pfSpTnNnz7KswnOh/hzheRZ1L41bW59836aoyOe55xYwYcKYwv0PH6eP/g2O9Ho2l8sV5o6WPu8d3m7cXF7/JF79uTGb/eg1RWvrU4jNb9v+P8YcmPCxeo88TnUf7/3464U6fc8JGNSj7v4BFB6nfts/9B+Ad+g/6v3/4+363/KQO0q75ijt7FHameO0w3rtoEHbqvc4R5oXjvY64kTazbkmbMx1tlrcAr99+/YA7N2794i3130Ovu5+R1K3Nf/CCy/ke9/7XvMX2cK4rsuoUaMaBETMYgVZJk+ezKJFi6IupYXrCwyKuohml82GTJ78f8hmU7TAT17JaeCSZdTByQ1eeItZslmXyZNHNVhQilmUAdGxQKAFvhIsKSkBjv4Z+7rPNFx44YVHfYwPP/yQN998k40bN5JKpQrvWFuWVfhc5s0334xlWdxxxx3N24GIaHFvupCDBw9GXYREJAzh4MHa7Z1iqhA3PEjtWQoxkeYBUQZExwKBFngG/7LLLgNqLywQBEGDK+nv37+fFStWkE6n+cxnPnPUx0gmk0yePPmIt61Zs4a1a9dy6aWXUlJSctLb91uSugtjjBkz5ojbayT+QjtduICSmKfuwky12zKjrkai4NXbop9AITBRw3lArwVMpAyIjgUCLXCB37t3b0aNGkV5eTmzZ8/m61//euG26dOnc+DAAf7xH/+x8H32+XyeLVu2kEgk6N27N1D7lQ9PPvnkER9/xowZrF27lq9+9avHvchea+G6LmPGjNFZfINZQYYJEyawbNmyqEuRCGQy7qEXdJoDTOWSYcyBCYcu+iQm0jwgyoDoWCDQAhf4AI8//jhlZWVMmTKFF198kb59+7Jy5UpeeuklLrzwQr7//e8X7ltZWUnfvn3p0aMH27Zti67oiNW/8qWYyKJNmzZRFyERsSxo08YrXIVZTGThWW1ww9orB5+4jaeqoBbEhD5qHhBlQODkjwUSJy1yRdi7d29ee+017r33Xv7whz+wcOFCunXrxpQ
pU5g+fTqdOnWKusQWxfM8ysvLtUXfYKGdYs6cOdqib6hUymPOnHJt0TeYR4ryNnNOeFvmzp07sS0Iwomnobro2RaF7xyOq4bzgF4LmEgZkMYeCySeWuQCH6B79+7MnTv3uPfr2bNnoxY1M2bMYMaMGU2orOVJJBJcddVVUZchEbKDDOPGjWP16tVRlyIRyGQSjBunOcBkCTJcdWDcCd+/urqaIIR5t0Dfc05dXS3Bxndh4uO1fY4zzQOiDEhjjwUSTy12gS8nLgxD9u/fT7t27Rr1HYkSHyE23bsX6wy+oWw7pLh4P5WV7QiCqKuRKITY7LeKaRdWYnHiIeh7DgzqdQoLk9Om4Tyg1wImUgbkZI8FEi8t7mvypPE8z2PZsmV4nhd1KRKR0E7y0EMPaYFvqGTS46GHlpFMag4wlUeSZemH8EhGXYpERPOAKAOiY4GAFvixkEgkuPLKK/X5e4PZQYbrrruuwddKijkymQTXXXelPnNpsAQZrjx4nT5zaTDNA6IMiI4FAlrgx0IQBHzwwQcE2ptrrBCbkpISncE3lG0HlJR8gG1rDjBVgM0HdgmBDuvG0jwgyoDoWCCgBX4s+L7PqlWr8H0/6lIkIqFdxNSpU7XAN1RRkc/UqasoKtIcYCqfIlYlp+JTFHUpEhHNA6IMiI4FAlrgx0IikWD06NHaom8wO8hy0003aYu+obLZBDfdNJpsVnOAqRJkGZ25iQTZqEuRiGgeEGVAdCwQ0AI/FoIgYNeuXdqib7AQmwEDBugMvqFsO2DAgF3almmwAJtdzgBtyzSY5gFRBkTHAgF9TV4sBEHAhg0bGD58uM7gGiq0i5g0aZIW+IYqKgqYNGkD3/rWcLJ6095IAUVsKJrE8My3sHXmxkgN5wG9Fjg5G6MuoElqM/BXvvWts46RgdbdRzk2HQsEtMCPBdd1GTlyZNRlSITsIMuUKVNYvXp11KVIBLJZlylTNAeYzCXLyMyUqMuQCGkeOHk7d+7EtiAIJ0ZdSpNkszDlBKYB26rts8SPjgUCWuDHQhAE7Ny5k27duukMvqFCHMrKhugMvqEcJ2DIkJ2sXNkNXWvTTAEOO50hdPNXYqMQmKjhPKDXAo1RXV1NEMK8W6DvOVFXc/JCHDJnDiG9byXWUeaBje/CxMdr+yzxo2OBgBb4sRAEAVu2bOGss87SAt9QoeUyduxYLfAN5boBY8duYfXqs7TAN1SAy5bEWM7yV+tFnaEazgN6LXAy+p4Dg3pFXcXJ83CpSI3l4s6rcTUPGEnHAgFdZC8WXNdl+PDhuK7erzGVHdYwbdo0vcFjqJoal2nThlNToznAVC41DM9Ow6Um6lIkIpoHRPOAKAMCWuDHQhAEvP3227qKvsFCy+Xyyy/XGXxDuW7A5Ze/jetqDjBVgMvb7uUE2phnLM0DonlAlAEBLfBjIQgCKisrtcA3WIjD0KFDtcA3lOMEDB1aieNoDjBVgEOlM5QAJ+pSJCKaB0TzgCgDAlrgx4LrupSVlWmLvsHssIaZM2dqi76hampcZs4s09Zcg7nUUFYzU9syDaZ5QDQPiDIgoIvsxYLv+2zdupVevXrhOHrHzkS1F9kbozP4hnJdnzFjtrJwYS88L+pqJAo+LlvdMfTyFuKgEJio4TxwMq8FTPh+9Hj3UfOAKAMCWuDHQhiG7Nmzh549e0ZdikQkxKakpEQLfEPZdkhJyR7+8IeeUZciEQmx2eOU0NP7Q9SlSEROdh6Iy3fAn6g4fwe85gFRBgS0wI8F13UZPHhw1GVIhOwwx6xZs7j22mujLkUikMu5zJqlOcBkLjkG18yKugyJ0MnOA3H5DvgTEffvgNc8IMqAgBb4seD7Pps3b6ZPnz7aom+o0HK59trxOoNvKNf1GT9+M88+20db9A3l47I5MZ4++We1LdNQDeeBxr8WaO3fAS+aB0QZkFq6IldMZDKZqEuQCIXYdO7cWQt8Q9k2dO6cQddYNJlNxuqMDuvm0jwgmgdEGRD
Q6MeC4zgMHDhQZ+8NZoc5Zs+eravoGyqXc5g9eyC5nOYAUznkGJibjUMu6lIkIpoHRPOAKAMC2qIfC77vs3HjRvr27atFvqFCK8GNN07UGXxDJRI+EyduZN68vuTzUVcjUfBJsLFoIn1z83BQCBonHldWTyRCJk6sZt68DuTz1sdujUcf5dg0D4gyIKAFvoiIiBgoflePTwATgXlwhBf2cb56vIiIfEQL/BhwHId+/fpFXYZEyArzzJ07l9tuuy3qUiQC+bzD3LmaA0zmkKdfbm7UZbQq8bt6fB6Yy23TD78l7lePl1qaB0QZENACPxZ832f9+vX0799fW/QNFVhF3HrrzQRBEHUpEoGiIp+bb17PE0/0J6eP3RnJp4j1RTfTP/eEPnvZSHG5erwyIMqAKAMCushebKTT6ahLkAhZBOzevRvL+vjnLsUEQQC7d6fR+zsmC0iHuwGFwFzKgCgDogyIFvix4DgOF110kc7eG8wKPZ555hkt8A3leQ7PPHPRSX33tcSDg8dF+Wf0vccGUwZEGRBlQEAL/FjwPI9Vq1bheXoymyqwipg6daq26BuqqMhj6tRVFBVpDjCVRxGrklPxKIq6FImIMiDKgCgDAlrgx4JlWXTs2FFnbw1mEbBp0yZlwFBBYLFpU0eCQONvKouAjv4mLG3LNJYyIMqAKAMCWuDHguM4XHDBBdqibzAr9Hj++ee1wDeU5zk8//wF2qJvMAePC7zntS3TYMqAKAOiDAjoKvqx4Hker776KpdccgmuqyE1UWAlmT592lG36G989zQXFAET+ng0yaTHtGmv8uCDl1BTE3U1EgWPJK8mp3FJzYO4KAQmUgZEGRBlQEAL/FiwbZvi4mJsWxsyTGXhs2LFCr70pS81+PnOnTsBm4mPm7JVyz7UZ7P4vs2KFcX4vuYAU9n4FPsrsPGjLkUiogyIMiDKgIAW+LFg2zY9evSIugyJkBV6LF68+LAt+tXV1dR+Vco8oG8ElZ1OG4GJh/psFs+zWbxYc4DJbDx6eIujLkMipAyIMiDKgIAW+LHgeR4VFRWUlZVpi76hAivJgw/OPMZV9PsCg05nSXIaJZMeM2dWMH16mbboG8ojSUVqJmXZ6dqWaShlQJQBUQYEdJG9WLBtm969e2uLvsF0kT2zeZ7N88/3xvM0B5jKxqN3/nlsXVjJWMqAKAOiDAjoDH4s1H0GX8xl4VNRUaEFvqF836aiQnOAyWo/d1kRdRkSIWVAlAFRBgR0Bj8WPM9jyZIleJ7erTNVYKd49NFHj7FFX+IslfJ49NElpFKaA0zlkWJJ+lE8UlGXIhFRBkQZEGVAQAv8WLBtm379+mmLvsGsIMdTTz2lM/iGyuVsnnqqH7mc5gBT2eTol3sKm1zUpUhElAFRBkQZENAW/ViwbZuuXbtGXYZEyCJg3bp1WuAbKghs1q3THGAym4Cu/rqoy5AIKQOiDIgyIKAz+LGQz+dZtGgR+Xw+6lIkIoGd4sknn9QWfUOlUnmefHIRqZTmAFPlSbEo/SR5bcs0ljIgyoAoAwJa4MeC4zgMHjwYx3GiLkUiYgU5Zs2apTP4hsrlHGbNGkwupznAVA45BtfMwtG2TGMpA6IMiDIgoC36sWDbNp06dYq6DImQRcCmTZu0wDdUENhs2qQ5wGQ2AZ2CTVGXIRFSBkQZEGVAQGfwYyGfz/PCCy9oi77BAjvN008/rS36hkqn8zz99Auk05oDTJUnzQttniZPOupSJCLKgCgDogwIaIEfC67rMmzYMFxXGzJMZQU13HXXXTqDb6iaGpe77hpGTY3mAFO51DAscxcuNVGXIhFRBkQZEGVAQFv0Y8GyLM4888yoy5AIWQTs2LFDC3xDBYHFjh2aA0xmEXBmuCPqMiRCyoAoA6IMCOgMfizk83kWLFigLfoGC+w0zz33nLboGyqdzvPccwu0Rd9gedIsaPuctmUaTBkQZUCUAQEt8GPBdV1GjRqlLfoGs4IskydP1hl8Q2W
zLpMnjyKb1RxgKpcsow5OxiUbdSkSEWVAlAFRBgS0wI8NLe5NF3Lw4MGoi5CIhCEcPOgShlFXItEJccODgEJgLmVAlAFRBkQL/FjwPI+FCxfieV7UpUhEQjvN/PnzCbXCM1I67TF//kLSac0BpvJIs7DtfDxtyzSWMiDKgCgDAlrgx4LruowZM0Zn8Q1mBRkmTJigLfqGymRcJkwYQyajOcBULhnGHJiASybqUiQiyoAoA6IMCGiBHxs6e286izZt2kRdhETEsqBNGw+9v2MyC89qAygE5lIGRBkQZUC0wI8Fz/MoLy/XIt9goZ1izpw52qJvqFTKY86cclIpzQGm8khR3mYOHqmoS5GIKAOiDIgyIKAFfiwkEgmuuuoqEolE1KVIROwgw7hx47BtPaVNlMkkGDfuKjIZzQGmSpDhqgPjSGhbprGUAVEGRBkQ0AI/FsIwZN++fTp7a7AQm+7duysDhrLtkO7d92HbGn9Thdjss7oT6rBuLGVAlAFRBgS0wI8Fz/NYtmyZtugbLLSTPPTQQ1rgGyqZ9HjooWUkk5oDTOWRZFn6ITySUZciEVEGRBkQZUBAC/xYSCQSXHnlldqibzA7yHDddddpi76hMpkE1113pbboGyxBhisPXqdtmQZTBkQZEGVAAPSdSjEQBAHV1dV06NBBC7wj2Phu1BWceht32pSU9NEZfEPZdkCfPtVs3tyBIIi6GolCgE213YcOwWZsFAITKQOiDIgyIKAFfiz4vs+qVasYOXKkFvj17Ny5E7CZ+Hj8J7hUqojHHvvWoT6LaYqKfKZOXcVtt40km426GomCTxGrklMZmbkNG4XARMqAKAOiDAhogR8LiUSC0aNHR11Gi1NdXQ0EwDygb7TFnGLZ7EZuumki8+bNi7oUiUA2m+CmmzQHmCxBltGZm6IuQyKkDIgyIMqAgBb4sRAEAVVVVXTp0kVn8I+oLzAo6iJOKdsO6d9/QNRlSERsO6B//yrWr++iLfqGCrCpcvrTxV+vbZmGUgZEGRBlQEAX2YuFIAjYsGEDgV7ZG6uoKGTSpElRlyERKSoKmDRpA0VFmgNMFVDEhqJJBBRFXYpERBkQZUCUAQEt8GPBdV1GjhyJ62pDhqmyWZspU6ZEXYZEJJt1mTJlJNms5gBTuWQZmZmCq89cGksZEGVAlAEBLfBjIQgCKisrdQbfYI4TUlZWFnUZEhHHCSgrq8RxNAeYKsCh0ikjwIm6FImIMiDKgCgDAlrgx0IQBGzZskULfIO5bsjYsWOjLkMi4roBY8duwXU1B5gqwGVLYiyBLq1jLGVAlAFRBgS0wI8F13UZPny4tugbrKbGZtq0aVGXIRGpqXGZNm04NTWaA0zlUsPw7DRcaqIuRSKiDIgyIMqAgBb4sRAEAW+//bbO4BvMdUMuv/zyqMuQiLhuwOWXv60z+AYLcHnbvVxnbQymDIgyIMqAgL4mLxbqPoNfXFzc4GvyNr4bYVGniQl9PBGOEzJ06NCoy5CIOE7A0KGVLFtWjOdFXY1EofZzl0Mp9pZhoxCYSBkQZUCUAQEt8GPBdd0GF1jbuXMnYDPxcVPO5tmH+myumhqbmTNnMm/evKhLkQjU1LjMnKmLLJrMpYaymplRlyERUgZEGRBlQEAL/FjwfZ+tW7fSq1cvHMehuroaCIB5QN9oizvlNgITD/XZXK4bMmaMLrJnKtf1GTNmKwsX9tIZfEP5uGx1x9DLW4ijszZGUgZEGRBlQEAL/FgIw5A9e/bQs2fPj93SFxgUQUVyutl2SElJSdRlSERqx38Pf/hDz6hLkYiE2OxxSujp/SHqUiQiyoAoA6IMCOgie7Hgui6DBw/WVfQNlsvZzJo1K+oyJCK5nMusWYPJ5TQHmMolx+CaWbjkoi5F/v/27j2+qvLO9/hnXfYN5G4RpQwgSLRyWtBiFQRvTLBgAds6BeQo4dJ2yhGklgFtX42MbQXpTJWRaedwq5cBbKeCTKFCFREEi9RCLacQhAM
IHhULKGj2bV3OHzEhgYBckjxhr+/79cqri723K7+nzzfP3r+sZ+8YogyIMiDKgIAa/ILg+z7bt2/H933TpYghrhsybNgw02WIIa7rM2zYdlxXa0BU+bhsjw3D18a8yFIGRBkQZUBADX7BSKfTpksQg2w7pE2bNqbLEENsG9q0SWNrRY8wm7TVBj2tR5kyIMqAKAOi2S8IjuPQs2dPHMcxXYoYksvZzJ4923QZYkgu5zB7dk9yOa0BUeWQo2duNo62ZUaWMiDKgCgDAmrwC4Lv+2zdulVb9CMsFgspKSkxXYYYEov5lJRsJRbTGhBVPjG2xkvwiZkuRQxRBkQZEGVAQA2+iIiIiIiISEFQg18AHMehe/fu2qIfYfm8xYIFC0yXIYbk8w4LFnQnn9caEFUOebrnFuCQN12KGKIMiDIgyoCAGvyC4Ps+mzdv1hb9CIvHA8aPH2+6DDEkHvcZP34z8bjWgKjyibM5Ph6fuOlSxBBlQJQBUQYE1OAXjFQqZboEMSgILA4ePGi6DDEkCODgwRRBYLoSMScgFR4EFILoUgZEGRBlQNTgFwTHcbj88su1RT/CPM9i8eLFpssQQzzPYfHiy/E8rQFR5eBxeX4xDp7pUsQQZUCUAVEGBNTgFwTP89i0aROepx/mqIrHAyZPnmy6DDEkHveYPHkT8bjWgKjyiLMpMRlP2zIjSxkQZUCUAQE1+AXBsixatWqFZVmmSxFDgsCirKzMdBliSMX8tyIItAZElUVAK78MS9syI0sZEGVAlAEBNfgFwXEcunbtqi36EeZ5FsuWLTNdhhjieQ7LlnXVFv0Ic/Do6i3TtswIUwZEGRBlQEANfkHwPI8NGzZoi36EJRIBpaWlpssQQxIJj9LSDSQSWgOiyiPBhkQpHgnTpYghyoAoA6IMCKjBLwi2bdO+fXtsW9MZVb5vsX79etNliCG+b7N+fXt8X2tAVNn4tPfXY6M/lRhVyoAoA6IMCKjBLwi2bdOxY0c1+BHmeRYvvPCC6TLEEM+zeeGFjnie1oCosvHo6L2ArW2ZkaUMiDIgyoCAGvyC4Hkea9eu1Rb9CEskAqZPn266DDEkkfCYPn2ttuhHmEeCtcnp2pYZYcqAKAOiDAiowS8Itm3TpUsXXcGPMH3IXrR5ns2yZV10BT/CbDy65Jfpqk2EKQOiDIgyIKAGvyDoPfji+xYbNmwwXYYY4vs2GzboPfhRVvG+yw1632WEKQOiDIgyIKAGvyB4nsfq1au1RT/CksmAWbNmmS5DDEkmPWbNWk0yqTUgqjySrE7NwiNpuhQxRBkQZUCUAQE1+AXBtm26d++uK/gRlstZzJ8/33QZYkguZzN/fndyOa0BUWWTo3tuPjY506WIIcqAKAOiDAiAa7oAOXe2bdO2bVvTZYhBQWCxZcsW02WIIUFgs2WL1oAoswlo628xXYYYpAyIMiDKgICu4BeEfD7PypUryefzpksRQ5LJgLlz55ouQwxJJvPMnbuSZFJrQFTlSbIyNZe8tmVGljIgyoAoAwJq8AuC4zj06tULx3FMlyKG5HIWM2fONF2GGJLLOcyc2YtcTmtAVDnk6JWdiaNtmZGlDIgyIMqAgLboFwTbtmndurXpMsSgILAoKyszXYYYEgQ2ZWVaA6LMJqB1oDUgypQBUQZEGRDQFfyCkM/nWb58ubboR1gqFbBw4ULTZYghqVSehQuXk0ppDYiqPCmWN1lInpTpUsQQZUCUAVEGBNTgFwTXdenbty+uqw0ZUZXNWkyZMsV0GWJINusyZUpfslmtAVHlkqVvegouWdOliCHKgCgDogwIaIt+QbAsi+bNm5suQwwKAot9+/aZLkMMqZh/rQFRZhHQPNQaEGXKgCgDogwI6Ap+Qcjn8zz33HPaoh9hqVTA0qVLTZchhqRSeZYufU5b9CMsT4rnmi7VtswIUwZEGRBlQEANfkFwXZfi4mJt0Y+wTMZizJgxpssQQzIZlzFjislktAZElUuG4vIxuGR
MlyKGKAOiDIgyIKAGv2CouY+2MITy8nLTZYghFfPvEoamKxFzQtywHFAIoksZEGVAlAFRg18QPM9jxYoVeJ5nuhQxJJUKWbRokekyxJBUymPRohWkUloDosojxYqmi/C0LTOylAFRBkQZEFCDXxBc12XgwIG6ih9h6bTF8OHDTZchhqTTLsOHDySd1hoQVS5pBn48HJe06VLEEGVAlAFRBgTU4BcMXb2PNsuCJk2amC5DDKmYfw/LMl2JmGPhWU0AhSC6lAFRBkQZEDX4BcHzPFatWqUmP8KSyZB58+aZLkMMSSY95s1bRTKpNSCqPJKsajIPj6TpUsQQZUCUAVEGBNTgF4RYLMaQIUOIxWKmSxFD0mmboUOHmi5DDEmnYwwdOoR0WmtAVMVIM+TjocS0LTOylAFRBkQZEFCDXxDCMOTIkSOE+gjtyLLtkA4dOpguQwypmP8j2LbWgKgKsTlidSDU03pkKQOiDIgyIKAGvyB4nse6deu0RT/CEomQGTNmmC5DDEkkPGbMWEcioTUgqjwSrEvNwCNhuhQxRBkQZUCUAYFG3ODv37+f0aNHc8kll5BIJOjUqRP33nsvhw8fPq3//uDBg8ydO5fbb7+drl27kkqlaNGiBddffz3z5s0jCIJ6HkHDicViDBo0SFv0IyydthkxYoTpMsSQdDrGiBGDtEU/wmKkGVQ+QtsyI0wZEGVAlAGBRtrg79q1i6uvvpoFCxZwzTXXMGnSJC699FIee+wxrrvuOg4ePPip5/j1r3/NuHHj+MMf/sCXvvQl7r33Xr72ta+xdetWxo4dyx133FEwW9qDIODQoUMF9UsLOTO2HVJUVGS6DDHEtgOKig5h21oDoirA5pBdRNA4n9alASgDogyIMiDQSBv873znOxw4cIBZs2axdOlSpk+fzurVq5k0aRJlZWV8//vf/9RzdOvWjaVLl7J//37+8z//k4cffpj58+ezfft2OnTowLPPPstvfvObBhhN/fN9n02bNuH7vulSxJB4PGTy5MmmyxBD4nGfyZM3EY9rDYgqnzibEpPxiZsuRQxRBkQZEGVAoBE2+Lt27WLVqlV07tyZ8ePH17hv2rRpNG3alCeffJKPPvrolOe5+eabGTJkCI7j1Li9Xbt2fPvb3wZgzZo1dVq7KbFYjAEDBmiLfoRlMjZjx441XYYYksnEGDt2AJmM1oCoipFhQHosMTKmSxFDlAFRBkQZEGiEDf5LL70EQHFxMbZds7xmzZrRp08f0uk0GzduPOvvEY9X/FarUBriIAg4cOCAtuhHmG2H9OjRw3QZYohtB/TocUBb9CMswOaA00PbMiNMGRBlQJQBgUbY4JeVlQFw2WWX1Xp/5e07duw4q/N7nscTTzwBwK233nrKx2azWY4cOVLjC6jaCu/7fq3HnufVOK5svE92nM/naxxXfjZA5XEYhiccA1XHQRDwl7/8hVwuV1V7MpkEwHGCqk/Wdt3qxz7xePXjinpjMZ9YrOI4Hvdx3cpjr+o4kfBw3aDq2HGCT76nV9VgJJP5quNUKl/157tSqTyWFQIhqVQeCLGsyuOKRvXYcUAyWf3Yq2VMIYlEomoOKv+SQPW3K8Ri4Xk2pjOfpyZNAkaPHl1j7NX/qkIiEZx3YzrzeTr2mRq1/TylUqnzcEynN0/xuM+YMX8hHvc/GVMKoMZ6UXGe5HkzpnObp2PrQhAEta4LoeVWbWH0ieET++Q4jo8LgFfjOEFQ49j55DhZ9UIqX+M4VfVniiqOLcKqYwixyPPJPGFXHQfY5ElWHXtVx07VpyIHuFXHPi4ecQLi/CU+mjxNq8YUWsd+iV3b81MikSC0Gu+YKo/rYp4qsw81n3NTqfN3TMfPk0eSrfHRZGlR65hqWxeqfxZR2AjHVNfZC+xjOahcF6pfHAmt829M1ecpRzO2xkfjkTrpPAXWsa3btb2Gjcfjx60LhbtGVD5PQM3X5clk8rhxnD9jytGMv8RHExA/rXk6fl2o7DU
qNYYx1Xf2TrYu1HZ8fK/R0D3h6Wp0Df6HH34IQIsWLWq9v/L2Dz744KzOP3XqVLZu3cqXv/xlBgwYcMrHPvzww7Ro0aLqq/LvjG/duhWAbdu2sW3bNgDeeOMN3nzzTQA2b97M7t27AXjttdfYt28fABs2bOCdd94BYO3atfztb38DYPXq1VXjWbVqFUePHgVgxYoVZDIZPM9jxYoVeJ5HJpNhxYoVABw9epRVq1bhui49e/bk5ZdfBsBxHB555BEAvvSld5g2bQMAN964j6lTXwNg4MDdTJy4GYCvf/1Nxo17A4CRI7cxcmTFmMaNe4Ovf71iTBMnbmbgwN2f/H/4GjfeWDGmadM28KUvVYzpkUfW8vnPV4zp8cdXc9llFWOaN28V7dtXjGnRohW0bp0hlfJYtGgFqZRH69YZFi2qGFP79keZN28VAJdd9gGPP74agM9//m888sjaWsb0MVOnTgVg9+7dbN5cMaY333yzauEeOfKD82xMZz5Pt932ERMmTCCZTNbInuu6n4zp/fNuTGc+TxXb0Zo0aVLrz9OiRYto3do/z8Z0evNkWdChw0dYFrRu7bNo0SLg2BoBYNs2jz/++HkzpnObpzTTpk0DYN++fbz2WsWYdu/eXdXoHfnM13kjPg6AbfGRbIuPBOCN+DjejH0dgM2Jiex2BwLwWmIq+9wbAdiQnMY7zpcAWJt6hL85nwdgdepxPrArfgm9qsk8jlrtAVjRdBEZqzUeKVY0XYRHiozVmhVNP5knqz2rmswD4AP7MlanKubpb87nWZuqWMvfcb7EhuQnY3Jv5LXEJ+ueO5DNiYm4ZGjvbeCv8buqxvTBRRVjSiQStT4/TZ06lY9bNt4xAbwZq5t5euSRR6reslf9OXfevHl4ifNzTMfP00d2B25OT2B1k9knzFNop6rWheNfRzRtWvFLoVyq8Y2prrP33qUVY3Ichw0bKta9ffv2Va0LH7U+/8ZUfZ5eS97PzekJvONed9J5+uDiijHF4/FaX8NOnDiRj1o3njHVZ/amTZtWtS5Uf13++OOPk0udn2N6LXk/l+cW45I5rXlatGgRlmWd0GtccMEFAHgJ82Oq7+y9e1nFmBzHYe3aitcR77zzTo01ovrriOq9xhtvVLw2aqie8HRZYSP7KPlvfvObzJkzhzlz5tT6nuIHHniAhx9+mIcffriqsTtdjz76KJMmTaKoqIhXXnmFCy+88JSPz2azZLPZqn8fOXKEDh06cOjQIVq1alX1GxnHcWoce56HZVlVx7ZtY9v2SY/z+TyO41Qdu66LZVlVx1Dx253qx7FYjDAM8TwPx3H4f//v/9G2bVvi8Tj/+Z//ydixY8lk1uM4PXDdgGzWxXUrruJWHPvYdkguV3kMuZxTdWUun3eIx32CADzPIR73CAILz3NIJDx838bzbBIJD8+z8X2bZNIjl7MJAptkMk8u5xAENqlUnmzWJQgsUqk8mYxLGEIq5ZFOu1hWxZW9dDqGbYckEpXHAfG4TyZTeRyQybg4TlBtTK/jOH2YN28ew4YNIwxDXNfF930WL17MyJEjicX+CPQ4j8Z05vNkWZu5+uqJfOc732HYsGFV2XvmmWcYOXIkicQmPO+q82pMZz5PfyYIvsjTTz/N8OHDa/w8LVy4kHHjxpHJrCMMrzqPxnR682TbAX37vs26de0Jgi0kk32ZM2cOI0aMqFovqq8Ltt2j0Y/p3LL3Oq5bsS4MHz6cIAhOWBf++GOXHp1sHHJVVxIc8p9cYai4HuERx6o6TmDjY1cde9j4eCSxyWETkCeJU3WcwiWLVXWcAUI8UrikAQuPJDHShNh4JIiRJsDGJ06MTMWVBeK4ZAhwCHBxyRLgEuDgksXHJcTGxudtpzft/D8SI41PjC174Ivfz/P000/XWBcsy2Lx4sWMGTOG9T/0ubpT4xyTS+6TqznnNk9bdvv0+VGSuXPncuedd1Y95y5atIhx48ax7vtZru58fo2ptnmy8HnP6cW
F/hvEKa8xT3/aHdL3x6kT1oUwDFm4cGHFz8SPbD7fuXGNqa6z96e9cXo9kOHpp5/mG9/4Bq7rEgQBixYtqloXvtDp/BpT9XnySPC+04OL/NcBap2nzXtsen0/V2NdqHwNu3jxYkaPHs2G0qDautB4171zmactuz16P5Rg3rx53HnnnVWvyxctWsTYsWN55Qe5auvC+TEmG48cTXjPuYr2/qsExE45T5t3B1x/3LpQ2WvUXBca77pXF9k72bpQ+dqh+rHv+zV6jdr6wPrqCcvLy2nZsiUffvghzZs3r7V3reSe8l4DKq/QV17JP17lNvmTXeE/mccee4xJkyZxxRVXsHr16k9t7qHiqkf17TuVKn/bV/0D/KofV/5wnO5x9c8COJNjy7KIxWJ4nsf//b//l3bt2lU9pvK3PL5f8cIawPMqXnBXHB+rt/pxPn/sOJerfnys3my29uNMpvrxsXqr/23u2o7D8NhxEFjVjm0yGfuE45pjsvC8il/CnGw+8nkLPtnac36M6cznKZGAwYMH1xh79YxlszaVG3bOlzEdOz7debKq/l35+R3Vf27S6fQnj7HOozFVHp96blw35NZb9/Dqq5eQzVqfjPXYGnHsPJnzZkzVj898nix8v2JdqHzShJrrghV6VP7L4djbGByOvdXJrXGcPcnxsd+ox2ocpz/lOKw6tgiqjm0C7E/OU/PYx8b/5NjD5pO3I3zyvx4JdscGcbH/WtWYrGq/vq99XchWPaYxjunE47Ofp+pXPo5fFypXjvNtTMfPk0eCXbHBXOS/jkVQYxwW1LouWNaxdbNifI1rTMeO6yh7wbFzVv4sVP+8Jyv0ql4YnzdjOm6eKjNQWcPx82TXsi5UXxtzudxJ1oXCWyOqX8SrvjZmMplPWRca75hsfHbHbuNif9NpzdPJXi9UagxjqvfsnWRdqFwbTvY64nSO67InrL5ef5pGt0W/8m95n+w99pVbHrp163ba5/zpT3/KvffeS/fu3VmzZk2NRrgQuK5Lv379agREoiWbtc94R4sUjmzWZerUfjWaaYkWlyz9MlNrvBCSaFEGRBkQZUCgETb4N910E1DxvoPjPxX+6NGjrF+/nlQqxbXXXnta53v44YeZPHkyPXr04KWXXqJt27Z1XrNpQRCwd+9efYp+hLluSP/+/U2XIYa4bkD//nurPthOoifAZa/bnwD9kieqlAFRBkQZEGiEDX6XLl0oLi5mz549zJ49u8Z9paWlfPzxx9x1111VHwqTz+fZvn07u3btOuFcDz30EA888ABXX301L7744mltyz8fBUHA22+/rQY/whwnpE+fPqbLEEMcJ6BPn7erPq1eoifA4W2nD5WfNCzRowyIMiDKgEAjfA8+wL//+7/Tu3dvJkyYwIsvvsgVV1zBxo0beemll+jWrRs//vGPqx779ttvc8UVV9CxY0f27NlTdfsTTzzBD3/4QxzHoW/fvsyaNeuE79OpUydGjRrVACOqX67r0rt3b9NliEHZrM20adN4+umnTZciBmSzLtOmaQ2IMpcsvbPTTJchBikDogyIMiDQSBv8Ll268Mc//pEf/vCHPP/886xYsYKLL76YCRMmUFpaSuvWrT/1HJV/ksD3fR599NFaH3PDDTcURIPv+z67d++mc+fONT7YQaLDdUMGDhxsugwxxHV9Bg7czYoVnfG8T3+8FB4fl93uQDp7K2p8mJFEhzIgyoAoAwKNcIt+pQ4dOrBgwQLeeecdcrkce/fu5bHHHjuhue/UqRNhGNa4eg/w4IMPEobhKb/WrFnTcAOqR2EYcvjwYRrZXzyUBmTbYdUHVEr0VMz/YWxba0BUhdgcdooIG+/TutQzZUCUAVEGBBpxgy+nz3VdevXqpU/Rj7BczmbmzJmmyxBDcjmXmTN71fhTdRItLjl6ZWfW+DNDEi3KgCgDogwIqMEvCL7vs337dnzfN12KGOK6IcOGDTNdhhjiuj7Dhm3HdbUGRJWPy/bYMPzG+c4
7aQDKgCgDogwIqMEvGOl02nQJYpBth7Rp08Z0GWKIbUObNmlsregRZpO22qCn9ShTBkQZEGVANPsFwXEcevbsqQ/Yi7Bczj7hz0pKdORyDrNn9ySX0xoQVQ45euZm42hbZmQpA6IMiDIgoAa/IPi+z9atW7VFP8JisZCSkhLTZYghsZhPSclWYjGtAVHlE2NrvASfmOlSxBBlQJQBUQYE1OCLiIiIiIiIFAQ1+AXAcRy6d++uLfoRls9bLFiwwHQZYkg+77BgQXfyea0BUeWQp3tuAQ5506WIIcqAKAOiDAiowS8Ivu+zefNmbdGPsHg8YPz48abLEEPicZ/x4zcTj2sNiCqfOJvj4/GJmy5FDFEGRBkQZUBADX7BSKVSpksQg4LA4uDBg6bLEEOCAA4eTBEEpisRcwJS4UFAIYguZUCUAVEGRA1+QXAch8svv1xb9CPM8ywWL15sugwxxPMcFi++HM/TGhBVDh6X5xfj4JkuRQxRBkQZEGVAQA1+QfA8j02bNuF5+mGOqng8YPLkyabLEEPicY/JkzcRj2sNiCqPOJsSk/G0LTOylAFRBkQZEFCDXxAsy6JVq1ZYlmW6FDEkCCzKyspMlyGGVMx/K4JAa0BUWQS08suwtC0zspQBUQZEGRBQg18QHMeha9eu2qIfYZ5nsWzZMtNliCGe57BsWVdt0Y8wB4+u3jJty4wwZUCUAVEGBNTgFwTP89iwYYO26EdYIhFQWlpqugwxJJHwKC3dQCKhNSCqPBJsSJTikTBdihiiDIgyIMqAgBr8gmDbNu3bt8e2NZ1R5fsW69evN12GGOL7NuvXt8f3tQZElY1Pe389NvpTiVGlDIgyIMqAgBr8gmDbNh07dlSDH2GeZ/HCCy+YLkMM8TybF17oiOdpDYgqG4+O3gvY2pYZWcqAKAOiDAiowS8Inuexdu1abdGPsEQiYPr06abLEEMSCY/p09dqi36EeSRYm5yubZkRpgyIMiDKgIAa/IJg2zZdunTRFfwI04fsRZvn2Sxb1kVX8CPMxqNLfpmu2kSYMiDKgCgDAmrwC4Legy++b7FhwwbTZYghvm+zYYPegx9lFe+73KD3XUaYMiDKgCgDAmrwC4LneaxevVpb9CMsmQyYNWuW6TLEkGTSY9as1SSTWgOiyiPJ6tQsPJKmSxFDlAFRBkQZEFCDXxBs26Z79+66gh9huZzF/PnzTZchhuRyNvPndyeX0xoQVTY5uufmY5MzXYoYogyIMiDKgAC4pguQc2fbNm3btjVdhhgUBBZbtmwxXYYYEgQ2W7ZoDYgym4C2/hbTZYhByoAoA6IMCOgKfkHI5/OsXLmSfD5vuhQxJJkMmDt3rukyxJBkMs/cuStJJrUGRFWeJCtTc8lrW2ZkKQOiDIgyIKAGvyA4jkOvXr1wHMd0KWJILmcxc+ZM02WIIbmcw8yZvcjltAZElUOOXtmZONqWGVnKgCgDogwIaIt+QbBtm9atW5suQwwKAouysjLTZYghQWBTVqY1IMpsAloHWgOiTBkQZUCUAQFdwS8I+Xye5cuXa4t+hKVSAQsXLjRdhhiSSuVZuHA5qZTWgKjKk2J5k4XkSZkuRQxRBkQZEGVAQA1+QXBdl759++K62pARVdmsxZQpU0yXIYZksy5TpvQlm9UaEFUuWfqmp+CSNV2KGKIMiDIgyoCAtugXBMuyaN68uekyxKAgsNi3b5/pMsSQivnXGhBlFgHNQ60BUaYMiDIgyoCAruAXhHw+z3PPPact+hGWSgUsXbrUdBliSCqVZ+nS57RFP8LypHiu6VJty4wwZUCUAVEGBNTgFwTXdSkuLtYW/QjLZCzGjBljugwxJJNxGTOmmExGa0BUuWQoLh+DS8Z0KWKIMiDKgCgDAmrwC4aa+2gLQygvLzddhhhSMf8uYWi6EjEnxA3LAYUgupQBUQZEGRA1+AXB8zxWrFiB53mmSxFDUqmQRYsWmS5DDEmlPBYtWkEqpTUgqjxSrGi6CE/
bMiNLGRBlQJQBATX4BcF1XQYOHKir+BGWTlsMHz7cdBliSDrtMnz4QNJprQFR5ZJm4MfDcUmbLkUMUQZEGRBlQEANfsHQ1ftosyxo0qSJ6TLEkIr597As05WIORae1QRQCKJLGRBlQJQBUYNfEDzPY9WqVWryIyyZDJk3b57pMsSQZNJj3rxVJJNaA6LKI8mqJvPwSJouRQxRBkQZEGVAQA1+QYjFYgwZMoRYLGa6FDEknbYZOnSo6TLEkHQ6xtChQ0intQZEVYw0Qz4eSkzbMiNLGRBlQJQBATX4BSEMQ44cOUKoj9COLNsO6dChg+kyxJCK+T+CbWsNiKoQmyNWB0I9rUeWMiDKgCgDAmrwC4Lneaxbt05b9CMskQiZMWOG6TLEkETCY8aMdSQSWgOiyiPButQMPBKmSxFDlAFRBkQZEFCDXxBisRiDBg3SFv0IS6dtRowYYboMMSSdjjFixCBt0Y+wGGkGlY/QtswIUwZEGRBlQEANfkEIgoBDhw4RBIHpUsQQ2w4pKioyXYYYYtsBRUWHsG2tAVEVYHPILiLQ03pkKQOiDIgyIKAGvyD4vs+mTZvwfd90KWJIPB4yefJk02WIIfG4z+TJm4jHtQZElU+cTYnJ+MRNlyKGKAOiDIgyIKAGvyDEYjEGDBigLfoRlsnYjB071nQZYkgmE2Ps2AFkMloDoipGhgHpscTImC5FDFEGRBkQZUBADX5BCIKAAwcOaIt+hNl2SI8ePUyXIYbYdkCPHge0RT/CAmwOOD20LTPClAFRBkQZEFCDXxCCIGDr1q1q8CMsHg8ZPXq06TLEkHg8YPTorcTjWgOiKiDO1vhoAm3LjCxlQJQBUQYE1OAXBNd1ufnmm3Fd13QpYkgmYzNhwgTTZYghmYzLhAk3k8loDYgqlww3pyfgaltmZCkDogyIMiCgBr8gBEHA22+/rSv4EeY4Ib179zZdhhjiOAG9e7+N42gNiKoAh7ed3gQ4pksRQ5QBUQZEGRBQg18QgiBg165davAjzHVDBg8ebLoMMcR1AwYP3oXrag2IqgCXXbHBBGgXR1QpA6IMiDIgoAa/ILiuS79+/bRFP8KyWZupU6eaLkMMyWZdpk7tRzarNSCqXLL0y0zFJWu6FDFEGRBlQJQBATX4BSEIAvbu3asr+BHmuiH9+/c3XYYY4roB/fvv1RX8CAtw2ev211WbCFMGRBkQZUBADX5B0HvwxXFC+vTpY7oMMcRxAvr00Xvwo6zifZd99L7LCFMGRBkQZUBADX5BcF2X3r17a4t+hGWzNtOmTTNdhhiSzbpMm9ZbW/QjzCVL7+w0bcuMMGVAlAFRBgTU4BcE3/fZuXMnvu+bLkUM0YfsRZvr+gwevBPX1RoQVT4uO93B+NqWGVnKgCgDogwIqMEvCGEYcvjwYcIwNF2KGGLbIUVFRabLEEMq5v8wtq01IKpCbA47RYR6Wo8sZUCUAVEGBNTgFwTXdenVq5e26EdYLmczc+ZM02WIIbmcy8yZvcjltAZElUuOXtmZuORMlyKGKAOiDIgyIKAGvyD4vs/27du1RT/CXDdk2LBhpssQQ1zXZ9iw7dqiH2E+Lttjw7QtM8KUAVEGRBkQUINfMNLptOkSxCDbDmnTpo3pMsQQ24Y2bdLYWtEjzCZttUFP61GmDIgyIMqAaPYLguM49OzZE8fRn8SIqlzOZvbs2abLEENyOYfZs3uSy2kNiCqHHD1zs3G0LTOylAFRBkQZEFCDXxB832fr1q3aoh9hsVhISUmJ6TLEkFjMp6RkK7GY1oCo8omxNV6CT8x0KWKIMiDKgCgDAmrwRURERERERAqCGvwC4DgO3bt31xb9CMvnLRYsWGC6DDEkn3dYsKA7+bzWgKhyyNM9twCHvOlSxBBlQJQBUQYE1OAXBN/32bx5s7boR1g8HjB+/HjTZYgh8bjP+PGbice1BkSVT5zN8fH4xE2XIoYoA6IMiDIgoAa/YKRSKdMliEFBYHHw4EHTZYg
hQQAHD6YIAtOViDkBqfAgoBBElzIgyoAoA6IGvyA4jsPll1+uLfoR5nkWixcvNl2GGOJ5DosXX47naQ2IKgePy/OLcfBMlyKGKAOiDIgyIKAGvyB4nsemTZvwPP0wR1U8HjB58mTTZYgh8bjH5MmbiMe1BkSVR5xNicl42pYZWcqAKAOiDAiowS8IlmXRqlUrLMsyXYoYEgQWZWVlpssQQyrmvxVBoDUgqiwCWvllWNqWGVnKgCgDogwIqMEvCI7j0LVrV23RjzDPs1i2bJnpMsQQz3NYtqyrtuhHmINHV2+ZtmVGmDIgyoAoAwJq8AuC53ls2LBBW/QjLJEIKC0tNV2GGJJIeJSWbiCR0BoQVR4JNiRK8UiYLkUMUQZEGRBlQEANfkGwbZv27dtj25rOqPJ9i/Xr15suQwzxfZv169vj+1oDosrGp72/Hhv9qcSoUgZEGRBlQEANfkGwbZuOHTuqwY8wz7N44YUXTJchhniezQsvdMTztAZElY1HR+8FbG3LjCxlQJQBUQYE1OAXBM/zWLt2rbboR1giETB9+nTTZYghiYTH9OlrtUU/wjwSrE1O17bMCFMGRBkQZUBADX5BsG2bLl266Ap+hOlD9qLN82yWLeuiK/gRZuPRJb9MV20iTBkQZUCUAQE1+AVB78EX37fYsGGD6TLEEN+32bBB78GPsor3XW7Q+y4jTBkQZUCUAQE1+AXB8zxWr16tLfoRlkwGzJo1y3QZYkgy6TFr1mqSSa0BUeWRZHVqFh5J06WIIcqAKAOiDAiowS8Itm3TvXt3XcGPsFzOYv78+abLEENyOZv587uTy2kNiCqbHN1z87HJmS5FDFEGRBkQZUAAXNMFyLmzbZu2bduaLkMMCgKLLVu2mC5DDAkCmy1btAZEmU1AW3+L6TLEIGVAlAFRBgR0Bb8g5PN5Vq5cST6fN12KGJJMBsydO9d0GWJIMpln7tyVJJNaA6IqT5KVqbnktS0zspQBUQZEGRBQg18QHMehV69eOI5juhQxJJezmDlzpukyxJBczmHmzF7kcloDosohR6/sTBxty4wsZUCUAVEGBLRFvyDYtk3r1q1NlyEGBYFFWVmZ6TLEkCCwKSvTGhBlNgGtA60BUaYMiDIgyoCAruAXhHw+z/Lly7VFP8JSqYCFCxeaLkMMSaXyLFy4nFRKa0BU5UmxvMlC8qRMlyKGKAOiDIgyIKAGvyC4rkvfvn1xXW3IiKps1mLKlCmmyxBDslmXKVP6ks1qDYgqlyx901NwyZouRQxRBkQZEGVAQFv0C4JlWTRv3tx0GWJQEFjs27fPdBliSMX8aw2IMouA5qHWgChTBkQZEGVAQFfwC0I+n+e5557TFv0IS6UCli5daroMMSSVyrN06XPaoh9heVI813SptmVGmDIgyoAoAwJq8AuC67oUFxdri36EZTIWY8aMMV2GGJLJuIwZU0wmozUgqlwyFJePwSVjuhQxRBkQZUCUAQE1+AVDzX20hSGUl5ebLkMMqZh/lzA0XYmYE+KG5YBCEF3KgCgDogyIGvyC4HkeK1aswPM806WIIalUyKJFi0yXIYakUh6LFq0gldIaEFUeKVY0XYSnbZmRpQyIMiDKgIAa/ILgui4DBw7UVfwIS6cthg8fbroMMSSddhk+fCDptNaAqHJJM/Dj4bikTZcihigDogyIMiCgBr9g6Op9tFkWNGnSxHQZYkjF/HtYlulKxBwLz2oCKATRpQyIMiDKgKjBLwie57Fq1So1+RGWTIbMmzfPdBliSDLpMW/eKpJJrQFR5ZFkVZN5eCRNlyKGKAOiDIgyIKAGvyDEYjGGDBlCLBYzXYoYkk7bDB061HQZYkg6HWPo0CGk01oDoipGmiEfDyWmbZmRpQyIMiDKgIAa/IIQhiFHjhwh1EdoR5Zth3To0MF0GWJIxfwfwba1BkRViM0RqwOhntYjSxkQZUCUAQE1+AXB8zzWrVunLfoRlkiEzJgxw3QZYkgi4TFjxjo
SCa0BUeWRYF1qBh4J06WIIcqAKAOiDAiowS8IsViMQYMGaYt+hKXTNiNGjDBdhhiSTscYMWKQtuhHWIw0g8pHaFtmhCkDogyIMiCgBr8gBEHAoUOHCILAdCliiG2HFBUVmS5DDLHtgKKiQ9i21oCoCrA5ZBcR6Gk9spQBUQZEGRBQg18QfN9n06ZN+L5vuhQxJB4PmTx5sukyxJB43Gfy5E3E41oDosonzqbEZHzipksRQ5QBUQZEGRBQg18QYrEYAwYM0Bb9CMtkbMaOHWu6DDEkk4kxduwAMhmtAVEVI8OA9FhiZEyXIoYoA6IMiDIgoAa/IARBwIEDB7RFP8JsO6RHjx6myxBDbDugR48D2qIfYQE2B5we2pYZYcqAKAOiDAiowS8IQRCwdetWNfgRFo+HjB492nQZYkg8HjB69Fbica0BURUQZ2t8NIG2ZUaWMiDKgCgDAmrwC4Lrutx88824rmu6FDEkk7GZMGGC6TLEkEzGZcKEm8lktAZElUuGm9MTcLUtM7KUAVEGRBkQUINfEIIg4O2339YV/AhznJDevXubLkMMcZyA3r3fxnG0BkRVgMPbTm8CHNOliCHKgCgDogwIqMEvCEEQsGvXLjX4Eea6IYMHDzZdhhjiugGDB+/CdbUGRFWAy67YYAK0iyOqlAFRBkQZEFCDXxBc16Vfv37aoh9h2azN1KlTTZchhmSzLlOn9iOb1RoQVS5Z+mWm4pI1XYoYogyIMiDKgIAa/IIQBAF79+7VFfwIc92Q/v37my5DDHHdgP799+oKfoQFuOx1++uqTYQpA6IMiDIgoAa/IOg9+OI4IX369DFdhhjiOAF9+ug9+FFW8b7LPnrfZYQpA6IMiDIgoAa/ILiuS+/evbVFP8KyWZtp06aZLkMMyWZdpk3rrS36EeaSpXd2mrZlRpgyIMqAKAMCavALgu/77Ny5E9/3TZcihuhD9qLNdX0GD96J62oNiCofl53uYHxty4wsZUCUAVEGBNTgF4QwDDl8+DBhGJouRQyx7ZCioiLTZYghFfN/GNvWGhBVITaHnSJCPa1HljIgyoAoAwJq8AuC67r06tVLW/QjLJezmTlzpukyxJBczmXmzF7kcloDosolR6/sTFxypksRQ5QBUQZEGRBQg18QfN9n+/bt2qIfYa4bMmzYMNNliCGu6zNs2HZt0Y8wH5ftsWHalhlhyoAoA6IMCDTiBn///v2MHj2aSy65hEQiQadOnbj33ns5fPiwkfM0dul02nQJYpBth7Rp08Z0GWKIbUObNmnsRruiS/2zSVttaMRP61LvlAFRBkQZEBrnr3d27dpF7969OXDgAEOGDOHyyy/ntdde47HHHuP5559n/fr1p9XM1NV5GjvHcejZs6fpMsSgXM5m9uzZXHfddaZLEQNyOYfZs7UGRJlDjp652abLEIOUAVEGRBkQaKS/3vnOd77DgQMHmDVrFkuXLmX69OmsXr2aSZMmUVZWxve///0GPU9j5/s+W7du1Rb9CIvFQkpKSkyXIYbEYj4lJVuJxbQGRJVPjK3xEnxipksRQ5QBUQZEGRBohA3+rl27WLVqFZ07d2b8+PE17ps2bRpNmzblySef5KOPPmqQ84iIiIiIiIicDxpdg//SSy8BUFxcjH3cG0qbNWtGnz59SKfTbNy4sUHOcz5wHIfu3bvjOI7pUsSQfN5iwYIFpssQQ/J5hwULupPPaw2IKoc83XMLcMibLkUMUQZEGRBlQKARvge/rKwMgMsuu6zW+y+77DJWrVrFjh07uOWWW+r1PNlslmw2W/XvDz/8EKDqA/oqt8Q7jlPj2PM8LMuqOrZtG9u2T3qcz+dxHKfq2HVdLMuqOgbwPK/GcSwWIwzDqvP85S9/4YorriCRSFBeXk4ikSCbfR3bPorrhuRyNo4T4jjHjm07JJ+veey64SffwyIWCwgCC9+veRyPB/j+sWPPswgCi0QiIJezCMOax8lkQDZ77DiTsQBIJsPjjm0sKyS
ROHYcj4dkszWPbTusNqYyHCdOeXk5hw8fJgxDXNfF933Ky8sBcN3XgaPn0ZjOfJ5c901GjhxX9f9DZfYq/z+Ix1/H846eV2M683l6kzCE8vJyPvjggxo/T+Xl5SSTSTKZiiycP2M6vXmKxQJGj/6Q+fNbkM/vJJlMUl5ezocffli1XlRfFyzraKMf07llrwzXjVdlIQiCE9aF1/c6HMna2GGe0KpYW63QI7BiWARYoX/ccRwL/9hx6GERENgJrCCHRXjccRIryFY7zgAQHndsBxlCLEI7Ue04jh1kjzu2CS0XO8wRWg4hTrXjil9if9CuhBbvPY0TlBNaLjveA/BOWBcsy6K8vJx4PM7re30+yjTOMVXMTfXjs5unHe8GVc+NR44cqXrOrVwXXt+T5aPM+TWm2uYpDOFIu7toduAZHP9ojXna8S61rgthGFb7mbA4kmtcY6rr7O14Pw5kKS8v59ChQ7iuSxAEJ1kXzo8xVZ8n327C0YuG0/y9p7DCoNZ52vGeDeRrrAuVr2HLy8uJxWK8vjc4ti404nXvXOZpxzs+8Xi8al2ofD1d+Vz5+t5ctXXh/BiTFfp49gUcuWgELd9dAJZ9ynna8W54wrpQ2WtU/UzssTiSa7zrXl1k72TrQuVrh+rHvu/X6DXgxD6wvnrCyjkJw4rXYacUNjLjxo0LgXDOnDm13v/AAw+EQPiTn/yk3s9TWloaAvrSl770pS996Utf+tKXvvSlL30Z/dq3b9+n9tON7gr+pwk/+a2FZVn1fp7777+f7373u1X/DoKAQ4cO0aZNm3P+/nXpyJEjdOjQgX379tG8eXPT5YgBykC0af5FGRBlQJQBUQYKVxiGHD16lEsuueRTH9voGvwWLVoAx7bDH+/IkSM1Hlef50kkEiQSiRq3tWzZ8pTf16TmzZvrhznilIFo0/yLMiDKgCgDogwUpk/rfys1ug/ZKyoqAmDHjh213v/mm28C0K1btwY5j4iIiIiIiMj5oNE1+DfddBMAq1atIgiCGvcdPXqU9evXk0qluPbaaxvkPCIiIiIiIiLng0bX4Hfp0oXi4mL27NnD7Nmza9xXWlrKxx9/zF133UXTpk0ByOfzbN++nV27dp3Tec5niUSC0tLSE95OINGhDESb5l+UAVEGRBkQZUAArDA8nc/ab1i7du2id+/eHDhwgCFDhnDFFVewceNGXnrpJbp168aGDRto06YNAHv27KFz58507NiRPXv2nPV5RERERERERM5njbLBB9i3bx8//OEPef755zl48CAXX3wxQ4cOpbS0lNatW1c97lQN/pmcR0REREREROR81mgbfBERERERERE5fY3uPfgiIiIiIiIicubU4IuIiIiIiIgUADX4jdD+/fsZPXo0l1xyCYlEgk6dOnHvvfdy+PBhI+eRhneuc3fw4EHmzp3L7bffTteuXUmlUrRo0YLrr7+eefPmnfCnI6XxqY+f36eeegrLsrAsi7lz59ZhtVIf6jID69at42tf+xoXX3wxiUSCiy++mOLiYlasWFEPlUtdqKv5X7ZsGf379+ezn/0sqVSKSy+9lDvuuINXX321niqXuvBf//Vf3HPPPfTt25fmzZtjWRYjR448q3Pp9eD5qS4yoNeDERVKo7Jz586wbdu2IRAOGTIknDJlSnjTTTeFQFhUVBT+7W9/a9DzSMOri7n7+c9/HgJhu3btwhEjRoRTp04NS0pKwhYtWoRA+NWvfjUMgqABRiNnoz5+ft96662wRYsW4QUXXBAC4Zw5c+qhcqkrdZmBhx56KATCCy+8MBw1alR4//33h+PGjQu/+MUvhpMnT67HUcjZqqv5v++++0IgbNOmTThmzJhwypQp4de+9rUwFouFlmWFTzzxRD2PRM7WF77whRAIL7jggvDyyy8PgfDOO+884/Po9eD5qy4yoNeD0aQGv5EpLi4OgXDWrFk1bp80aVIIhN/61rca9DzS8Opi7l588cVw6dKloed5NW5/551
3wg4dOoRA+Otf/7pO65a6U9c/v0EQhLfcckt46aWXht/73vfU4J8H6ioDzzzzTAiE/fv3D48cOXLC/blcrk7qlbpVF/P/zjvvhLZthxdddFH43nvv1bhv9erVIRB26tSpTuuWurN69epwx44dYRAE4UsvvXTWDb5eD56/6iIDej0YTWrwG5GdO3eGQNi5c+fQ9/0a9x05ciRs2rRpmEqlwqNHjzbIeaThNcTc/fjHPw6BcPz48edartSD+sjAo48+GlqWFb788sthaWmpGvxGrq4y4Pt+2KlTpzCVSoUHDhyoz5KlDtXV/P/hD38IgXDw4MG13t+sWbPwggsuqLO6pf6cbXOn14OF41x+yXMyej1YuPQe/EbkpZdeAqC4uBjbrjk1zZo1o0+fPqTTaTZu3Ngg55GG1xBzF4/HAYjFYmdfqNSbus7Atm3bmDp1KhMnTqRfv351Xq/UvbrKwIYNG9izZw+DBg2iVatWLF++nBkzZvDYY4/p/deNWF3N/2WXXUYikWDjxo0cOHDghO9x9OhR/v7v/75ui5dGRa8H5VT0erBwqcFvRMrKyoCKJ+XaVN6+Y8eOBjmPNLz6njvP83jiiScAuPXWW8/qHFK/6jIDnufxP//n/+Tv/u7v+MlPflJ3RUq9qqsMbNq0CYB27dpx9dVXc9tttzF16lTuvfdeevfuzQ033MD7779fh5VLXair+W/dujUzZ87k/fff53Of+xzjxo3j/vvv54477uDWW2+luLiYX/ziF3VbvDQqej0oJ6PXg4XNNV2AHPPhhx8C0KJFi1rvr7z9gw8+aJDzSMOr77mbOnUqW7du5ctf/jIDBgw4q3NI/arLDPzzP/8zmzdv5pVXXiGVStVZjVK/6ioDlVdtf/7zn3PppZeyevVqevXqxd69e7nvvvtYuXIld9xxB2vWrKmz2uXc1eUacM8999CxY0dGjRpV4y9ndO3albvvvpu2bduee8HSaOn1oJyMXg8WNl3BP4+EYQiAZVmN4jzS8M5l7h599FH+5V/+haKiIp588sm6Lk0ayOlm4LXXXuMnP/kJ9913H9ddd11DlCYN5HQz4Pt+1eN/85vfcNNNN3HBBRdw5ZVXsmTJEj772c/y8ssva7v+eeZMngcefvhhbr/9dkaNGsWuXbv4+OOPef3117n00ku58847+ad/+qf6LlcaMb0ejCa9Hix8avAbkcrfpFb+xvV4R44cqfG4+j6PNLz6mrvHHnuMSZMmccUVV7BmzRouvPDCcytU6k1dZKBya363bt146KGH6r5IqVd1tQ60atUKgEsvvZT/8T/+R437UqlU1VWb11577ZzqlbpVV/O/evVqHnjgAYYMGcK//uu/cumll9KkSROuuuoqlixZQvv27fmXf/kXdu3aVbcDkEZDrwfleHo9GA1q8BuRoqIi4OTvhXrzzTcB6NatW4OcRxpefczdT3/6U+699166d+/OmjVraNeu3bkXKvWmLjLw0UcfsWPHDrZt20YymcSyrKqvadOmATBu3Dgsy+Lee++t2wHIOavr54KWLVvWen/lLwDS6fTZlCn1pK7mf/ny5QDcdNNNJ9zXpEkTrrnmGoIgYPPmzedSrjRiej0o1en1YHToPfiNSOWT8KpVqwiCoMYnnh49epT169eTSqW49tprG+Q80vDqeu4efvhhHnjgAXr06MHvf/97/ab2PFAXGUgkEowZM6bW+/70pz+xefNmrr/+eoqKirR9vxGqq3WgX79+uK7Lzp07yeVyVZ+YXGnr1q0AdOrUqW4HIOekruY/l8sBnPSDFCtvTyQSdVG2NEJ6PSiV9HowYsz9hT6pTXFxcQiEs2bNqnH7pEmTQiD81re+VXVbLpcLt23bFu7cufOcziONS11l4J//+Z9DILz66qvDgwcP1nvdUnfqKgO1KS0tDYFwzpw5dVqz1K26ysCdd94ZAmFpaWmN21etWhValhW2aNEiPHz4cH0MQc5BXcz/M888EwLhRRddFO7
fv7/GfStWrAgtywqTyWT4t7/9rf4GInXi0/4Gul4PFr5zyYBeD0aPFYaffMKGNAq7du2id+/eHDhwgCFDhnDFFVewceNGXnrpJbp168aGDRto06YNAHv27KFz58507NiRPXv2nPV5pHGpiww88cQTjBo1CsdxuOeee2p9f12nTp0YNWpUA41KzkRdrQO1efDBB5k2bRpz5sxh7Nix9TwSOVt1lYEDBw7Qp08fdu7cSb9+/ao+RX/JkiVYlsXChQu54447DIxQTqUu5j8IAgYMGMALL7xAs2bNuP3222nXrh3btm3jt7/9LWEY8uijjzJx4kRDo5RTWbp0KUuXLgXg3XffZeXKlVx66aX07dsXgAsvvJCf/vSngF4PFqq6yIBeD0aU4V8wSC3eeuutcNSoUWG7du3CWCwW/t3f/V04YcKEE37rtnv37hAIO3bseE7nkcbnXDNQeZX2VF833HBDww1IzlhdrQPH0xX880ddZeDgwYPhpEmTwk6dOoWxWCxs3bp1OHjw4PDVV19tgFHI2aqL+c/lcuHPfvaz8Etf+lLYrFmz0HGc8DOf+Uw4aNCgcOXKlQ00Ejkbn/Y8Xn2+9XqwMNVFBvR6MJp0BV9ERERERESkAOhT9EVEREREREQKgBp8ERERERERkQKgBl9ERERERESkAKjBFxERERERESkAavBFRERERERECoAafBEREREREZECoAZfREREREREpACowRcREREREREpAGrwRURERERERAqAGnwREZHz2KhRo7Asiz179jTY9+zUqROdOnVqsO9X3S9/+Ussy6r6uvXWW43UcSZuu+22GjX/8pe/NF2SiIgUKDX4IiIi9WDEiBFYlsXPf/7zT33sTTfdhGVZ/Pa3v22AyupHZePdUM3rkCFDKC0tZeTIkQ3y/QCuvPJKPv/5z5/xfzdixAhKS0sZMmRIPVQlIiJyjBp8ERGRevDNb34TgDlz5pzycbt27eLll1+mffv2fPnLX26I0s7Ziy++yIsvvmi0hqFDh/Lggw82WIO/Y8cO/vrXv3L77bef8X87YsQIHnzwQYYOHVr3hYmIiFSjBl9ERKQe3HjjjXTr1o3Nmzfzpz/96aSPmzt3LmEYMnr0aBzHacAKz16XLl3o0qWL6TIa1JIlSwDOqsEXERFpKGrwRURE6sm4ceOAiia+Np7n8ctf/hLbthkzZkzV7du3b2fUqFF06NCBRCLBRRddxIgRIygrKzuj7//MM8/Qt29fWrRoQSqVonv37vzkJz8hk8nU+vj9+/czYcIELrvsMpLJJK1bt+aaa67hoYceqvG449+Df+ONN1JSUgJASUlJjfeb79mzh6lTp2JZFk8++WSt3/f111/Hsiy+8pWvnNH4avPggw9iWRZr1qxh0aJFXH311TRp0oRLLrmE7373u2SzWQB+//vfc8MNN9CsWTNatWrFXXfdxaFDh0563meffZbOnTvTo0ePqtuWLFnCTTfdRLt27UgkErRr147rr7+e2bNnn/M4REREzoYafBERkXpy9913E4/HWbhwIel0+oT7f/vb3/Luu+9SXFxMx44dAXj++ee56qqrWLhwIb169WLixInccsstPPvss1xzzTWn3A1Q3ZQpUxg2bBhlZWXceeed/K//9b8Iw5Dvf//7FBcXk8vlajz+j3/8I1/4whf4t3/7N9q3b8/EiRMZMWIEF1xwAQ8++OApv9eoUaOq3l9e+d74yq+WLVvy7W9/G9u2+Y//+I9a//tf/OIXAHzrW986rbGdjn/7t39jzJgxFBUV8Y//+I+0adOGn/3sZ3z729/mV7/6Fbfddhtt2rTh29/+Np/73Od46qmnuPPOO2s919tvv82mTZtqXL3/+c9/zle/+lW2b9/O4MGDue+++7jtttvI5XL6ED0RETEnFBERkXrzD//wDyEQPvHEEyfcN3DgwBAIn3322TAMw/DQoUNhy5YtwwsvvDDctm1bjcdu3bo1bNq0adijR48at999990
hEO7evbvqtldeeSUEwo4dO4bvvfde1e35fL7qe/7oRz+quj2bzYadOnUKgXDhwoUn1PnWW2/V+HfHjh3Djh071rhtwYIFIRAuWLCg1v8fBg0aFALhX/7ylxq3HzlyJGzatGnYoUOH0PO8Wv/bM/k+paWlIRA2b948/Otf/1p1eyaTCT/3uc+Ftm2HLVu2DNesWVN1XxAEYXFxcQiEmzdvPuGcjz/+eAiE69atq7qtZ8+eYTwer/H/b6X333//rGoXERE5V7qCLyIiUo8qP2zv+G36+/fvZ+XKlbRr165qa/qTTz7JBx98wLRp07j88strPP7KK69k3LhxbNmyhf/zf/7PKb/nggULAPjBD35A27Ztq253XZd//dd/xbZt5s2bV3X7f//3f7Nnzx4GDx7M8OHDTzhfhw4dzmDEtfvOd74DwP/+3/+7xu1PP/00H3/8MePGjavTzyCYOHEiV1xxRdW/E4kE3/jGNwiCgK985SvccMMNVfdZllV19f7Pf/7zCedasmQJbdu2pXfv3jX+G9d1icViJzz+wgsvrLNxiIiInAnXdAEiIiKF7Oabb6ZLly6sW7eOsrIyioqKAJg/fz6+71NSUoLrVjwdv/rqqwBs2bKl1m3xO3bsACreo3/llVee9Htu3rwZqPjze8crKiris5/9LLt37+aDDz6gZcuW/OEPfwCo10/xv/XWW+ncuTNPPfUUM2bMIJVKAfAf//EfuK5b4zMI6sLVV199wm2XXHLJp963f//+GrcfOnSIl19+mZKSEmz72HWRO++8k/vuu48rr7ySYcOG0a9fP/r06cNnPvOZuhyGiIjIGVGDLyIiUo8sy2Ls2LHcf//9zJ07l5kzZxIEAfPnz8eyrBqN7cGDB4FP/9N6H3300Snv//DDDwFo165drfdffPHFvPXWW3z44Ye0bNmSDz74AID27duf7rDOmG3bfOtb32Lq1Kn86le/4u6772bjxo38+c9/5vbbb69qsOtKixYtTrit8hcpp7ovn8/XuP2///u/8TyPr371qzVu/+53v8uFF17Iv//7v/PYY4/xs5/9DMuyuOmmm5g5cyZXXXVVXQ1FRETktGmLvoiISD0rKSkhFovx5JNPks/n+f3vf8/evXurru5Xqmw8//znPxOG4Um/7r777lN+v8rzvPvuu7Xe/84779R4XMuWLYGKD5OrT2PGjCGRSFR92F7l/9blh+vVtSVLltC8eXNuvvnmE+676667+MMf/sDBgwdZvnw5Y8aMYc2aNRQXF/P+++8bqFZERKJODb6IiEg9u+iiixg8eDAHDhxg2bJlVe/Hr3x/fqVrr70WgHXr1p3T9+vZsycAa9asOeG+nTt3sn//fjp37lzV2Fd+35UrV57196x8/7zv+yd9zIUXXsgdd9zBq6++yiuvvMIzzzxD586dKS4uPuvvW5/Ky8tZtWoVgwYNIh6Pn/RxLVu2ZODAgcyZM4dRo0Zx8ODBc55DERGRs6EGX0REpAGMGzcOgJkzZ/Lcc8/xmc98hqFDh9Z4TElJCS1btmTatGm89tprJ5wjCIJam/bjjR49GoAf/ehHNa4k+77P9773PYIgqPHWgK985St06tSJpUuX8qtf/eqE853Olf02bdoAsG/fvlM+rvLD9v7hH/6B8vJyvvnNb2JZ1qee34Tf/e53pNPpGn8er9Lzzz+P53kn3H7gwAEAkslkvdcnIiJyPL0HX0REpAEUFxfTuXNnNm7cCMDdd999wlXhNm3a8F//9V/cfvvtXHvttdxyyy1ceeWV2LbNW2+9xauvvsrBgwfJZDKn/F69e/fmn/7pn3jkkUfo3r07X//612natCm/+93v2Lp1K9dffz2TJ0+uenw8HufXv/41xcXFfOMb3+AXv/gF11xzDel0mm3btrF69epam9nqrrvuOpo0acKjjz7KwYMHueiiiwC45557arzn/brrrqNHjx5s2bKFWCxGSUnJGf3/2JCWLFlCMpms9cMHhw0bRjK
Z5Prrr6dTp06EYci6devYtGkTV111Ff379zdQsYiIRJ0afBERkQZQ+YF6P/jBDwAYO3ZsrY+75ZZbeOONN/jpT3/KypUrWbduHfF4nEsuuYSbb76Zr33ta6f1/WbMmEHPnj15/PHHq97736VLF370ox9x3333nfDLhS9+8Yts2bKF6dOn87vf/Y5XXnmFZs2a0bVrV6ZNm/ap369Vq1b85je/Ydq0aSxYsICPP/4YgJEjR57woXYlJSVMnDiR22+/veoXAY1NPp9n+fLl/P3f/z0XXHDBCfdPnz6dlStX8qc//YkVK1aQTCbp2LEjM2bM4B//8R9PuaVfRESkvlhhGIamixAREZHouOuuu3jqqad48cUXa/3wulP55S9/SUlJCQsWLGDUqFH1UyCwatUqBgwYwPz58+tsl0FD1S4iItGl9+CLiIhIg9m7dy/PPPMMn/vc5864ua+upKQEy7K49dZb67C6Y5YsWYLjOHzlK18553PddtttWJbVqN+OICIihUFX8EVERKTePfXUU5SVlfHMM8+wc+dOnn322Vo/vO7TbNmyhaVLl1b9u2vXrowcObIOK617CxcuZMeOHVX/Hjp0KD169DBXkIiIFCw1+CIiIlLvbrzxRtauXUuHDh343ve+xz333GO6JBERkYKjBl9ERERERESkAOg9+CIiIiIiIiIFQA2+iIiIiIiISAFQgy8iIiIiIiJSANTgi4iIiIiIiBQANfgiIiIiIiIiBUANvoiIiIiIiEgBUIMvIiIiIiIiUgDU4IuIiIiIiIgUgP8P0vqeIpnWhe8AAAAASUVORK5CYII=", - "text/plain": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], - "source": [ - "tidal.graphics.tidal_phase_probability(data.d, data.s, flood, ebb) " + "data": { + "text/plain": [ + "" ] + }, + "execution_count": 12, + "metadata": {}, + "output_type": "execute_result" }, { - "cell_type": "code", - "execution_count": 12, - "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "" - ] - }, - "execution_count": 12, - "metadata": {}, - "output_type": "execute_result" - }, - { - "data": { - "image/png": "", - "text/plain": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], - "source": [ - "tidal.graphics.tidal_phase_exceedance(data.d, data.s, flood, ebb)" + "data": { + "image/png": "", + "text/plain": [ + "
" ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [] - } - ], - "metadata": { - "kernelspec": { - "display_name": "base", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.9.12" - }, - "vscode": { - "interpreter": { - "hash": "1b38577481a8c337d860514619746143ecc67292e11e5807b52b737c5351e332" - } + }, + "metadata": {}, + "output_type": "display_data" } + ], + "source": [ + "tidal.graphics.tidal_phase_exceedance(data.d, data.s, flood, ebb)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [] + } + ], + "metadata": { + "kernelspec": { + "display_name": "base", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.9.12" }, - "nbformat": 4, - "nbformat_minor": 4 + "vscode": { + "interpreter": { + "hash": "1b38577481a8c337d860514619746143ecc67292e11e5807b52b737c5351e332" + } + } + }, + "nbformat": 4, + "nbformat_minor": 4 } diff --git a/examples/tidal_performance_example.ipynb b/examples/tidal_performance_example.ipynb index 1eb311853..a3cd56c62 100644 --- a/examples/tidal_performance_example.ipynb +++ b/examples/tidal_performance_example.ipynb @@ -1,690 +1,715 @@ { - "cells": [ - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "# Tidal Power Performance Analysis\n", - "\n", - "The following example demonstrates a simple workflow for conducting the power performance analysis of a turbine, given turbine specifications, power data, and Acoustic 
Doppler Current Profiler (ADCP) water measurements.\n", - "\n", - "In this case, the turbine specifications can be broken down into\n", - " 1. Shape of the rotor's swept area\n", - " 2. Turbine rotor diameter/height and width\n", - " 3. Turbine hub height (center of swept area)\n", - "\n", - "Additional data needed:\n", - " - Power data from the current energy converter (CEC)\n", - " - 2-dimensional water velocity data\n", - "\n", - "In this jupyter notebook, we'll be covering the following three topics:\n", - " 1. CEC power-curve\n", - " 2. Velocity profiles\n", - " 3. CEC efficiency profile (or power coefficient profile)\n", - "\n", - "Start by importing the necessary tools:" - ] - }, - { - "cell_type": "code", - "execution_count": 1, - "metadata": { - "scrolled": true - }, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "c:\\Users\\mcve343\\Anaconda3\\lib\\site-packages\\xarray\\backends\\cfgrib_.py:29: UserWarning: Failed to load cfgrib - most likely there is a problem accessing the ecCodes library. Try `import cfgrib` to get the full error message\n", - " warnings.warn(\n" - ] - } - ], - "source": [ - "import numpy as np\n", - "import matplotlib.pyplot as plt\n", - "\n", - "from mhkit.tidal import performance\n", - "from mhkit.dolfyn import load" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "In this case, we'll use ADCP data from the ADCP example notebook. I am importing a dataset from the ADCP example notebook. This data retains the original timestamps (1 Hz sampling frequency) and was rotated into the principal coordinate frame (streamwise-cross_stream-up)." 
- ] - }, - { - "cell_type": "code", - "execution_count": 2, - "metadata": { - "scrolled": true - }, - "outputs": [], - "source": [ - "# Open processed ADCP dataset\n", - "ds = load('data/tidal/adcp.principal.a1.20200815.nc')" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "Next, since we don't have power data, we'll invent a mock timeseries based off the cube of water velocity, just to have something to work with." - ] - }, - { - "cell_type": "code", - "execution_count": 3, - "metadata": {}, - "outputs": [], - "source": [ - "# Streamwise and hub-height water velocity\n", - "streamwise_vel = ds['vel'].sel(dir='streamwise')\n", - "hub_height_vel = abs(streamwise_vel.isel(range=10))\n", - "\n", - "# Emulate power data\n", - "power = hub_height_vel**3 * 1e5\n", - "# Emulate cut-in speed by setting power at flow speeds below 0.5 m/s to 0 W\n", - "power = power.where(abs(streamwise_vel.mean('range')) > 0.5, 0)" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "The first step for any of the following calculations is to first split velocity into ebb and flood tide. You'll need some background information on the site to know which direction is positive and which is negative in the data." - ] - }, - { - "cell_type": "code", - "execution_count": 4, - "metadata": {}, - "outputs": [], - "source": [ - "ebb = streamwise_vel.where(streamwise_vel > 0)\n", - "flood = streamwise_vel.where(streamwise_vel < 0)" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "With the ebb and flood velocities, we can also divide the power data into that for ebb and flood tides." 
- ] - }, - { - "cell_type": "code", - "execution_count": 5, - "metadata": {}, - "outputs": [], - "source": [ - "# Make sure ebb and flood are on same timestamps\n", - "power = power.interp(time=streamwise_vel['time'])\n", - "\n", - "power_ebb = power.where(~ebb.mean('range').isnull(), 0)\n", - "power_flood = power.where(~flood.mean('range').isnull(), 0)" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "### Power-curve\n", - "\n", - "Now with power and velocity divided into ebb and flood tides, we can calculate the power curve for the CEC in both conditions\n" - ] - }, - { - "cell_type": "code", - "execution_count": 6, - "metadata": {}, - "outputs": [], - "source": [ - "power_curve_ebb = performance.power_curve(\n", - " power_ebb,\n", - " velocity=ebb,\n", - " hub_height=4.2,\n", - " doppler_cell_size=0.5, \n", - " sampling_frequency=1, \n", - " window_avg_time=600,\n", - " turbine_profile='circular',\n", - " diameter=3,\n", - " height=None,\n", - " width=None)\n", - "power_curve_flood = performance.power_curve(\n", - " power_flood,\n", - " velocity=flood,\n", - " hub_height=4.2,\n", - " doppler_cell_size=0.5, \n", - " sampling_frequency=1, \n", - " window_avg_time=600,\n", - " turbine_profile='circular',\n", - " diameter=3,\n", - " height=None,\n", - " width=None)" - ] - }, - { - "cell_type": "code", - "execution_count": 7, - "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
U_avgU_avg_power_weightedP_avgP_stdP_maxP_min
U_bins
(0.0, 0.1]0.0674590.0000000.0000000.0000000.0000000.000000
(0.1, 0.2]0.1156140.0000000.0000000.0000000.0000000.000000
(0.2, 0.3]0.2496760.2256390.0000000.0000000.0000000.000000
(0.3, 0.4]0.3396000.3155610.0000000.0000000.0000000.000000
(0.4, 0.5]0.4593930.4372492890.7249862660.8100225551.535008229.914964
(0.5, 0.6]0.5485070.53297419677.3435184645.89093624323.23445415031.452582
(0.6, 0.7]0.6714490.65536240369.4355173679.26013545506.30667737083.470337
(0.7, 0.8]0.7261890.70484552413.9720242856.73714257360.86147350670.102583
(0.8, 0.9]0.8439580.82591679944.0008559798.56967496206.92802566531.815452
(0.9, 1.0]0.9387010.920960103970.0421755828.263891112163.97743499100.055332
(1.0, 1.1]1.0466071.026293148511.10000818809.350864171583.550611124179.073981
(1.1, 1.2]1.1473481.127691200340.8205816299.518554209073.741656187772.752668
\n", - "
" - ], - "text/plain": [ - " U_avg U_avg_power_weighted P_avg P_std \\\n", - "U_bins \n", - "(0.0, 0.1] 0.067459 0.000000 0.000000 0.000000 \n", - "(0.1, 0.2] 0.115614 0.000000 0.000000 0.000000 \n", - "(0.2, 0.3] 0.249676 0.225639 0.000000 0.000000 \n", - "(0.3, 0.4] 0.339600 0.315561 0.000000 0.000000 \n", - "(0.4, 0.5] 0.459393 0.437249 2890.724986 2660.810022 \n", - "(0.5, 0.6] 0.548507 0.532974 19677.343518 4645.890936 \n", - "(0.6, 0.7] 0.671449 0.655362 40369.435517 3679.260135 \n", - "(0.7, 0.8] 0.726189 0.704845 52413.972024 2856.737142 \n", - "(0.8, 0.9] 0.843958 0.825916 79944.000855 9798.569674 \n", - "(0.9, 1.0] 0.938701 0.920960 103970.042175 5828.263891 \n", - "(1.0, 1.1] 1.046607 1.026293 148511.100008 18809.350864 \n", - "(1.1, 1.2] 1.147348 1.127691 200340.820581 6299.518554 \n", - "\n", - " P_max P_min \n", - "U_bins \n", - "(0.0, 0.1] 0.000000 0.000000 \n", - "(0.1, 0.2] 0.000000 0.000000 \n", - "(0.2, 0.3] 0.000000 0.000000 \n", - "(0.3, 0.4] 0.000000 0.000000 \n", - "(0.4, 0.5] 5551.535008 229.914964 \n", - "(0.5, 0.6] 24323.234454 15031.452582 \n", - "(0.6, 0.7] 45506.306677 37083.470337 \n", - "(0.7, 0.8] 57360.861473 50670.102583 \n", - "(0.8, 0.9] 96206.928025 66531.815452 \n", - "(0.9, 1.0] 112163.977434 99100.055332 \n", - "(1.0, 1.1] 171583.550611 124179.073981 \n", - "(1.1, 1.2] 209073.741656 187772.752668 " - ] - }, - "execution_count": 7, - "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "power_curve_flood" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "Next we can plot the two power curves. A velocity bin is missing in the ebb tide power curve in this example because the data is so short, there are no samples for that bin." - ] - }, - { - "cell_type": "code", - "execution_count": 8, - "metadata": {}, - "outputs": [ - { - "data": { - "image/png": "", - "text/plain": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], - "source": [ - "def plot_power_curve(P_curve, ax):\n", - " ax.plot(P_curve['U_avg'], P_curve['P_avg'], '-o', color='C0', label='Avg Power')\n", - " ax.plot(P_curve['U_avg'], (P_curve['P_avg'] - P_curve['P_std']), '--+', color='C1', label='Power - 1 Std Dev')\n", - " ax.plot(P_curve['U_avg'], (P_curve['P_avg'] + P_curve['P_std']), '-+', color='C1', label='Power + 1 Std Dev')\n", - " ax.plot(P_curve['U_avg'], P_curve['P_min'], '--x', color='C2', label='Min Power')\n", - " ax.plot(P_curve['U_avg'], P_curve['P_max'], '-x', color='C2', label='Max Power')\n", - " ax.set(xlabel='Flow Speed at Hub Height [m/s]', ylabel='Power [W]')\n", - " ax.legend()\n", - "\n", - "fig, ax = plt.subplots(1,2, figsize=(10,7))\n", - "plot_power_curve(power_curve_ebb, ax[0])\n", - "plot_power_curve(power_curve_flood, ax[1])" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "### Velocity Profiles\n", - "Various velocity profiles can be created next from the water velocity data, and we can do this again with ebb and flood tide. These functions are following three steps:\n", - " 1. Reshape the data into bins by time (ensembles)\n", - " 2. Apply a function to the ensembles to get ensemble statistics (mean, root-mean-square (RMS), or standard devation)\n", - " 3. Regroup and bin the ensemble statistics by flow speed\n", - "\n", - "These profiles are created using the `velocity_profiles` method, and a profile is specified using the \"function\" argument. 
For the average velocity profiles, we'll set the function = 'mean'.\n" - ] - }, - { - "cell_type": "code", - "execution_count": 9, - "metadata": {}, - "outputs": [], - "source": [ - "avg_profile_ebb = performance.velocity_profiles(\n", - " velocity=ebb, \n", - " hub_height=4.2,\n", - " water_depth=10,\n", - " sampling_frequency=1, \n", - " window_avg_time=600,\n", - " function='mean')\n", - "avg_profile_flood = performance.velocity_profiles(\n", - " velocity=ebb, \n", - " hub_height=4.2,\n", - " water_depth=10,\n", - " sampling_frequency=1, \n", - " window_avg_time=600,\n", - " function='mean')\n" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "### RMS Tidal Velocity\n", - "\n", - "For RMS velocity profiles, we'll set the function = 'rms'." - ] - }, - { - "cell_type": "code", - "execution_count": 10, - "metadata": {}, - "outputs": [], - "source": [ - "rms_profile_ebb = performance.velocity_profiles(\n", - " velocity=ebb, \n", - " hub_height=4.2,\n", - " water_depth=10,\n", - " sampling_frequency=1, \n", - " window_avg_time=600,\n", - " function='rms')\n", - "rms_profile_flood = performance.velocity_profiles(\n", - " velocity=ebb, \n", - " hub_height=4.2,\n", - " water_depth=10,\n", - " sampling_frequency=1, \n", - " window_avg_time=600,\n", - " function='rms')" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "### Std Dev Tidal Velocity\n", - "\n", - "And to get the standard deviation, we'll set function = 'std'." 
- ] - }, - { - "cell_type": "code", - "execution_count": 11, - "metadata": {}, - "outputs": [], - "source": [ - "std_profile_ebb = performance.velocity_profiles(\n", - " velocity=ebb, \n", - " hub_height=4.2,\n", - " water_depth=10,\n", - " sampling_frequency=1, \n", - " window_avg_time=600,\n", - " function='std')\n", - "std_profile_flood = performance.velocity_profiles(\n", - " velocity=ebb, \n", - " hub_height=4.2,\n", - " water_depth=10,\n", - " sampling_frequency=1, \n", - " window_avg_time=600,\n", - " function='std')" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "Finally, we can plot these variables together based on ebb and flood tides. The following code plots the mean and RMS profiles as line plots with \"x\" and \"+\" markers, respectively, and shades the area between +/- 1 standard deviation from the mean." - ] - }, - { - "cell_type": "code", - "execution_count": 12, - "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "Text(0.5, 1.0, 'Flood Tide')" - ] - }, - "execution_count": 12, - "metadata": {}, - "output_type": "execute_result" - }, - { - "data": { - "image/png": 
"iVBORw0KGgoAAAANSUhEUgAAA0oAAAJuCAYAAACOkPJ5AAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjUuMywgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/NK7nSAAAACXBIWXMAAA9hAAAPYQGoP6dpAAEAAElEQVR4nOzdeXxU133//9edRSON9gUhCQnEDkJgxBK22IaAMcFLncROWieO3SZu2qTN6uZbf5s0idPEv+SbJk3dLE2a1o2z2nHSOl4wNt5ZhADJIMQmLAQSEkL7Mlpm5t7fH1czkkDL3NG9oxnp83w8eICuZu69YEtvnXM/53MUTdM0hBBCCCGEEEIE2ab6BoQQQgghhBAi2shASQghhBBCCCGuIQMlIYQQQgghhLiGDJSEEEIIIYQQ4hoyUBJCCCGEEEKIa8hASQghhBBCCCGuIQMlIYQQQgghhLiGDJSEEEIIIYQQ4hoyUBJCCCGEEEKIa8hASYhRPP744yiKMuav1157LfhaRVH4m7/5m5DPeeTIEcP3M969XHtfDzzwAIWFhSGf96tf/arh+xFCCGGN8fLnoYceCr6usLCQBx54YErucaLs2Lp1a0iZ9dWvfjX4971w4cKE1926dStbt2417e8hxEQcU30DQkSz//qv/2LZsmXXHS8qKorofRw8eHDEx1//+td59dVXeeWVV0YcLyoqoqCggM985jORvD0hhBAmGy1/8vLypuhujPnhD39IZ2dn8OPnnnuOf/qnf7ru75Sfn4/L5eLgwYPk5uZOxa0KMS4ZKAkxjuLiYtatWzfVt8HGjRtHfDxr1ixsNtt1xwFSUlIidVtCCCEsEi35E45rJxNPnz4NjP13mjVrVkTuSwijpPROCJP8+7//O0uWLMHlclFUVMRvfvObUV/X1tbGn//5n5ORkUFiYiJ33HEH77zzjmn3MVrpXWdnJw8++CCZmZkkJSWxa9cuzp49O+r7z507x7333kt2djYul4vly5fzgx/8wLT7E0IIYY2LFy/ykY98ZMT373/+539GVdURr2ttbeWTn/wkc+bMIS4ujgULFvAP//AP9Pf3j3idkewI12ild5qm8e1vf5t58+YRHx/PmjVreOGFF0Z9f2dnJw899BDz588nLi6OOXPm8NnPfpaenh5T71PMTPJESYhx+P1+fD7fiGOKomC320cce+aZZ3j11Vd55JFHSExM5Ic//CF/9md/hsPh4O677x7x2o997GPccsst/OpXv+LSpUt86UtfYuvWrRw/fpy0tDTT/w6apnHXXXdx4MAB/vEf/5H169ezf/9+3vve91732qqqKjZv3szcuXP553/+Z3JycnjxxRf59Kc/TXNzM1/5yldMvz8hhBDXGy1/HI6xf2y7evUqmzdvZmBggK9//esUFhby7LPP8tBDD3H+/Hl++MMfAtDX18e2bds4f/48X/va11i1ahVvvvkmjz76KBUVFTz33HOAseww29e+9jW+9rWv8bGPfYy7776bS5cu8eCDD+L3+1m6dGnwdR6Ph5tvvpm6ujr+7//9v6xatYqTJ0/yj//4j5w4cYKXX34ZRVEsv18xjWlCiOv813/9lwaM+stut494LaAlJCRojY2NwWM+n09btmyZtmjRouvO+b73vW/E+/fv368B2j/90z+FfH/333+/lpiYOObn5s2bF/z4hRde0ADt+9///ojXfeMb39AA7Stf+Urw2K233qrl5+drHR0dI177N3/zN1p8fLzW2toa8j0KIYQwbrz88Xq9wdfNmzdPu//++4Mf//3f/70GaKWlpSPO99d//deaoijamTNnNE3TtB//+McaoD355JMjXvetb31LA7S9e/dqmmYsO0L9O5WVlY35uZqaGk3TNK2trU2Lj48fMytvvvnm4LFHH31Us9ls1533d7/7nQZozz//fMj3KMRopPROiHH8/Oc/p6ysbMSv0tLS6163fft2Zs+eHfzYbrfzoQ99iOrqaurq6ka
89sMf/vCIjzdv3sy8efN49dVXLfk7BM577XXvvffeER/39fWxb98+3ve+9+F2u/H5fMFfu3fvpq+vj0OHDllyj0IIIUYaLX/Ge6L0yiuvUFRUxLve9a4Rxx944AE0TQs2/3nllVdITEy8rtoh0EFv3759QOjZYbaDBw/S19c3ZlYO9+yzz1JcXMzq1atHZNatt956XYdaIcIhpXdCjGP58uUhLabNyckZ81hLSwv5+fkTvralpWUSdzq2lpYWHA4HmZmZo97f8Nf5fD4ee+wxHnvssVHP1dzcbMk9CiGEGCnU/AloaWkZdWuIQKe8QMa0tLSQk5NzXUladnY2DodjxOtCyQ6zBa4/Xq4GXLlyherqapxO56jnkswSkyUDJSFM0NjYOOaxa0NmrNcuWrTIknvLzMzE5/PR0tIy4l6uvY/09HTsdjv33Xcfn/rUp0Y91/z58y25RyGEEJOTmZlJQ0PDdccvX74MQFZWVvB1paWlaJo2YrDU1NSEz+cb8bpQssNsgWuNlZXDB4NZWVkkJCTwn//5n6OeK/B3ESJcUnonhAn27dvHlStXgh/7/X5++9vfsnDhwhFPkwB++ctfjvj4wIED1NbWWraJ3rZt20a97q9+9asRH7vdbrZt20Z5eTmrVq1i3bp11/26dtAnhBAiOmzfvp2qqiqOHTs24vjPf/5zFEUJZsH27dvp7u7mf/7nf657XeDzEHp2mG3jxo3Ex8ePmZXD3X777Zw/f57MzMxRMyvUzdeFGIs8URJiHJWVldd1HQJYuHDhiH0fsrKyeM973sOXv/zlYNe706dPj9oi/MiRI3z84x/nnnvu4dKlS/zDP/wDc+bM4ZOf/KQlf4edO3dy00038cUvfpGenh7WrVvH/v37eeKJJ6577fe//33e/e53c+ONN/LXf/3XFBYW0tXVRXV1NX/84x+v2+BWCCFEdPjc5z7Hz3/+c2677TYeeeQR5s2bx3PPPccPf/hD/vqv/5olS5YA8NGPfpQf/OAH3H///Vy4cIGVK1fy1ltv8c1vfpPdu3ezY8cOwFh2mCk9PZ2HHnqIf/qnfxqRlV/96levK7377Gc/y9NPP81NN93E5z73OVatWoWqqly8eJG9e/fyhS98gQ0bNlh6v2J6k4GSEOP48z//81GP//SnP+XjH/948OM777yTFStW8KUvfYmLFy+ycOFCfvnLX/KhD33ouvf+7Gc/44knnuBP//RP6e/vZ9u2bXz/+98nIyPDkr+DzWbjmWee4fOf/zzf/va3GRgYYMuWLTz//PPX7fpeVFTEsWPH+PrXv86XvvQlmpqaSEtLY/HixezevduS+xNCCDF5s2bN4sCBAzz88MM8/PDDdHZ2smDBAr797W/z+c9/Pvi6+Ph4Xn31Vf7hH/6B//f//h9Xr15lzpw5PPTQQyO2gDCSHWYbvtXGE088wbJly/jxj3/Md77znRGvS0xM5M033+T/+//+P37yk59QU1NDQkICc+fOZceOHfJESUyaommaNtU3IYQQQgghhBDRRNYoCSGEEEIIIcQ1ZKAkhBBCCCGEENeQgZIQQgghhBBCXGNKB0pvvPEGd9xxB3l5eSiKcl2rSk3T+OpXv0peXh4JCQls3bqVkydPTs3NCiGEmBEkm4QQQsAUD5R6enq44YYb+Ld/+7dRP//tb3+b7373u/zbv/0bZWVl5OTkcMstt9DV1RXhOxVCCDFTSDYJIYSAKOp6pygKf/jDH7jrrrsAfcYuLy+Pz372s/yf//N/AOjv72f27Nl861vf4hOf+MQU3q0QQoiZQLJJCCFmrqjdR6mmpobGxkZ27twZPOZyubj55ps5cODAmGHU399Pf39/8GNVVWltbSUzMxNFUSy/byGEEDpN0+jq6iIvLw+bbXosiZVsEkKI2GYkm6J2oNTY2AjA7NmzRxyfPXs2tbW1Y77v0Ucf5Wtf+5ql9yaEECJ0ly5dIj8/f6pvwxSSTUIIMT2Ekk1RO1AKuHamTdO
0cWffHn744RE7UHd0dDB37lwuXbpESkqKZfcpIqPZ08+B+rZxX9Pl8bLvxBUOn2sJHls2J4Udq/QfbJITnCS7nde9TwHuWJxj6v1OmbZK6L084csOJ7ZTmdh93XF3Vxc3//G35NZfREP/t7mwcClvb94GQG9iMp7kZDy9Ho6dPEbVO1XB987Lncea4jUAJMYn4k5wG7r1XCWX99rfa+g9Ijp1dnZSUFBAcnLyVN+K6SSbxHBVzZ1Ut3nGfU242ZTtjmPjnAxzb3iqXHkd/P0TvuwP6Vdoc3pHHHN3dXHDwddY/nZZ8NhouQTg6fXw5tE3qb08NHkx2Wxaa1vLDbYbDL1HRCcj2RS1A6WcHP0H1sbGRnJzc4PHm5qarpvJG87lcuFyua47npKSImE0DfQ7+nF3+MZ9zVvVDRy52EtOdjpNHfo35LPNPha0qexcnTvm+xSYPv+P+JPAMXEIJCYNkJDov+54ydv7Wdp8CVwKdYULyb9wnlV1Z+m/UsixG3cAkABU1lZypuEMcYlx+FX9PHXtdczpnMP6levDunW34ibFPk3+Owjg+kFFLJNsEqNJ6ge31z7uawLZ5ExIxK/qy8NDyabERNf0+X/Ekwj+8f+dANwpCfQ5R/6IWvL2ftafPkJb3mzSW5oARs0l0LOprq0Oe4Idd7wbT59n0tmUZEsixTZN/jsIILRsitqi8fnz55OTk8NLL70UPDYwMMDrr7/O5s2bp/DORDTbW9HAnvIGdpXkMjs1Pnh809Is9pQ3sLeiYQrvLjasefNl1r++lwuLl484fnLNRta/vpc1b74MQNmJMkqPl7Jh1Qbs9qHgK15UTOnxUspOlCHEdCPZJMIxPJsctqEfziSbQhPIpbKbd9KelR08fm0uwVA2FS0qGnEOySYRjil9otTd3U11dXXw45qaGioqKsjIyGDu3Ll89rOf5Zvf/CaLFy9m8eLFfPOb38TtdnPvvfdO4V2LaKZqGrtKctm5Opf/2ncegOX5Kdy6OpdUtxM1Opo8RjVFVSm7eSe97kQKz53C73Bw5MYdnFqzEU9yCoqqAqBqKhtWbWD9yvWUnyoHYOWSlawrXkeiOxFVU6fyryFE2CSbhNmGZ9OrJ64AcOPyWWxflSPZFIJALh27cQc7n/o5ALWLlnHsxh0jcgmGsqkgt4Cq6ioURWH9yvUULy6WbBKGTelA6ciRI2zbti34caB++/777+fxxx/ni1/8Ir29vXzyk5+kra2NDRs2sHfv3mlZ7y7Msask77pjKwpSSXE7xy1tEEOO3qx381p+9CAAfoczeCxQ3gCwYdWG6957w7IbSExIDLu0QYhoINkkzDZaNt20IluyKUSBDBqudnERnuSUEbkEQ9nU2Kw3XrHZbMFjkk3CqCkdKG3dupXxtnFSFIWvfvWrfPWrX43cTQkhIksDh8+BXbWjaAoOxUGfvW+q70qEyOl0jii9nA4km4QQ12aTZtPos0k2xQK73Y7D4TBlfWzUNnMQQkx/Tq+TOY1zSO1NxTa4ZNKOnRqlZorvTIRKURTy8/NJSkqa6lsRQghTSDbFPrfbTW5uLnFxcZM6jwyUhBBTQlEVFtcuJtWeStqcNOxOO4qi4MBBiiKdhWKBpmlcvXqVuro6Fi9ePO2eLAkhZp6xsimBBBKUhIlPIKaUpmkMDAxw9epVampqWLx48aQ2PJeBkhBiSsR543CpLjILMolzD834OHESr8SP804RTWbNmsWFCxfwer0yUBJCxLyxssmFS7IpRiQkJOB0OqmtrWVgYID4+PD/u0Vte3AhxPSmaHrtsGKbPnvszETTaY8kIYSQbJoeJvMUacR5TDmLEEIIIYQQQkwjMlASQgghhBBCiGvIQEkIIcLQ0tJCdnY2Fy5cmOpbscyFCxdQFAVFUVi9evVU344QQogJSDaZSwZKQoiY9b2XzvKv+86N+rl/3XeO77101rJrP/roo9xxxx0UFhYGj128eJE77riDxMREsrKy+PSnP83
AwMC45+nv7+dv//ZvycrKIjExkTvvvJO6ujrD93PixAluvvlmEhISmDNnDo888si4ewEBFBYWBsMm8Ovv//7vg58vKCigoaGBL3zhC4bvRwghZirJpiGxnk3S9U4IEbPsNoXvDgbOp7cvDh7/133n+O5LZ/n8LUssuW5vby8/+9nPeP7554PH/H4/t912G7NmzeKtt96ipaWF+++/H03TeOyxx8Y812c/+1n++Mc/8pvf/IbMzEy+8IUvcPvtt3P06NGQu8h1dnZyyy23sG3bNsrKyjh79iwPPPAAiYmJEwbJI488woMPPhj8ePh+SHa7nZycHNkjSQghDJBs0k2HbJKBkhAiamiaRq/XT5ziC+n1H79xPl6/yndfOovXr/LXWxfyo9fO89gr1fztexbx8Rvn4xkI7VwJg3tlhOKFF17A4XCwadOm4LG9e/dSVVXFpUuXyMvLA+Cf//mfeeCBB/jGN75BSsr1e0N1dHTws5/9jCeeeIIdO3YA8Itf/IKCggJefvllbr311pDu55e//CV9fX08/vjjuFwuiouLOXv2LN/97nf5/Oc/P+7fKzk5mZycnJCuI4QQM5GmaXi8fohwNhnJJZBssoIMlIQQUaPPq3LTV8rCeu9jr1Tz2CvVY348kapHbsUdF9q3xDfeeIN169aNOHbw4EGKi4uDQQRw66230t/fz9GjR9m2bdt15zl69Cher5edO3cGj+Xl5VFcXMyBAwdCDqODBw9y880343K5Rlz74Ycf5sKFC8yfP3/M937rW9/i61//OgUFBdxzzz383d/93aR3MhdCiOlEz6Y3wnrvZLLJSC6BZJMVZKAkhBAGXbhwYUToADQ2NjJ79uwRx9LT04mLi6OxsXHU8zQ2NhIXF0d6evqI47Nnzx7zPWOdZ3g9euAcgc+NFUaf+cxnWLNmDenp6Rw+fJiHH36Ympoa/uM//iPkawshhIgOkk3mk4GSECJqxDttHPzaRlKVVEPvC5Q0OO0KXr/G375nEX+9daGhcyQ4Q6u5Br0OfLSdvkcrI9A0zfCmrOG859rXBxbLjneez33uc8E/r1q1ivT0dO6++26+9a1vkZmZaej6QggxXcU7bRz52k24lQRD75tsNhnJJZBssoIMlIQQUUNRFBLi7LiV0L81/eu+czz2SjWfv2UJn96+OLhY1mm3jVhEa6asrCza2tpGHMvJyaG0tHTEsba2Nrxe73WzecPfMzAwQFtb24iZu6amJjZv3hzy/eTk5Fw3y9fU1AQw5rVHs3HjRgCqq6tloCSEEIMURcEt2TQjs0nagwshYtbwDkKB4Pn09sV8/pYlfHec9qyTVVJSQlVV1YhjmzZtorKykoaGhuCxvXv34nK5WLt27ajnWbt2LU6nk5deeil4rKGhgcrKSkNhtGnTJt54440R7V737t1LXl7edWUP4ykvLwcgNzc35PcIIYQYSbJp6Nqxnk0yUBJCxCy/qo0IooBAIPnV8fdqCNett97KyZMnR8zc7dy5k6KiIu677z7Ky8vZt28fDz30EA8++GCwq1B9fT3Lli3j8OHDAKSmpvKxj32ML3zhC+zbt4/y8nI+8pGPsHLlymCnoVDce++9uFwuHnjgASorK/nDH/7AN7/5zRFdhQ4fPsyyZcuor68H9EW23/ve96ioqKCmpoYnn3yST3ziE9x5553MnTvXrH8qIYSYcSSbdNMhm6T0TggRsz43zl4UVpU2AKxcuZJ169YFv4GDvq/Dc889xyc/+Um2bNlCQkIC9957L9/5zneC7/N6vZw5cwaPxxM89r3vfQ+Hw8EHP/hBent72b59O48//viIfSq2bt1KYWEhjz/++Kj3k5qayksvvcSnPvUp1q1bR3p6Op///Of5/Oc/H3yNx+PhzJkzeL1eAFwuF7/97W/52te+Rn9/P/PmzePBBx/ki1/8opn/VEIIMeNINummQzbJQEkIIcLw5S9/OTgrZ7PpD+fnzp3Ls88+O+Z7CgsLr9uRPD4
+nscee2zcjf8uXLjAAw88MO79rFy5kjfeGLt97datW0dce82aNRw6dGjccwohhIgtkk3mkoGSEEKEYffu3Zw7d476+noKCgosu87p06dJTk7mox/9qGXXGMvFixcpKipiYGCAoqKiiF9fCCGEMZJN5pKBkhBChOkzn/mM5ddYtmwZJ06csPw6o8nLy6OiogJgxIaBQgghopdkk3lkoCSEEGJUDoeDRYsWTfVtCCGEEEGRzCbpeieEEEIIIYQQ15CBkhBCCCGEEEJcQwZKQgghhBBCCHENGSgJIYQQQgghxDVkoCSEEEIIIYQQ15CBkhBCCCGEEEJcQwZKQggRhpaWFrKzs7lw4cJU34plLly4gKIoKIrC6tWrp/p2hBBCTECyyVwyUBJCxK5XH4XXvz36517/tv55izz66KPccccdFBYWBo9dvHiRO+64g8TERLKysvj0pz/NwMDAuOfZunVr8Bt+4Nef/umfGrqXvr4+HnjgAVauXInD4eCuu+4K6X1tbW3cd999pKamkpqayn333Ud7e3vw8wUFBTQ0NPCFL3zB0P0IIcSMJtkETI9skg1nhRCxy2aHV7+h//nmLw4df/3b+vFt/2DJZXt7e/nZz37G888/Hzzm9/u57bbbmDVrFm+99RYtLS3cf//9aJrGY489Nu75HnzwQR555JHgxwkJCYbux+/3k5CQwKc//WmefvrpkN937733UldXx549ewD4y7/8S+677z7++Mc/AmC328nJySEpKcnQ/QghxIwm2RS8dqxnkwyUhBDRQ9PA6wHFGdrrN30K/AN68PgH4N2fg7e+B2/8P7jp7/TPD/SEdi6nGxQlpJe+8MILOBwONm3aFDy2d+9eqqqquHTpEnl5eQD88z//Mw888ADf+MY3SElJGfN8brebnJyc0O5zFImJifzoRz8CYP/+/SNm3sZy6tQp9uzZw6FDh9iwYQMAP/3pT9m0aRNnzpxh6dKlYd+PEEJMK8Fs0kJ7vVnZZCCXQLLJCjJQEkJED28vaY+uCu+9b/w//ddYH0/k/16GuMTQLvXGG6xbt27EsYMHD1JcXBwMIoBbb72V/v5+jh49yrZt28Y83y9/+Ut+8YtfMHv2bN773vfyla98heTk5NDvPQwHDx4kNTU1GEQAGzduJDU1lQMHDshASQghAry9uKcimwzkEkg2WUEGSkIIYdCFCxdGhA5AY2Mjs2fPHnEsPT2duLg4GhsbxzzXhz/8YebPn09OTg6VlZU8/PDDvP3227z00kuW3Pvw+83Ozr7ueHZ29rj3K4QQIjpJNplPBkpCiOjhTKD94VOkKanG3hcoabDH6WUON/2dXupg6NrukF/a29tLfHz8dceVUUokNE0b9XjAgw8+GPxzcXExixcvZt26dRw7dow1a9aEfE/hCOd+hRBixnEm4Hn4PG7F2BqdSWeTgVwCySYryEBJCBE9FAXi3KCEXmrA69/Wg2jbP+iLZgOLZe1xIxfRmigrK4u2trYRx3JycigtLR1xrK2tDa/Xe91s3njWrFmD0+nk3LlzloZRTk4OV65cue741atXDd2vEEJMe8FsMjBwkWwKS7Rlk7QHF0LEruEdhALBc/MX9Y9f/cbY7VknqaSkhKqqqhHHNm3aRGVlJQ0NDcFje/fuxeVysXbt2pDPffLkSbxeL7m5uabd72g2bdpER0cHhw8fDh4rLS2lo6ODzZs3W3ptIYSY1iSbwhZt2SQDJSFE7FL9I4MoIBBIqt+Sy956662cPHlyxMzdzp07KSoq4r777qO8vJx9+/bx0EMP8eCDDwa7CtXX17Ns2bJgAJw/f55HHnmEI0eOcOHCBZ5//nnuueceSkpK2LJli6F7qqqqoqKigtbWVjo6OqioqKCioiL4+cOHD7Ns2TLq6+sBWL58Obt27eLBBx/k0KFDHDp0iAcffJDbb79dGjkIIcRkSDYFxXo2SemdECJ2bXt47M9ZVNoAsHLlStatW8eTTz7JJz7xCUDf1+G
5557jk5/8JFu2bCEhIYF7772X73znO8H3eb1ezpw5g8fjASAuLo59+/bx/e9/n+7ubgoKCrjtttv4yle+gt1uD75v69atFBYW8vjjj495T7t376a2tjb4cUlJCaDXdQN4PB7OnDmD1+sNvuaXv/wln/70p9m5cycAd955J//2b/82yX8dIYSY4SSbgmI9m2SgJIQQYfjyl78cnJWz2fSH83PnzuXZZ58d8z2FhYXBcAB9d/HXX399wmtduHCBBx54YMLXjGfr1q0jrg2QkZHBL37xiwmvL4QQIjZINplLBkpCCBGG3bt3c+7cOerr6ykoKLDsOqdPnyY5OZmPfvSjll1jLBcvXqSoqIiBgQGKiooifn0hhBDGSDaZSwZKQggRps985jOWX2PZsmWcOHHC8uuMJi8vL1hL7nK5puQehBBCGCPZZB4ZKAkhhBiVw+Fg0aJFU30bQgghRFAks0m63gkhhBBCCCHENWSgJIQQQgghhBDXkIGSEEIIIYQQQlxDBkpCCCGEEEIIcQ0ZKAkhhBBCCCHENWSgJIQQQgghhBDXkIGSEEKEoaWlhezs7Al3HY9lFy5cQFEUFEVh9erVU307QgghJiDZZC4ZKAkhYtYPK37Ij9/+8aif+/HbP+aHFT+07NqPPvood9xxB4WFhcFjn/nMZ1i7di0ulyvkb979/f387d/+LVlZWSQmJnLnnXdSV1dn6F76+vp44IEHWLlyJQ6Hg7vuuiuk9xUWFgbDJvDr7//+74OfLygooKGhgS984QuG7kcIIWYyySbddMgmGSgJIWKWTbHxg4ofXBdIP377x/yg4gfYFGu+xfX29vKzn/2Mj3/84yOOa5rGX/zFX/ChD30o5HN99rOf5Q9/+AO/+c1veOutt+ju7ub222/H7/eHfA6/309CQgKf/vSn2bFjR8jvA3jkkUdoaGgI/vrSl74U/JzdbicnJ4ekpCRD5xRCiJlMskk3HbLJYfkVhBAiRJqm0evrJU6JC+n1Hy36KF6/lx9U/ACv38vHVn6Mn534GT858RP+cuVf8tGij+LxekI6V4IjAUVRQnrtCy+8gMPhYNOmTSOO/+u//isAV69e5fjx4xOep6Ojg5/97Gc88cQTwRD5xS9+QUFBAS+//DK33nprSPeTmJjIj370IwD2799Pe3t7SO8DSE5OJicnJ+TXCyHETBPIJkKLCNOyyUgugWSTFWSgJISIGn2+Pm779W1hvfcnJ37CT078ZMyPJ1J6bylupzuk177xxhusW7fO8D1e6+jRo3i9Xnbu3Bk8lpeXR3FxMQcOHAg5jCbjW9/6Fl//+tcpKCjgnnvu4e/+7u+IiwttoCqEEDPBVGWTkVwCySYryEBJCCEMunDhAnl5eZM+T2NjI3FxcaSnp484Pnv2bBobGyd9/ol85jOfYc2aNaSnp3P48GEefvhhampq+I//+A/Lry2EEMJckk3mk4GSECJqxDvi2ftne0lVUg29L1DS4LQ58ape/nLlX/KxlR8zdI4ER0LIr+3t7SU+Pt7Q+Y3QNM1QuUW4Pve5zwX/vGrVKtLT07n77rv51re+RWZmpuXXF0KIWBDviOe1P3uNBCX0nIDJZ5ORXALJJivIQEkIETUURSHBmYBbCb3U4Mdv/5ifnPgJn1r9Kf7qhr8KLpZ12p381Q1/Zcl9ZmVl0dbWNunz5OTkMDAwQFtb24iZu6amJjZv3jzp8xu1ceNGAKqrq2WgJIQQgySbdDMxm6TrnRAiZgWCJxBEAH91w1/xqdWfGrXjkFlKSkqoqqqa9HnWrl2L0+nkpZdeCh5raGigsrJySsKovLwcgNzc3IhfWwghpgvJJnNNZTbJQEkIEbNUTR0RRAGBQFI11ZLr3nrrrZw8efK6mbvq6moqKipobGykt7eXiooKKioqGBgYAKC+vp5ly5Zx+PBhAFJTU/nYxz7GF77wBfbt20d5eTkf+chHWLlypeFWqlVVVVRUVNDa2kpHR0fw2gGHDx9m2bJ
l1NfXA3Dw4EG+973vUVFRQU1NDU8++SSf+MQnuPPOO5k7d+4k/nWEEGJmk2waEuvZJKV3QoiY9cnVnxzzc1aVNgCsXLmSdevWBb+BB3z84x/n9ddfD35cUlICQE1NDYWFhXi9Xs6cOYPHM9QW9nvf+x4Oh4MPfvCD9Pb2sn37dh5//HHsdnvwNVu3bqWwsJDHH398zHvavXs3tbW1111b0zQAPB4PZ86cwev1AuByufjtb3/L1772Nfr7+5k3bx4PPvggX/ziFyfxLyOEEEKyaUisZ5MMlMS0sqf8MjZFYefqocezJy91UDw3jUNnm1E1jV0lk+8IM52tfX0vms1GrzsRALvPy9rX93JqzUaWVRxGUVWO3ryT0uOl2BQb61euD7737dNvs654HVXVVaiayoZVG6bqr2G5L3/5yzz00EM8+OCD2Gz6w/nXXntt3PcUFhYGwyEgPj6exx57jMcee2zM9124cIEHHnhg3HNfuHBh3M9v3bp1xLXXrFnDoUOHxn2PEMIco2XTGyeb2L4qR7IpBIFcOnbj0NOMeeeqqF1SNCKXgGA2FeQWAKCqKqXHSyleXCzZNAbJprHJQElMKzZFYU95w4hjp+o6ebGigYNnmtlVImsvJqLZbKx/fS8XFi8HwO7zse7Nl0no6WbFsUOUDYaRTbFRerx0xHtPnD2BpmpUVldO6yACfZbs3Llz1NfXU1BQYNl1Tp8+TXJyMh/96Ectu8ZYLl68SFFREQMDAxQVFUX8+kJMF6Nl05unruJTNcmmEARyabh51adZ8+bLI3IJhrKpy9Olv1fTKDtRRm9vr2STiWZKNslASUwrgdm6PeUNZKe6gscDQTR8Nk+MLjBjd20oBcIo+PnBJ0mlx0ux24YexQeCaPiTpunqM5/5jOXXWLZsGSdOnLD8OqPJy8sL1pK7XK7xXyyEGNPwbLLbhtorSzaFZngutWVmB49fm0swMpuGk2wy10zJJhkoiWln45IsOjxeDp5pDh5bUZBKUX4qdc0eUtxOUtzO696nEbk9AqLd6dXvYs47Z8m7dIE5F84DULOkiIuLlpHVUIcnKQVPcgpFi4ro8fRQWV0ZfO/8OfOZN2ceTa1NJCYkkpiQOFV/DTFJDoeDRYsWTfVtCDEthJtNQnd69btwd3Wy4thQWdZouQRQtKiIptYmaupq8PTp624km6aPSGaTDJRETHHYJh7EHDhzdUQQgb5O6eSlDgB2rs4Zsxa816fidtpH/dxMsvzYIfIuXQAg8C8+/2wV88/qbUeP3LiDozfvpPJc5YhBEkBNfQ019TWAPrM33cschBDCYZu4iXC42eTx+sy5yRi3/NihEYMkGD2XACrPVVJTVzPitZJNIhwyUBIxJS6EMNq8dBZdvb7rZu1uHSxtGG/GrqPfKwMl4NSajeRdqCbv0gU09MFSzZKiYHmDJ0mftSteXBys+w6YP2c+61fppQ3jzdhpir5489oFpCK2yH8/ISDOPvEkXrjZ1DXgx6dqIU0UTmen1mwMrpUNGC2XQM+m5rbmEYMlyaaZxaz/frKPkogpcY6J/5c9dLaZg2eaWV2YFjx28lIHVXUd5Ge5JxwoCVhWcTj4RKm+cCGgz9zNrT5Nc25+sLyhqrqKyurKEWuUauprqK2vJTsje9ww8jq8qKgMeAas+4sIywX24RjeMlaImcZlDz2b8jMSgsdCzaZOySaWVRxmxbFDI9YojZZLoGdTYJDkjncDkk0zTaDVudM5uXJWeaIkYopDUVDQ1xONZm9FA3vKG9hVksvy/BQqLrQDsGlpVrDj0HiLZtv7pMRhzZsvB7veFZ47FTx+cs3GYIOHYzfuoOxEGaXHS9mwagPlp8rxq34AihcVBxfRjrdoVrWrNKU24WjSvw3FueNQFAUNjT6lz6q/njCRqqpcvXoVt9uNwyFxImauuAkGSsOzyaYo1LX2AqFnU0e/j4yEOPNuOMYEcqns5p1kNV4mvaUJuD6XgGA2FS0qoqq6Kni
OyWZTP/3YFHm+EO00TcPj8dDU1ERaWtqkJ/Ek2URMURSFOLuNfv/ou1rre1HoHYR6hg16thXPJtXtRJ3gUaw8UQJFVSm7eSe97kQKz53C73Bw5MYdnFqzEU9yCoqq/9sH9qJYv3I95afKAVi5ZCXriteR6E4Maefxhmz9BwRfkw/b4ANuO3bcituiv50wm81mY+7cudIERcxoEw2UhmfTsXdaAUhLdHLr6lzJphAEcunYjTvY+dTPAahdtIxjN+4YkUswlE0FuQVUVVehKArrV66neHHxpLLJhYs4ZeYOVmNNWloaOTk5kz6PDJREzHGNM1AavhDW7bLjctro96r4VTWk9qs9Xj9eVcUZwlqo6SqwGHb50YMA+B3O4LHhLVhHWwh7w7IbSExIDL39qgINsxu4knUFp8+JoilkK9lss2+b5N9CREpcXFxwU0MhZqqJBkrDsykjabCdsaavSwolm9r7ZvZA6eiwfZICahcX4UlOGZFLMJRNjc2NgD6ZEzg2mWxaaVvJfNv8SfwtRKQ4nU7TysFloCRizkSBFKAoCpnJLi639tLSNcDstISJ3wR09vvInMElDlNBtav02/sB8Ck+4u3xU3xHQggRulDWKAVkJuv50uHx4vOrOEJ4b2e/T7avmALDs0mxKcTbJJtmGpkGFDEn1IESQEaSHkgtXf0hv2emz9wJIYQwxqYoOEIcxCTFO4hz2NCA1u7QGgb4NI0er38SdyiECIcMlETMMTJQykzWSxxCDSPQF80KIYQQRoTSlRX0aofAJJ6xbJJJPCEiTQZKIuaEsl9FQDCMDDxRkjASQghhVCj7/AUEJvGMVDvIJJ4QkScDJRFzjNWCD4aRgVm7zn6vbDQnhBDCkHDKwo1M4klZuBCRJwMlEXOMld4NhVGogx+/Bt1SCy6EEMIAl4Fqh6EnSlIWLkQ0k4GSiDlGBkrpg21Y+7wqnv7QBz8dMnMnhBDCAENPlAKTeN2hP1Hq9fkZGGNrDCGENWSgJGKOkdK7OIeNlAQnYCyQ2mWdkhBCCAPCaTRk5IkSyBpaISJNBkoi5hgJIxiauZMSByGEEFYJZ41S74CfXgN509En2SREJMlAScQcowOl8LoLyaydEEKI0BnJJpfTTlK8AzDWbEiqHYSILBkoiZjjtBnbmTyc/Sr6fCr9PmnoIIQQIjRGysJheLWDTOIJEa1koCRijqIoYdaChx5GIOV3QgghQme42mGw2VCrgbLwrgEfqmxfIUTEyEBJxCQjbViD3YUMLpqVEgchhBChMl4WPvhEyUCjIVWDLpnEEyJiZKAkYpKhJ0qDs3ZtPQOoaugzcfJESQghRKiMNxoy/kQJpPxOiEiSgZKISUYCKdXtxG5T8KsaHZ7QA0b2UhJCCBEqh03ByBLawCSe0bLwdpnEEyJiZKAkYpKRgZLNppCeaLzEoWvAh9/AEyghhBAzm5GGDkObzg4YWnckT5SEiBwZKImYFGcLr7uQkRIHDX2wJIQQQoTCyCReWmIcNgX8qkankWqHfh+aNHQQIiJkoCRiUqhhtKf8MnsrGoKd7y63ethTfplOj5e9FQ3sKb887vtnYkOHta/vZc2bLwc/tvu8rH19L+6uTta8+TJrX98LQOnxUspOlI1479un36ant4eyE2WUHi+N6H0LIcRUM5JN+443kjZY7fDCscvBwdJE2TTgV+nzqZO/2RhybS4BzDtXdV0uwfXZpKoqpcdLJZtEWBxTfQNChCPU8gaborCnvIEleckAXO3s51RdJ129Pg6eaWZXSe6475+JJQ6azcb61/dyYfFyAOw+H+vefJmEnm5WHDtE2c07AbAptusC58TZE2iqRmV1JRtWbYj4vQshxFQKdaAUyKbAPn9l1a3cuDybQ2eb2VPeEFI2JTjtk77fWBHIpeHmVZ9mzZsvj8glGMqmLk+X/l5No+xEGb29vZJNwjAZKImYFGoY7Vyth82e8gYA2nv00rvAICnw+bF09M280rtjN+4AuC6
UAmEU/PzK9YA+e2e3DQV2IIgCnxdCiJki3GwCOHi2OeRsau/3kZMU/n3GmuG51JaZHTx+bS7ByGwaTrJJhENK70RMMlIHvnFJFivnpQLQ0NYHwIqCVIryU6lr9oxbGz7dnyjFaaO3aDq9+l1cLigEYM6F8wDULCni4qJlZDXU4e7qBKBoURHFi4rxq/7ge+fMnsO8OfNoam2ip7fH8D0NaAP4Nf/ELxRCiCgTajZ1erwU5adSkOUOHjt4pplNS7Moyk+dcM1S5wzMptOr38XJNRtJb2kKHhstl0DPpgX5CwDw9HkAmJc3b1LZ1K8Z604opgd5oiSmvQNnrnKitmPEsZOXOjh5ST+2c3UOu0ryRn2vL1a73oW40HdNTwpJfgeHktvpsw3VvC8/doi8SxcACMTV/LNVzD9bBcCRG3dw9OadVJ6rpLK6csQ566/U8+QLTwL6zJ7RModmmnnS/yTrbOtYqCzEpsh8jhBiejlw5ip7KxqvO37wjP5UabxcAvBO82x6b/ssjiZ2UunuQh0MoeXHDrHi2KERrxstlwAqz1XyTt07I15be7mW2su1QHjZ9Lb2Ns3+Ztbb1jNbmW3ovSJ2yUBJxCS/gY4/m5fOorG9j+MX2oPHVhSkcutgaUOK2znme2M0ioDQFvoqKCztS6SwP4HDSe1UJfSAAqfWbCTn4jvk176Dhj5YqllSFCxv8CSlAFC8uDhY960oyohOTE6H/u/q9/ux243V0nfSySvqK5RTzjrbOuYr81EUAxuUCCHEFAh1U/PNS2dRXJDG7w5e5GKzJ3h809IsNi3JGjeXYlto2RSn2djUncbS3kTeSmmjIa6fU2s2BtfKBoyWS3BNNqGgDUvz5MRkUhJT0DTNcK7Ua/XU++uZq8xlvW09WUqWofeL2CNTtSImGdlz4tDZ5uAgKSlenxs4eamDqroO8rPc0zOQNGMdkVyajRu7MnhfazazvE6WVRwmv1afjWvKzQf0mbu51adpzs3Hk6wHUlV1VbDu+55d9wTPlxCfgNfnpexEGb989pdU11aH1c62jTZeUl/iaf/T1Kq10hJXCBHVQp3ES3E7qarruG6QdPBMM1V1HRPmUsx+LzR43xl+J3e0zWJbRwbFx8pYcewQzbOHnrSNlktwTTa9dyibHHYHXT1d7Du0j//d979cbb0a1l/jonaRp/1Ps9e/l1atNaxziNggAyURk0IdKOltVhvYtCQTGCoj27Q0iz3lDeytaBj7zTEtvBDN9rm46+X9rH99L+8sXwWAbXDQdXLNRtYPa9EaaLN67eLY4kXF9Pb1Mj9/Pu4EN53dnex5aw9P732ahqvh/Xu30MIedQ//4/8f6tS62P0hQQgxrRnNpsW5Qx0ZNi3JYldJ7vTOJoOTeKBXPiw58CIlb75I7ebbuTo4eQfX5xKMn00+v4/cWbnYbDbqrtTx2xd+y8sHX6bb0x3WX6dGq+Ep/1Ps8++jQ+uY+A0i5kjpnYhJ/hDLG1RNY1dJLkvykjl4tgW7TWHn6hw2L51FqtsZUqiF83h+yoURRgE2TYO19zAncw6cOo6mKBy5cQen1mzEk5yCournVjV1RBAlJiSyfuV6ihcXk+hORNVUbtl8CxWnKjhWdYzG5kae3vs0i+YuYtPqTaQmpxq+tyaaeE59jlxyWWdfR54ydg2/EEJEWqhLhwLZpAHnGrrJz0wgxe0MdrszUjURW8LMJk2Ftfcwb8X76T3wUwAuz53PsRt3jMglCD2bDlYc5FztOU6/c5rq2mpWL1/NmqI1xDnjDN9etVbNef95lihLWGtbS7KSHN7fU0QdRZvmU7OdnZ2kpqbS0dFBSkrKxG8QMeFCu4djV0KfvXnnSjf/9vxZspJd/N+7Vxi61vuW5MTeQOlqKQy0TO4cF8vhxW8zMGs+//sXn6bVGX6XpW5PN4ePH6bqvL7o1mazsWrpKtatWEe8Kz7s8+Yr+ayzrZOFtVFKvv+OTf5tpqfSy23Ud/WF/PoXjl3
mpbcb2bIsiw9smhvy+2a547ixIDOcW5w6mgaXX5j8eQ7+N1TuoXndbp7d+R76beFPDDY2N7L/2P5gtYM73s27Vr2LooVF2GzhFV3ZsLFMWcYa2xoSlcSw701Yx8j3Xym9EzHJSDMHGJqdC+f7XmzOJJiwa/vg3khxfj8faJ3Npq40nGp4A8YkdxLv2fge/nT3n1KQU4CqqlScquCJZ57g7dNv4/eH1w68Tqvjf/z/wx7/Hpq15rDOIYQQZjH6JCgwVx1zk3FhMSGXAGx6MVTWgI0PNeewzBP+YCQnK4f33/J+3nvje0lNTsXT5+G1w6/xm+d/Q219eOtiVVSqtCp+7f81B/wH6NV6w74/MfWieqDk8/n40pe+xPz580lISGDBggU88sgjqKpJX2wiZhkOo8H/ZWZGGDGp0rugwTBC9WNDYZUnmQ+15LKwzz3++8aRlZ7Fne+5kzu23UFGagb9A/28efRNfvXsr6i+GF7DB4BarZan/U/zkv8l2rS2sO9PiFBINomxhFoWHhB4uc1gNsVkLZAZuQTBSTxUHwmanZu7MrirNZssb3iNmRRFYeHchdx7273cuPZGXHEuWjta+eNrf+SZV56huS28STg/fk5oJ/iV/1eU+kvp00J/0iiiR1SvUfrWt77Fj3/8Y/77v/+bFStWcOTIEf78z/+c1NRUPvOZz0z17Ykp5DcYEsEnSmGMk7RAf+yYYkIg2YcGSgGJqp0dHZks601kf3Ib7Q6f4dMqisK8vHkU5BRw6p1TlL5dSkd3B3ve3EPurFy2rNlCTlZOWLf8jvYO7/jfYbGymLW2taQqxtdBCTERySYxFqPbG00mm2KOaQOl67NpttfF+1pnU5XQTVlSBwM24yNJu93ODctuYOn8pRw5eYTjZ45zqfESv3n+NyxfsJwNN2wgyZ008Ymu4cNHhVZBlb+KlbaVrFRW4lJchs8jpkZUD5QOHjzIn/zJn3DbbbcBUFhYyK9//WuOHDkyxXcmpprRJ0pDYTQT0ghzphuHzdpdK38gnrtbcjju7uJYUic+xfj1bDYbKxatYPG8xZRXlVN+qpyGqw387sXfsXjeYjat3kRKUnhrN85p56j2V7NUWcoa2xpZWCtMJdkkxmK0LDzwcqPVDrH4QMm0uw5kk39kNtlQKO5NZkG/m0NJ7ZxL8Izy5onFu+J595p3s3LxSg5WHKT6YjWn3jnFudpzlBSVULK8JKyGDwMMcFQ9SiWV3GC7gWKlGKcyDbcnmWaiuvTu3e9+N/v27ePs2bMAvP3227z11lvs3r17zPf09/fT2dk54peYfoyWNwTCyBbGtF1MBpIppXdjD5QA7CiUeFL4YHMOhX0JYV8mzhnHhhs28JE7P8KyBcsAOFd7jl/88RfsP7af/oH+sM6roXFaO81v/L/hLf9b9Gg9Yd+jEMNJNomxGJ7EG8wyu+GfxmIwmUwvvRt9batbtfOezkzuaJ1Fui/85wGpyansunEXH9j5AXKycvD5fZSdKOMXf/wFVdVVYZfa9tPPYfUwv/b/muPqcXya8coMETlR/UTp//yf/0NHRwfLli3Dbrfj9/v5xje+wZ/92Z+N+Z5HH32Ur33taxG8SzEVwg2j8B4oxWLtnQmBpIwfRgHJqoNbO7Ko7e1lf3IbXY7wGjMkuZPYsWkHNyy9gf3l+6lrrKP8VDmn3jkVbO1qDwSkASoqJ7WTnPafZoWygtW21SQo4Q/shJBsEmMxXu2g/274iVIMjpOsLL0bTZ43ng+05HDC3cXRxE58YZTjAeTOyuUDOz/A+UvnOVB+gM7uTl4pfYW3z7zNljVbmJsberfC4Xrp5aB6kLd5mzW2NSxTlmFXjGecsFZUP1H67W9/yy9+8Qt+9atfcezYMf77v/+b73znO/z3f//3mO95+OGH6ejoCP66dOlSBO9YREr4a5RibcATJjNSNLBGyR/abNe8gQQ+2JLDmu4UwswjAGZlzOJP3vMn3L71dtJT0unr7+PNI3r
Dh3cuvRN2wwc/fo5rx/mV/1cc9h+WhbUibJJNYixGs0mbUdlkVuldYKA0cTbZUVjtSeFDLTnMn0Tlg6IoLJq7iA/f/mG2rNmCK85FS3sLz7zyDM+88gwt7eFvx+HBw1vqW/zG/xtOq6dRzRpQClNE9ROlv/u7v+Pv//7v+dM//VMAVq5cSW1tLY8++ij333//qO9xuVy4XLJIbroLd9YunDCasTN3Ic7aDefAxvqeVJb0udmf3M4lV3iDEUVRKJxTyNzcuVRVV1F6vJSOrg6ef+N58rLz2LJmC7Mzw9s7yYePcq2ck/6TrLKtYqWykjjFeL25mLkkm8RYVMNd78Jr5hCLsRSp0rvRJKkOdnZkcam3l7eS2+kMoxER6A0fSpaXsHzBcsoqyzhx9gQXGy5y6flLwYYPiQnhtSvvppvX1depoIK1trUsVBZiU6L6ecaMENX/BTwez3UbftntdmnBKiaxV4UVdxONzFyjZLyULtXv5L3tWdzSnkmiP/xSApvNRvGSYu77k/tYu2Itdrudy02XeWrPU+zdv5fO7vDXeQwwwBH1CL/y/4oKtQKvFv6GumJmkWwSYzG+x5/+uzIj2t6Z3x7cqIKBBO5pyWFddwp2Lfx/83hXPDeuvZF7b7+XhQUL0TSNqvNV/OKZX1B2ogyvL/w86aCDV9RX+J3/d7yjhl9FIcwR1U+U7rjjDr7xjW8wd+5cVqxYQXl5Od/97nf5i7/4i6m+NTHFwg2jsJ4oGX5HFDCl693gtwfNr5/P4L+dgsKCfjcFA/EcTezkhLuLMPerJc4Zx6bVmyheXMyhtw9xpuYMZy+c5fzF89yw7AbWrliLKy682fp++ilVSznOcUpsJSxXluNQovpbo5hikk1iLOFO4s2IcZJZP/DbQy+9G40DhbU9qSzu07e5uBhm5QNAWnIa773pvTQ0NfDWsbe40nKF0uOlVJ6rZOMNG1k6f+l1kyqhaqONl9SXyCKLdbZ1zFXmzpy9IKNIVP808Nhjj/HlL3+ZT37ykzQ1NZGXl8cnPvEJ/vEf/3Gqb01MMdmrYhyahqlPlEB/qmQP79uFU7OxsTuNpX3JvJmp0UBD2LeUnJjMLZtv4YZlN7D/2H7qr9RzrOoYVeer2LBqA0WLisJq+AD6wtoD6oHgwtqlylJZWCtGJdkkRqNpmuE1SoEOrrLhrAEhNhqaSIrfwa72LGqTXOxPvEI33WGfKzc7l7tvvZvq2moOVBygq6eLfYf26Q0fSrZQkFsQ9rmbaWaPuodssllvW88cZY4MmCIoqgdKycnJ/Mu//Av/8i//MtW3IqJMuO3Bw/nmEnt5ZPJeFaDP3IU5UApI99m5w3Yr1bzDQfUgvfSGfa7sjGzu2n4XF+ovsL98P+2d7bxe9jrHzxxnc8lmCucUhh0kPfTwpvpmsE58sbJY6sTFCJJNYjThfOcNP5tiL5nMK70zvn52LAoKhQNJzEm5mXK1nLe1t1HDvE9FUVhcuJj5BfM5fuY4RyqP0NzWzP++8r/My5vH5pLNZKZlhn2vTTTxnPocueSy3r6eXCU37HOJ0EX1QEmIsYS94Ww4P+/G2tSd2eUNYEogASian8X2xcxV5nJEPcJJ7SRamIGvKArz8+czN2+o4UNbZxvPvf4cc2bPYcuaLWRnZId9r1108Zr6GuWUs862joXKQpnFE0KMyWguDX+PNHMwwG7OE6UgzYdTcfIu+7tYrC1mv7qfeq0+7NM57A7WFK0JNnyoPFtJ7eVaLjZcpGhhERtWbcCd4A77/A008Iz/GfKVfNbb1pOthJ9zYmIyTSpikuE1SmGWN0AsBpLJ5Q0Qdi34dQYbJrgUF1vsW3i//f1kM7lv8nabnZVLVnLfnfexpmgNdpud+iv1PPnCk7x04CW6eromdf4OOtin7uN3/t9Ro9bIwlohxKj8YXzrDa6fnRl14eacxmZs64oJqUONF9KVdG6z3cZ223bchD+YAUiIT+CmdTfxZ7f/GQsKFqBpGie
rT/LEM09wpPLIpBo+ANRpdfzB/wf2+PfQooXfnlyMT54oiZhkfI2S/vuM2KvCtDpwRR8saX7zZu7UkcGQpWRxl/0uzmhnKFVL6SP8RbWuOBebSzYHGz6cvXCWMzVnqL5Yzeplq1m7Yi1xzvDbgLfSyl51L1lksd62ngKlQJ4wCSGCjE7gwQzbR8n09uDmD5RgcM8kZRFzlbkcVY9yQjsRduUDQHpKOrtv2k39lXr2H9tPU2sTh94+NKLhw2SypFarpdZfywJlAets60hX0sM+l7iePFESMSns0rswvhfF3vMDE+94Ei3CR6VeP4OmKArLbMv4kP1DLFeWT/oSKUkp7Nyyk3t23UPerDz8fj9HTx7liWeeoPJs5aRbODfTzAvqC/yv/3+pV8MvzxBCTC+TKb0z+nNyTD7YnsJ9lMal+Ub9B41T4thk38QH7B8gh5xJX2bO7Dncs+sebtl8C8nuZLo93bx88GWefOFJ6hrrJn3+d7R3eMr/FK/4X6FD65j0+YROBkoiJhmduQvuozQTyhvM3NXbbnaJw9jniVfiucl+E3fZ7yKLrElfanbmbN53y/vYfdNuUpNT6e3r5bWy1/j1c7/mQv2FSZfQXeEKz6rP8kf/H2nUGid9v0KI2BbWQGnw2/WMeKJkdumdWU+UQB8sjSFTyeRO+51stW0lnvhJXUZRFJbOX8qH7/wwm1ZvIs4Zx9W2q/zPvv/h2deepa2jbVLn19A4p53jt/7f8rr/dbq0yZWeCym9EzEq1EDaU34Zm6LgtOtzAo1tvXR6vKS4neytaEDVNHaV5I1/klibuZvsQOno70CxwZr3D83cVT6vf3z6Vf38a+8O894mrsmerczmffb3UaVVUaaWMcBAeNdCD6UFBQuYN2celecqKTtRRltnG8++9iz5OfmkJqWS5E5i/cr1APT09lB5rpLixcVUVVehaiobVm0Y9xqXtcv8r/9/KVAKWG9bzyxlVtj3K4SIXaG2Bg/k0s7VucEJm8qL7Sybk8Khs80h5VKsxRJgXjbNLdE/9nv1Y8u3Tz6bVC/YnGN+WlEUlipLKVQKOawepkqrCu86gxx2B2tXrKVoYRGHTxym8lwlF+ovUHu5llnps8jPyWdzyWYgvFzS0Ditneas/yzLleWU2EpIVBIndc8zlQyUREwKddGsTVHYU97AkrxkABra+uj0eDl0tpk95Q3sKpm4vWbsBdIkw0ixwdGn9D8HBkqnXh76fe09k7i10Bav2hQbxUoxC5QFHFIPcU47F/410Rs+3LD0BpbNX8aRyiO8feZt6hrrqEMvdxjwDrBlzRZ6ensoO1FGb28vldWVE4bRcJe0S1zyX6JQKWSdbR2ZSvhtYIUQsSfUCbxALunv0Y9VXuwgOaGBg2eaQ8qlWEymSQ+UAtnUO1hW5vfBsaf1jyOUTS7FxY32G1mmLeNN/5tc5Wr410Rv+HDz+ptZtWQVByoOUFNXQ1NrE02tTVxtvcptN982qVxSUTmpneS0/zQrlBWstq0mQUmY1D3PNIo2zVs4dXZ2kpqaSkdHBykpKVN9O8IkfzjTEHJM7K1oCIYSwKalWcEw2rl64kDatSAbtzOGNh4d6ICr+yd3jmO/1wMpzg0DnqHja+/RnyyFK2kBpC4z/LbL2mXe8r9FG5MrSwjo7O7kYMVBztUODcDmZM9h4w0befqlpwHYsGpD8ElTOBYqC1lrWzujF9bK99+xyb/N9NPU089bda0hvTaQS+lJcbR1Dz01DzWXkuLs7JwfY22hu6qh8+zkzhHIJgBHPPgGGwBNNpuy3gUuYyXfqqZyWjvNYfUw/fSHf+1h6hrr2F++n6ut+gAszhnHmqI1HHr7EDD5XHLgYKWykhtsN+BSXKbccywy8v1X1iiJmKNpofef6fR4KcpPJT9raAbl4JlmNi3Noig/lU7PxLNIk+l2MzVMWKO0bBss3zFykDRvrV7y0FwDnjAHLCHO2l0rT8njA/YPsNG2MbzrXiMlKYV
b330rd996d3Cvpfqm+uAgaf6c+cybM4+m1iZ6envCusZ57TxP+Z/iVf+r9Grhb64rhIgNRtYobVySxaalWSMGSSsKUinKT6Wu2TNxNsVaLIE5HSiWbYOFW/Q/BwZJU5RNNsVGka2ID9k/xEJlYXjXvUZ+Tj4f3PVBblx7Iw6HgwHvQHCQZEYu+fBRrpXzK/+vOKYeQzVzTfM0JaV3Iub4DPQGP3DmKnsrrl9of/BMMwfPNLNzdc6EteAKMbbI1owAPbVvqNwuoPao/gtgzQfCqwXXwu9SZFfs3KDcwIA2wDHtWNjnGS4nK4d5eXrwDFdTX0NNfQ0A61euN1TqMJyGxlntLC3+Fu6w3zGjZ/CEmO6MNBk6cOYqB880jzh28lIHJy/pZWUTZlOMxZJpTu2D89dUTJiRTZPooJegJPAe23vo8ffQyOQb+yiKQt9AHz7fyAYTZuUSwAADlKlldCvd3Gi7Uba6GIcMlETM8RkIo81LZ1FckMav37pAQ9vQHj2blmaxaUkWKe6xF28GzMhvH8u3D9V9B8xbq4cQgDstvPOO01koVGtta7nsv2xKIAEULymmt0+v/Q7ISs/iPRvfA0BiwuQXwLbQwh7/Hnbbd+NUJv5/TggRe4xM4m1eOouuXt+IwdKKglRuHSy7myibYm4CzyzLt0PnVah+Y+hYFGSTTbHxHvt7eNr/tClleMWLi4NrkgIURWHXu3eRnJRsSi4BnNJOEa/G8y77u0w533QkpXci5hgJoxS3k6q6jusGSQfPNFNV1xHSQGlG5tHpV/VBUmLG0LHao3CxHLLmgzvMdTeTeKIUYFNsbLdvx4U5T2eqqquCC2SXL9D3cWpua6bybCXZGdmmBVIjjbysvozfhH8DIUT0MZJNh87qVQ2JrqH1rycvdVBV10F+ljuEgdIMdfrVkYMkiJpsSlaSudl286TPAyNz6e6d+hMyTdN4pfQVUhJTTMslgHKtnOPqcdPON93IQEnEHCNhFFgwm585tEZp05IsdpXksqe8gb0VDeO8WzfjAimwWHbtPZA8bLHw8h368WO/D//cJu17kaQksdW2ddLnKTtRRunx0uAC2ZVLVgY/V3W+ireOvjXpawx3UbvIa+prk97DSQgRfULNpkAu7SrJxTWsUdCmpVmh59KMCyaGsqnkmqYNUZRN823zKVaKJ3WOa3PJNri9icPhoH+gnydfeBK/WZvtDjqoHuS0etrUc04XMlASMcevhr74UN+PIpecNH2gtDg3iRS3k52rc9lVkhvS4tsZV+KgqUMdhAIb+xWu1z9ee8/kWrya+DSl0FY46UAK7EcR6CKU6E5k7Yq1ZKTqT9LO1JxhwBv+Pk6jqdaqOaAekMGSENNMqAOlQC7tXJ2Lb3DzpU1LMrnVQC7NSMFs+sDQsVW3R102bbBtIJPwt4e4LpcSElm/cj233XQbNpuNzp5O3jzyplm3G/SG+gY1ao3p5411skZJxBwjT5QCi2F//pr+xb+iIC1Y0hBKC1aYgTN3wxfC2ge/Rcxbq5c0TKb9KpiyRmm4jbaNNPobaaZ54heP4trFsIkJiWxavYnixcU8tecpPH0eXj7wMu+96b2mLnat1CpxaS7WKetMO6cQYmr5QvxBfXiTBt/gxN9NK7KDk3ihmJGL74dnk2LTB0bF7426bHIoDnbYd/C0/2l8GD/vaLkUOPbeG9/Lc68/R+W5SjLTMkdUQUyWhsbL6svsZjdzbHNMO2+skydKIuYYGSgF3zO4Q63DbjxcZmAcDQk8UfKbFCImlTcE2BU7O+w7cGJug4TkxGTee9N7sdlsvFP3TrA9q5mOqkepVCsnfqEQIiaEl036exx2Yz+OzehcgqFsMqsEzeRJvDQljRttN5p6ToD5+fPZtHoTAG8ceYNLDZdMPb+Kyovqi1zVJreR7nQiAyURc4x0vQu+J8wwghn4RGm4wBMlswY4mt+cvTSGSVVSLQmk3Fm5bN+4HYCjJ49ypuaM6dfYr+7nnHp
u4hcKIaKeP4KTeDM5lgCwD06OmTaJZ36TnSW2JSxRlph+3jVFa1g6fymaprHnrT20dZqzEXuAFy/P+5+nTTP3vLFKBkoi5kT6idKMjiSznyihYcqGuNdYbFvMUmWp6eddOn8pa4rWAPDKoVdobDanJflwr6qvUqvWmn5eIURkGc0mVdUIvMVhM/hEaQbHEgD2wSYYpk3imftEKeDdtneTRpqp51QUhW0btpGTlUP/QD/PvfYcff19E7/RgD76eM7/HF1al6nnjUUyUBIxJ6yB0uB7HDYpvTMkWN5gfNfyMVkwcwewxbbF9EAC2LR6E/Pz5+NX/Tz/+vN09ZgbHBoaL6kv0aBN3OlKCBG9jGbT8Ncbf6I0o5Np2CSeSdlk0bYNTsXJDvsO7NgnfrEBDruD3TftJtmdTHtXOy++9SKqgUZXoeihh+f9z9Or9Zp63lgjAyURc3xhfDOQ0rsw2c1+ooRlM3dWBZKiKNyy+RYy0zLx9Hl4/vXn8fpMHDgCfvzs8e+hWQuvKYUQYuoZHSh5/UNZFk42zWg2k8vCTV4/O1ymkskm2ybTz+tOcHPb1ttw2B1carzEW8fM3c4CoJ12nvc/z4BmbvfXWCJfmSLmRLIOHOSJEmDuUyCLBkqgB9Jm22bTzxvnjOO2m28jwZXA1barvHzgZdPbew8wwPP+5+nQOkw9rxAiMkLtehfgH5zAUxSwG6x2mNETeGDN+lkLFSlFFCqFpp83Kz2LW7bcAsDxM8epPGd+g6BmmnlRfRGfhdkdzWSgJGJOJDsLwQxtwxpgdhiBZaV3AcuV5SxQFph+3pSkFHbftBubzcb5S+c5fPyw6dfopZdn/c/So/WYfm4hhLUMl94FJvCkJNw4m8nNHCweBCiKwlbbVpJIMv3cCwsWsvGGjQC8UfYGdY11pl/jsnaZl9WXUSezV1WMkoGSiDlhdb1Tww+kGc30Zg5EJJBust1EMsmmnzs3O5dtG7YBUFZZxtkLZ02/RjfdPOd/jj7N3MW5QghrGa128MoEXvhioCPrtVyKi+327ZasL1u7Yi1LCpegaiovvPkC7V3tpl+jVqvldfX1GbdZugyURMyRvSoiyG7yglmwvMQBhgLJZsG3uOULllOyvASAfYf2caX5iunXaKONF/wv4NXMXQslhLCGpmlhNHOYTDfWGc6SSTzrsylHyWG9bb3p51UUhfdsfA+zM2cHO+H1D/Sbfp2z2lkOqgdn1GBJBkoi5kSyPfhMn7QzfcEsWP5EKWC2MtuSQAK9E17hnEL8fj/PvfEc3Z5u06/RRBMvqi/ij0B4CyEmR9X0zQ+MmFRJuOF3TDM2k9uDQ0QGSgCrldXkK/mmn9dhd7D75t0kuZNo62yzpBMewAntBOVauennjVYyUBIxJ6yud4H24NKC1RgrBkoWr1Ea7gblBgqUAtPPa7PZ2LllJxmpGXh6PTz3+nOmd8IDqNfqeUV9ZUbWhQsRS8KZwAs0cwhrjdIMj6ZY6sh6LUVR2GbbRgIJpp87MSGR3TfvxmF3cLHhIvvL95t+DYAytYyT6klLzh1tZKAkYo7ROnBN04Zm7oxu6mfo1dOQ2bufQ8TCCIYCyY3b9HPHOeO4fevtxLviudp6lX0H91lSjvCO9g5vqm/OqFIHIWKN0Y53MNQePLxurDM8nQLZZOokXuSyya24eY/tPZacOzsjmx2bdwDw9um3OVltzYDmLfUtqtVqS84dTWSgJGKO0Zm74QMrp5TeGRPc/dzM9uCRLSVLUBIsC6ThnfCqL1ZTdqLMkuuc1k5zWDW/y54QwhyT2ghdSu+Ms6QsPLLZlG/Lp0QpseTci+YuYsOqDQC8fvh16q/UW3KdV9VXuahetOTc0UIGSiLmGO16F3iaBGCXTf2MsaT0LvJ7McyxzWGNssaSc+dl57H1XVsBOHziMNW11sywVWgVVKgVlpxbCDE5Ed/fb6aPlGKwI+to1tnWMZvZ1py7eB2L5y0OdsLr6DJ/jz4VlZfUl2j
UGk0/d7SQnxpFTJlMZyEIp5nDDE8jmxVd76Zm07q1trXkkGPJuYsWFrF62WoAXj74Mk0tTZZcp1Qt5bR62pJzCyHCN6lurAZLwgXWrFGK4PrZAJtiY7t9Oy5cpp9bURS2b9xOdkY2ff19PPf6cwx4B0y/jg8fL/hfoEVrMf3c0UC+OkVM8YexTCMQRnabgs3gwGeGD5MsWjA7NV3crAwkgM0lm5mXNw+f38dzrz9HT681m8a+ob7BO+o7lpxbCBGeyXRjNVoSDpJNsdyR9VrJSjI322625NwOh94JLzEhkdaOVss64Q0wwPP+5+nQzH9qNdVkoCRiSlgd7ybTWcjwO6YZW2wvmL1WkpLEVttWS84d6ISXnpJOT28Pz73+HD6f+X9XDY196j7qVPN3XxdChGcy3VjDKQmf8dUOZm84C1M2UAKYb5vPCmWFJedOcicFO+HVXq7lQMUBS67jwcPz/ufp0ayZJJwqMlASMcVIHfie8svsrWgIBpjNph/r9HjZW9HAnvLLE59kpmbR0d/Bsd8PhZGvTz/madOPH/1d+Oee4n2BCm2FFCvFlpzbFefi9q23Y7fZaWppYt8hvRNeT28PpcdL6entoexEGaXHSyd1HRWVF9UXadKsKfETQhhjZO1sMJsGJ/GudvTR6dHLm0POppkqkE2BJ0p93dMmmzbaNpJJpiXnnp05m+2btgNQcaqCqvNVAKZnUyedPO9/nn7N/M1up4oMlERMMVLeYFMU9pQ38FbVVf1jm429FY28WNHAnvKGkMrwZmwLVsUGR5+C84MzT94BOPb0YBA9pX8+XFM4axew0baRLLIsOXdqciqLCxcDcK72HEcqjwRDqOy4HkS2yfz7DfLh43n/87RpbZM+lxBicsLJplN1eplSY3vfsAm8ELNphkZTMJuuntc/HugxL5umsNoBwKE42GHfgQOHJedfPG8xc7LnAPBq6atcbrpsSTa10soL/hfwaubvLTgVZKAkYoqRWbudq3PZVZLLgTPNADgG/28/eKaZXSW57FydO+E5ZmwYrXk/rL0Hzr6ufxyYaTv1sn58zfvDP/cUhxGAXbGzw74DJ05Lzr9j0w7m588HoPR4KZcaLwFQWV3JhlUbWL9yvSnX6aef5/zP0aV1mXI+IUR4jAyUAtl09vLQ1+3Bs83sKW8IPZvCustpIJBNjYNNbQLrZ83Ipil+ogSQpqRxo+1Gy85/1467yEjNQNM0nnnlGXo8epmc2dl0hSvsVffij4J/08mSgZKIKb1eY19071qUSXaqvni/w6N/Q11RkEpRfip1zZ5gucNYXDHZTtykjUmXbYO5a/U/97Tqv89bC3NLoLlGL3UIi/kLScORqqSy0bbRsvNvfddWMlP1MoqD5QcBmD9nPvPmzKOptcm0Zg899PCc/zl8UfCkToiZqtcXejZ1erwUZifidtmDxw6eaWbT0iyK8lMnzCWQbCKzUP/zhcH95czIpjA2DbbCEtsS5ivzLTm3oijsvnk38a74YOMhsCab6rQ63lLfMuVcU8ma53tCWKDZ08+xK6F3VPH5Vf79pWqaOkbWyp681MHJS/p5dq7OYVdJ3qjvT3U52DQnPfwbnioDJpVindoHF4+OPFZ7VP8FsOYDsPZu4+eNi55/02SSLTt35blKWjpGtkutqa+hpr4GgPUr1wc3BJysDjrop9+ykg0hxNjOtnRT29Eb8utfOdHIG4Ml4cMdPNPMwTPN4+YSwLzUBJZnWfe9yzJmZlPLhZHHJJtCdqbmDH39fSOOWZVNV7QrppxnKkmqipjQ2NNHaX1byO3B+71+Hn/lHa60D30zUBTQNP2J0q2DpQ0p7tFLr7LdcWzIS8cZi7N2fc3mnGf5dqh6Cfo60Qs9NH3Wbs0H9M+708I7b7w1m+uFw491ZQHFi4vp6Org7IWzwWPz58xn/Sq9tCExIdHU6/mQJ0pCRJKmaVQ1d3OmtTvk91xp76OiRh8wxDkUBnxDobZpaRablmSNmUs
ASzOTKMpMir2ud6oP+k0aKC3YqK9LAn1NkqaalE2zTLk9M1idTXWNdTRcbQgesyqbpkMuxeBPgWKmqe/q5WBd6IOknn4fP36xmjOXu7APtgTfVZLL525fBuhPlKrqOsjPco8aSAXJ8WzOz4jNQZLqg4FWc851Ys/gIAnY9UX999qjcLEcsuaDO5zZN2XGhFFVdVVwkGQb3FCypr6G2vpasjOyZaAkRAzTNI3jVzsNDZIuNffwb8+fobPXR6LLzoBPY9NSvanMpqVZHDzTTFVdx5gDpdXZKazISo69QRIM5pJJpW1HBwdJ8Slw1z/pf55sNsWlgd2aPfbCYXU2BQZJubP0SWOrsmk65FIM/iQoZpKLHR4OX24PubK5vWeAHzx/ltqrPTjtCn5Vu25x7KalWewpb2BvRcN171+cnsi63DTDG9NGjf4WTKkDP/Z7OP6M/ufMeZCQqv95+Q69s9Cx34d33rj0ob2ZooBVYRRos7p62WpA/6EKoHhRMaXHSyk7UWb6Nb1Mjw5DQkQ7TdM4dqWD822ekN9z7nIXP3zhHD39flLcTnr6/ewqyWXTksGB0pIsdpXkjppNNgU25KWzIN3cyZWI6ru+1DAsx34PNYf0Py8ZtknrZLMpPnvy92Yiq7Mp0GzI6myaDrkkpXciar3T3kPFlc6QX3+1o48f762mrXuAVLeTFXNTSUlwBgdJKW4nO1fnsHnpLFLdTtRrOuitnJXM4owkU/8OEddvUtmdpkJ6AbRdgoISvZRhzQf0cjx3eviLXmdIGKmayoZVG1i+cDkVpysAve67eHExie5EVAsWDfs03wxuhSVEZKiaxpGGduq6+iZ+8aDjF9p44vUL+FWNxbnJFGS5iXPY2Lk6l06Pl52rcwbzKTd4jQCnTWHTnAyy3HGm/10iyqyBkuoHRxz4BmDuaskmgwLZlOhOpKauBrvdbmk2+fChaVpsPgUdJAMlEZXOtnZTeTX0lsd1LR5+srea7j4fs1JcfOLWRWQkjXyMnuJ2BhfIDn/CpADrctMoSEkw5d6nlFlhVPJ+OLlH/3PBaj2AAotjJ9N+dYaEUWAh7PDuQYFjZrVfvdZ0KHEQIpr5VY3Sy2009oS+meahs808deAimgYr56Vx382FOIaVdQ/PJRiZTQkOG1vyM0hxRc9T+LD4esAf+tO3cc0tgfLfgzMBZi/RN56dbDbZE8ARXc0xrM6mU++cAsBhd1ieTX78Md1oKHbvXExLmqZxqqWb0y2h131XN3bxny+fp8+rkp+ZwIO3LCI5IbRgcdgUNualk50YPbXJYTMzjK5WQ38PuBIhe5E557S7wRldT+ysrAOPNBkoCWEdn6pysL6Nq56BkN/zyolGnj1yGYANSzK5Z9NcbLbQZtZT4hxszs/A7bRP/OJoZ1aDIYBLFfrv+av0QZIZ4rOjbtNEq7NJGSw/0AzsTRkuHz4ZKAlhBk3TOHG1i+q20Hv4V15s5+ev1eDzayzMSeJj2xcSHxdasLjs+mxdWnyMz9YFmPU0CfRFsQD5N4DNpKBOiJ5udwGWh5ESuTCaDrXgQkSjAb/KgbpWWvtC+xrTNI0/HqnntcomAN6zcja3rc0LufwoKyGOjXPSiYvFhkKj6TcxmwIDpYLV5p0zyiodAMs3ag1mk1l7W43Di5d44i2/jlVkoCSigqZplF/p4IKBvSgOn2vhyf21qBoUz03lvpvn43SEFixJcXa25GeQ6JxGXwJmrU8CuDQ4UJIwmhRl2KIhq+u05YmSEObr9/l5q66Vjv7Qvr78qsZTBy5y+Jy+h9qd6+ewtTj0SaK8pHjW56YFO7bGPE0dbDJkAk87XD2v/9msbFLs4Mow51wmili1g/XjpJjPpmn0U6KIVeEsjn2t8grPlNUDsH5RBh/cMi/kYEmPd7J5TgauEAdVMUHzmxdGPa3QUgso+hMlMyiOqNrML8DyMIrgzzqxHkZCRJterz5I6hoI7WvL61N54vUaKi92oCjwoS3zeNf
izJCvtyDNzQ3ZKTG98P06A216Ppmh7m3996z54e+VdC1Xlj5YijIRq3aIwEgp1rNJBkpiSvlVjcMNbTR0h7Y4VtM0nj92mX3H9d2etxZnc8e6OSEHS06ii3flpeGwTaNBEpgbRpcGwyh7ISSkmHPO+Fn6xoBRJlJ14GD9EyWvJqV3QpilZ8DHW3Wt9HhD+x7RN+DnZ/vOc76xG4dd4b6b57NyXlrI11uRlcySjMTpNUgCc0vCg2V3JeadMworHSByT5SkLHxiMlASU8anqhyqb6MpxMWxqqrxu4MXOXRWf3Jy29o8tq/KCfl681ITKJmdGrt7JI3HisWy07zsDiI3awfWz9zF+qydENGiq9/Hm3Ut9PlCa5Xc1evlpy9VU9fSi8tp42PbF7IoN7QuagqwJieVeanuSdxxFDOrJFz1Q91x/c+STZMWyQF5rG9dIQMlMSW8fpUD9a209IY20+Dzq/zi9Qscr21HUeDuTXODO5qHYllmEsszk6bfbF2AWbN2fh/Un9D/bNqsnTJjw2gEiyfuZKAkxOS193nZX9dKvz+0QVJrdz///mI1Vzv7SYp38Je3LCI/K7RBj11R2DAnjZzE2F3oPi5/H3hD3wtxXFfOwYAHXEkwa6E553SmgT06O95Ot653sUwGSiLi+n0q++taaA9xcWyf189/7XuHcw1d2G0KH7m5kBsKQ1/vsnp2CgvSYnhH84n4+8AX+p5T42o8Dd5eSEiFrEJzzhmXDrbo7Cxo9TdweaIkROxo7R1gf10rXjW0r9XG9l7+/cVqOjxe0hPj+MSti8hODW3Q47Lb2DQnnYyEGN9IdjymVjoEGgzdAGaVzidE5wQeROD7eSCapJnDhGSgJCKq1+fnrUuhL47t7vPx05equdTsweWw8efbF7AkL7R1MzYF3pWbTl7yNJ2tC7Cq7M6sNUVR+jQJQMXcXcjHZXEgxXoduBBT6aqnnwN1bfhDnGGvvdrDT1+qxtPvZ3ZaPJ/YuYi0xNAGPYlOvetqUtw0/xHMkrbg0399ElifTcEnStLMYULT/KtURJMer4+3LoW+OLate4B/33uOpo5+El12HrxlEXNnhfZkyGlT2Dwng0z3NJ6tC5A9KsImT5SEEA3dfZRebiPEB0mcqe/kv155hwGfytxZbh7csYjE+NB+nEpzOdmcn068I/o6rZlK08xbn9TdAq0X9U1h81eZc057PDhCW0cWaZqmRSybpPRuYjJQEhHRNeDjrUst9Ia4OPZKex//vvcc7T1e0txOPnHrYmanhfZkKMGhbySb4orOci9TaZp5T5Q6m6C9Xn+SNGelOee0u8GZZM65LBCpWTuwPpB8WmyHkRBToa6rl7LL7SFPY1TUtPHLNy7gVzWW5CXz5+9ZgMsZ2qAn2x3HhjnpOKdb19XReDtANekpd2ACL3sxxJs0uImfrQ+8olAkKx0iteFsLJOBkrBcR5+Xtwwsjr3U3MNP9p6np99HdqqLT+xcTHpSaE+GUuIcbMnPICHE4Ip53g4wqy10IIxmLwGXSWu6ovhpElg/uIhoZ6EYn7UTItJqOzwcbewI+fUHTl/l6YOX0IDVhWnce1MhDntog565KQmsyZmmXVdHY0lb8NXmnTOKsykSTYaC2RSJNUoxPoknAyVhKaOLY89d7uI/952n36dSkOXmwVsWkhQf2pOhrIQ4Ns5JJy7E4JoWTA2jwcWyc02sAU8IfUf6qRDRmTurnyjJQEmIkJ1v6+HtptA6smmaxr7jV3j+2GUANi/N4v0bC7CFuMn5koxEVmQlT9+uq6Mxq+zO7x3WiXW1OedU7ODKMOdcFohkN1ZZozQxGSgJy1z19HOwrg1fiD8gHr/QxhOv6yUNi3OT+fPtC4gP8cnQnOR41uWkYQ8xuKYNs9Yn+Qbg8kn9z2YtllUcese7KBbRNUoWD5RivbxBiEg509LNyebQOoWqmsYfy+p5/WQTALfckMOuktyQBz2rslNYlD6Nu66ORvXqm6CbofE
0+PrBnQaZheac05WlD5ai1HR7ohTr2SQDJWGJxu4+DhlYHHvobDNPHbiIpsHKeWl85KZCnI7QngwtTHOzKjtlZs3WwWAYtZtzroYqfeYuMRPS8805Z/ws8zrnWWQ6zdzF+qydEFbTNI2TzV2cbe0J6fV+VeO3b9Vy5HwrAH/yrnxuXhFayZZNgXU5aeSnJIR9vzHLrKdJABcr9N/zV5u3piiKy+4gQgMl6XoXMhkoCdPVd/Vy2MDi2FdONPLsEb2kYcOSTO7ZNDfkkoYVWcksyUiceYMkMDmMAntUrJ4xYQQR3v1cNpwVYspomsbxpk7Ot3tCev2AT+WJ12o4eakDmwJ/+u55rFuUGdJ7HTaFTXPSmeWOzs1MLWfF/klzV5t3zijPpohM4Mk+SiGTgZIwlZHFsZqm8eyRel6t1Esa3rNyNretzQtp0KMAa3NSmZsa2g7o05JZ65M0bWixrGlhpOhPlKJcJAdKVs/c+fGjaiq2KH+KJ0SkaZrGscYOajt7Q3p974Cfn718nneudOOwK9y/bQErClJDem+8w8aWORmkhri2dtrRNPNKwjsaoaNBL5MzqxOrMw3s0T2AjWTpnXS9m5gMlIRpxlscu6f8MjZFYefqXEDfI+ln+85zuVUPriW5ydy+bk5I17ErChvnpDM7Mbq/2Vlqsm3Bj/5OL4tb837ouAxdTYACaflw7PegqbD27vDPH5cOtujfw8qqQCo9XopNsbF+5frgsWMnj1FSVEJVdRWqprJh1QbTr+vDRxzR/+8uRKSomkZZQzv1XX3Xfe7aXAK43Orh31+spqvPh90Gf7VzMQtyQtviIDnOzpb8TNwzpevqaHzd4L/+3zpkw7MpMIGXmK6vU6rcM/lsSojup0lg7UApkE05WTn6tfx+So+XUry42LJskq53QgBnW7qpHGdxrE1R2FPeAMC24tn86s0LwUESEHIQuew2Nuenkx4/w38Y9HWDOokwUmxw9Cn9z47AgFODE8/BqZdh7T2Tu78oL20IsCqQbIqN0uOlgD5zp2kaFacr8Pl8VFZXWjJIAhkoCTGcX9UovdxGY0//qJ8fnks7V+fS0tXPf7x0nq4+/Qe7DYuzQs6mjHgnm/IzcM2krqujmWylw/BsunJW/727WZ/AmyHZ5NesGygFsmnZgmX6tVQ/ZSfK6O3ttSybpPROzGiaplHV0s2Zlu5xXxeYsdtT3kDpuRbaugeCn9tVkjtiRm8siU47W/IzSIqT/20nHUZr3q//fvQpSB4WHIEgCnw+XDEQRqqmWlZ2EHiSVHq8dMSms4EgGv6kyUyxHkhCmMWnqhysb+OqZ2DM1wzPpe4+L8cvdNDZq5cJlcxP4+7Nc0O6Vm6Si3flps+8rqujmeza2eHZNLyM2IxssseDw6QNay1k5ROl4dk0nJXZFOu5NMOnPsRknWvtmXCQFLBxSRaF2YkjBkkrClIpyk+lrtlDp2fsOlaX3cbNczNlkBQw0Dr5cyzbBst3DJbdDZq3Vt9HqbkGPGG2d7W5wBH97XCt3kOpaFERxYuKRwzG5s+Zz7w582hqbaKnN7TOW0YMMPYPhULMJBMNkgJ2rs5la3E2b51qDg6SABbnpVDX7Jkwm2YnutiQJ4MkYHB9kknZNG+tXmYXYEY2uTLNa1ZkoUhkU2F+IQCd3fpyCSuzKdZzSX7qFJNiZD7+wJmrXGga+QV48lIHJy/pzR92rs5hV0neqO/t96szs7PdmEyY4zi1T5+lG672qP4LYM0HwqsFV73o/2dE938vh+LAidOyhaaV5yqprK4ccaymvoaa+hpAn9kzu8yhWWsmS8ky9ZxCTHdxo2xF8eT+i8E/j5dNA34Vm2STTlH0p0DaJH/QP7VvKIcCzMgmf2z8wB6vxFt6/spzlVyouzDimJXZ1Ecf3Vo3SUpoZazRRgZKYlIyE0Lv7LN56Szau70crm4JHltRkMqtg+UPKe7xz9XY3ce8mdzlbji7Cd9Il2+H3o6Rg6V5a/U
QAn2Dv7Co4OsBZ/SXOCSSSDvtlpy7eHFxsO47YP6c+axfpZc2JCaY/9TtinaFZSwz/bxCxJqM+LiQniiB3gr8Wh/cMpf8DD1vxsumtj4vvV4/CTO5gcNwdhf4JllqtXw79LTCmVeHjpmRTd7Rm01Fm0SsrcgoXlyMp9fDyeqTwWORyKZYHShJ6Z2YlLR4Z8jPDQ6dbeZwdQvpSUOLzU9e6qCqroP8LPeEA6XL3ZNoXjDdmNHe9PSr+iBp+G7ntUf1PZWy5oM7Pfxze0Pb9X6quRXrBt5V1VVUVlcyJ3uom2NNfQ219bVkZ2RbEkaNWqPp5xQiFmWEOIm3t6KB1yqb2LEqZ0T53KVmD/lZ7pCyqUGyaYjNhEm806/qgyTnsM16zcgmtT8mniq5sXZCuKq6ipPVJ0l0D2WQZNPYZKAkJsVhs5HqmvjB5N6KBvaUN7CrJJeNS4Y27du0NIs95Q3srWiY8BxNPf341AjsjhYLJjtQOvZ7fbHs2ntg/rBH7Mt36MeP/X5y54+RgZJVM3dlJ8ooPV7KhlUbWLF4RfB48aJiSo+XUnaizJLrttNOnyY/tAmREUJn1OG5tHttHoXZQ98PDp5pDimXQCbxRjAzm7LmDx03K5t80Z9NdsVOAgkTvzAMw7Npbu5QsxKrs+mKdsWS80aCDJTEpGUkTBxIqqYFu9styUsB9N3Lb1mVw66SXFRt4gGQX9MHSwK9YcJkaOpQB6GU2fqxxAz947X3TL7GfIaXOAT2oli/cj0ZqRkA2Gw21q1cx4ZVG1An++87jiataeIXCTHNuRw2kiYohxueS6Dv5wcwO9XF1uLskHIJ4KpnAK/f2gX4MWOyA6XRsilnuYnZFP0DJYhsNqWnpLN+1XpLs6mFlpjdT0nWKIlJy4h38s4Erxm+EDY/0018nJ2+AT+dvd6QWoMHNHT3kZds7ULHmDDZNUrDF8Km6hvPofr1kobJtgaHmJi1A0hUEo11JAnR8IWw6SnpKIqCquoBZFVr8IAr2hXmElpbYyGms4yEOLq9vWN+/toGDYvzUnihvIGuPh+3r52DLcROdhrQ2NNPQYo1TwFiipnZFBgoJWWal02xMomnJNKsTbLV+iiGZ1NgoKQoCokJiZZmk4rKVa6SS+g/70ULeaIkJi2UJ0rD2W0KiwY38TvbYOwH6oaevpBn+aY1M9YoBQTCqLcDBsb+ocIQf99g97voZvWiWQC73U5qcioArR0mtM6dQCOxWwsuhJky4kNvNgRQkOUm3mnD0++nvtXY90JZpzRostUOw6UMTuJ1mli2NcOfKA0XGCi1d7XjV63buykgVsvvZKAkJi3RaSfO4G7kgfK7s/XGZncG/BqtvdG/GNNyihPTvnzj3BA/2KGuy8SyrRgIpEQlMvs9BQKprSPM/T8MaNKaLC3tEyJWhDWJN1h+d/aysWxq7OnHL2tozenIGpAyuHG5mQMlX7e+31OUi0Q2JbmTcDqcqKpKR1eH5deL1YYOMlASk6YoiuGZuyV5ehjVNPWM2pp1PJe7ZZ0SimLNU6VOE7+RxUCJQyRm7WBooNTS0TLBKyfPh49WrH9yJUS0S3E5sBvc42hxcKBkbKLHp2pc7ZVssiSX+jphwGPOOTU/+E06l4UikU2KogSzKRLVDle0K2gxMEi9lgyUhCmMztzNSnGRlujEr2rUXOk29N7L3X0x+cVmOlNn7gYDqWNmlTgkkIASgY1xI/lECWJ35k4IM9kUhXSDk3hL5+jVDjVN3YYn8Rq6ZKBkauldnBsS9P8e5pbfySReQCQHSn300Un0/9tfSwZKwhRGnygpijJUfmewxMHj9dPZH5vdU0xlRS14l5klDtE/ULIpNsv3rICRYRSJQX6s1oILYbZQ91MKmJXiIs3txOfXuNAkk3iG2RygmNgnLDlQ7TCzJvEiVRaenqrvSdXaHpkqhFicxJOBkjBFusEwgvBLHED2rQCsKXHoMLP0ris2asEjMHOXlpKGoij0D/Tj6bO
+7EMGSkLoQtlPaThFUVicF1429ftV2vqiv4mN5UzNpkBDB5OzKcpFYgIPIDNV39cyEk+UIDazSQZKwhTOEDeeHS6wTqm+tZfuPmNPiGSghDUDJTObOWh+8JvURc9CbsX6QHLYHaQmDXa+i8DMXRdd9Gg9ll9HiGhn9IkSDGs2JJN44TG12iHQ0GFmNRqKIw5HBHbwCTxRks53Y5OBkjCN0Zm75AQnuen6vhPnDJbfdfT78HhnePmdzYI1St0t4DOxq2AMBNJ0rAWH2AwkIcwW77DjnmDj2WsFqh3qWzz0yCSecWaun0214ImS3wNqdP/8oChKRLIpOTE52Pmus8v69UOttNKvxdZaPhkoCdOEN3M3WOJgcD8lgIaZ3v3OzCdK8SngTAA06Lpq3nljYdFshFuEy0BJiMjKNLiGNsXtJCctHg04ZzCbugf8dM30NbRmZpMVa5RAbxMe5SKRTYqiBJ8qRaIrK+hbWMQSGSgJ0xjtfAfDBkqXuwwvgp3xM3dmztopyrAW4TNs0WyEnigFF83KQEmIiAonmwLd76T8Lgxmlt6lDuZST6vJ1Q4xMIkX4WqHSHVljbVskoGSME2S047TZqzV8oLZSdhtCm3dA7R0Gfsm2OwZYMA/gzfWNDOMwJq9lGKg812kwigzbWjRbCQ6Y13lKj5ths9sC0F41Q6B8rtzDcZ/oG6Y6QMlMyfxXMl6m3CQSTyLRLzaARkoiRlKURTDM3cup515s/RvBkbbhGtA40wOJJsTU7+ErXii5OuBCCwQnYxIld5FuvOdikozzZZfR4hol+pyYnAOj4U5SdgUaOkaoMXg/kitfV56fdH9fc9SZpbeDa92MHP7ilgYKE3jsnBVi51JbhkoCVMZ3U8JYGmYrVgBLs/kdUqKYk3nO9NrwaM7kCI1a+ewO0hJ0st5pPxOiMgJZ+NZl9NOYXYSEF42zeinSlZVO5i9IXqUb18R8dK7zjZU1foBjBcvbUSmzM8MMlASpgqnFnzxYCvWcw1dqKqxb1xXevrxG3zPtGLJfhUm/3Ad5TN3TsVJHMb/vw1HpGfuYnFzPyGsYLQrKzBsP6Vwyu9m8CSemaV3YE1ZuOYFNboHs5F6opScmIzD7kBVVTq6OyJyzViaxJOBkjBVOE+UCrLcxDtt9A74qW81VpLk1zSaPDM4kEzdryJQ3nDV3HK5KB8owRTUgkdoF/Qr2pWIrIcSItqF1ZU1uE6pC9Xg11FTTz/embqG1uYAxVhL9nEFB0omd0uL8myKVC4pihLxbIqlSTwZKAlTOe02kuOMbZJmtyksyp1M+V10zwpZysyZu8R0sDv1jWK7TVzbEuWldxD5WvBIdRfqpZcuov/fXwirhVPtMHdWIi6nDU+/n8stxjbP1tArHmYsM7PJiidKEPUDpQQSUDC4uC5M0pV1bDJQEqabTIehcAZKjd39M3fW3NRFszZIDuyCbmYteGfU14K7cUfkOoGBUktHS8T+n42lmTshrJLgsJPgMPaUw25TWJQT2OvPePndjJ7EM7XaYbAsvLvZ3I1io3ygZFNsJJAQkWtlpg51ZY2ETjrp1YxNPkwVY1P/QoQgIz6O2o7QvwD2lF+mt18v9app6qa5s58j51vYvHQWh842o2oau0ryxnx/v1+lpddLljsy60yiis2kWbujv9MHSqk50F4PzTVw5Sws3w6nXwVNhbV3h3du1Qtqv/l16yZKIsnya5QeLwWNYOe7lrYWztedp3hxMVXVVaiayoZVG0y/7hXtCktYYvp5hYg1GQlO6rtCKyveU34Zm6KwJC+Zk5c6OHu5i3ULMzlw5ioDPpU4h23cXAJo7OlH1TRsSmSeCkQVsybxjv5usHFRHPgHoOk81J8wJ5tiYC+lJJLwYF2X1NLjpdgUG1npWYA+UOrp7aHyXCU+nw+Hw2FJLoGeTYVKoSXnNpM8URKmyzT4RMmmKLx56irxThs+v8bp+g72VjTyYkUDe8obQgqZGdthyKwwUmxw9Cn
oHQyOtktw7Gk49nv9uDLJbxVRPnMXidI7m2KjrLKMOKc+oG9sbqTsRBllx8uCYWWFWCpxEMJKmQYaOtgUhT3lDVzt1LPlnSvdtHb1s7eikdcqm0LKJZ+qcdVj4iapscSsiTHFpg+WnIPna64xL5t8PfpAK4q5FWurHWyKjdLjpdRfqQf0znfdPd2UnSij/FS5ZbkEsVPtIE+UhOmS4xw4bAq+ELvR7VydC8Ce8gYALl7VZ08OnmlmV0lu8PPjudzdR/GsZJSZNnNn1kBpzfv1348+pf/ePfj4/dTLsPaeoc+Hy9sF8bMmdw4LRaL0bv3K9cDgkyUIdheqrK5kw6oNwc+brZVWBrQB4pQZ+MRViGGMlIUPzyWX00a/V+Xl4/oPdpuWZoWUS6Bn0+xEk9tlxwKzSu+uzaYeM7NJA183OFMmdYtWsrqhw/Bcsik2VFWl/HQ5AMWLii3LJYidSTx5oiRMpygKKQYbOmxckkVhtv4N4ch5/RvhioJUivJTqWv20Onxjvv+Hq+fPl90zwxZwqzSO4Bl2yC/RP9z4yn993lrYW6JPovnmUQDAnmiBEDRoiKy0vQSh/JTehjNnzOfeXPm0dTaRE9vj+nX1NBo0kzuFiVEDEpxGculnatz2VqcTb9Xz5aqOv2Je0GWm7pmT0jZ1DxjnyiZODhctg3SC/Q/H39W/12yyTTrV66nZHlJcBPY6tpqAGZlzqKptcmybLrKVfxa9G/MLE+UhOk0TaNrwNiCywNnrnKhaeQX4slLHZy8pM+671ydM249eKLTTrxjBo77bcYbZ4zp1D6oKx95rPao/gtgzQfCrwX3W1djbYZItWGtPFdJc/vIjoI19TXU1NcAemBZUQ/eQgv55Jt+XiFiSWe/8UYAcfbrc+XJ/ReDf54om7LC6LY3LdhM/Huf2qeXgwN6P0HMyyafZBOAw3H9cODV0leDf7Yim/z4aaedTDJNPa/ZZKAkTNc54MNrcBPYjUuyeOXEFXx+DQX9W+GKglRuHSxvSHGPPyCYkxw/88ruQF/kaosD1YRZy+XbobsFzr42dGzeWj2EANxp4Z87ysMogQRs2FCx9qlk8eJimtuaqamrCR6bP2c+61fp5Q2JCdaEYrNmYrt3IWJUS6/x75OtPde/54Nb5pKfoZfrTpRN+SnR28TGUmYOlJZv15sL1Z8YOmZWNskkHgA+3/WTCNs2bGNWhl4yb2U2ZSrRPVCagVPwwmotYZQavPx2Iz6/ht2m8Le36R26Tl7qoKqug/ws98RhlByZFppRyaynSqdf1QdJtmEtdGuPwsVyyJoP7vTwz632m7uJrckURYnIOqWq6qoRgyTQnyjV1teSnZEtAyUhLGR0oLS3ooEj1XopeFF+CpuW6mWzl5o95Ge5J8wml90mT5TMcPrVoUFSQpr+u1nZFOWTeFY3cwCCjRsWFizUrxmvX/Nqy1WyM7JnfDbJQEmYLpwwOnBG/2JZNicFh03/33LT0iz2lDewt6Jh3PcnOu2kGqw9n1bMCKRAB6G19wztpQSwfId+/NjvJ3+NKJ+5s3qgVHZC7273rpXvwhU3VL9fvKiY0uOllJ0os+zaHXTg1cZfSyHEdKZpGi29oX8N7B3supqeqH9/XZafyqYl+kDp4JnmCXMJZnClA5g3UApkU/Fu/eO+wc6sZmWTL7r38rH6iVIglzas2sCaFWsAUFW9sqKyutLSXAJo0VosPb8ZZvBPl8IqzQbCCEDVNNISnbT3eFmen0KK28nO1TlsXjqLVLcTdYKNOfNnchiBOYGkqUMdhC6fhI4GKFyvf+xON6eFqs8DzuTJn8ciiUpisPzdCoF9ktavXE/t5VqutFxh4dyFrF+1nkR3YnAhrRU0NFppZTazLbuGENGs2+un3x/615iqaWxflcOrJ/ROd8vzU3DabexcncOAT50wl0AfKM1YNjsodpjsYv1ANt1wJ1Q+r3+88jZYdZs52aT26feoGNuMOFLilDicOPFizUTX8Fz
qH+gHoG+gjzVFa9A0zdJcAn39rKZpUf0znAyUhKk8Xj+9PmPfGG8qyualt/UwWjY4UAosjg2lBeucmVx2B+YMlIYvhE3M0H/PXqQH0WRbgwf4Z/bM3fCFsGnJaVxpucKs9FkkJiRa2oI1oEVrYbYiAyUxMxmtdNhVksfbF9pQNZiV4iIz2RU8HooZXXYXYIub/Pf94dmUkKLv9bdoi7nZ5OsFp/WbjocrkUTaabfk3MNzyRXnIiE+gd6+XhbNXUR2ZvY47zTHAAN00UUK0duiPepL7+rr6/nIRz5CZmYmbreb1atXc/To0am+LTGGcBbLnr3chabB7NR4MpKMtRRNmulld2BuLTgMDZR6JtFydTRRXgseqRbhAGkpaQB0dHVE7JqxUAseSySbYks4a2dPD7YDX5Zv/Ie4GV12F2BmV1YAt0XZFO1l4RFYpxSQlpwGQHtXe8SuGe3ZFNU/Yba1tbFlyxa2bdvGCy+8QHZ2NufPnyctLW2qb02MIZyB0qk6/YfFsMIoJUHCyPQwGlwY62k197zRHkYRaOYQMBVhFAu14LFCsin2GM0mTdM4Xa8PlJbnpxq+3oxuMBRgxSReywXzsynaJ/Ei1PkO9Em8hqsNEc+mBSyI2PWMiuqB0re+9S0KCgr4r//6r+CxwsLCqbshMSGjYaSOCCPjA6X8mVwDHmA3O4wGW3XOtCdKEQyj1BT9B6/2zvaIXbOFFlRNxaZEfSFB1JNsii19Pj/dXmMl4Q1tvXR4vDjtCgtnGyvLirfbyEwweQIrFkm1gykiOlAKTOJFMJuaie4nSlGdmM888wzr1q3jnnvuITs7m5KSEn7605+O+57+/n46OztH/BKR4fWrdBjc0O9yay9dvT7iHDYWGAyj5Dg7KXFRPdaPDNPDaPCJUo8FT5RCWAA9VSJaejcYRr39vcEFtFYLbO4nJk+yKbaEV+mg//dZlJuM0+Bm5lJ2N8jsbHJblU1Rvn52CrJJSu+GRPVA6Z133uFHP/oRixcv5sUXX+Sv/uqv+PSnP83Pf/7zMd/z6KOPkpqaGvxVUFAQwTue2Vr6wq8BX5ybjGOUHdDHMydZyu4A62btPG2gmtjxRlPN2RjXIpGctYtzxuFO0Ev9pPwu9kg2xRYjbcEDApUOy+aEU+kgZXeABdUOgWyS0jurDF8/q0VoYtODh14tegerUT1QUlWVNWvW8M1vfpOSkhI+8YlP8OCDD/KjH/1ozPc8/PDDdHR0BH9dunQpgnc8s7V4jIfRqfrw1ydJ2d0gswdKCamgKPrAps/kZgNRHEhOxUkcketSNSUlDlE+cxcrJJtii9EnSn0DfmqudAPG1yfFO2xkSNmdLlZK76K82iGSzRxSk/T/3/sH+unr74vYdaM5m6J6oJSbm0tRUdGIY8uXL+fixYtjvsflcpGSkjLil4gMo2HU2++jtqkHgOUGZ+2S4xykuCSMAPPDyGYf2v3civK7KDbdGzpEey14rJBsih0+VaW9z9gk3tnLncG24Fkpxjqx5kulw5BYaTSk+aXaYZDD4SDZre93GOk1tNEqqgdKW7Zs4cyZMyOOnT17lnnz5k3RHYmxqJpGq8HSuzOXu1A1yE51kZFsNIzkaVKQYsf0L+WZumh2ClqERzSMtJaIlVNMZ5JNsaOtz2t4H+lTkyi7m9GbzF7LqidK/T3gM3ltZxRP4rlxoxC5wXcgm9q6TM7/ccgTpTB97nOf49ChQ3zzm9+kurqaX/3qV/zkJz/hU5/61FTfmrhGe58X1WAaTab1qoTRMIoSOzN3URxGMEXdhSL4RKmffrrpjtj1pivJptjRbHD/JE3Twt4/KcFhIyNeKh2CzB4oxbnBMTipana1QxRP4tkUGwlEbt3bVJSFR/P62ageKK1fv54//OEP/PrXv6a4uJivf/3r/Mu//Asf/vCHp/rWxDWaw9mjoi68WbsUKbu7nlWLZmfaE6UpWDTb3tke0ac80RxIsUKyKXYYLQlvaOujw+PFYVd
YmJNs6L3SYOgaZg+UFGVY5zuzsyl6mwnA1DV0iJR22vFqxte5R0LU91a+/fbbuf3226f6NsQEjIbR5dZeOnu9xDlsLMwx1hY8P0WeJl3HskWzM2fWDgYXzUZozJKalIqiKHh9Xjx9HhITIhOEzTRTSGFErjWdSTZFP1XTaDXY8e70YIOhRTnJxBlsCy4l4dcwu9IB9GzqbLSg2qHH3POZLKLZlDy4z18Eqx1AX6eUQ05ErxmKqH6iJGKDpmmGB0qBsrtFuUlhtQUX17CsRbjJYaT26wtno1QkZ+3sdjvJiVOwaFaeKIkZorPfh8/g09pApYPRDdATHHbSpexuJMUGisn/JpZN4skTpYBgtUOXVDuADJSECboH/Az4jX0xBTbzWz7H2PqkVJeDZNlk9nqxsrEfRHUgRbKZA8jmfkJYyXBbcK+fmsFOrEbXJ+XLJrOjM/upkpUtwqNYJLMpJTEFm2LD7/fT7YncmtZozSYZKIlJM7o+qXfAz4Um/YvPaBjJ06QxxEoYQVQHUiRn7WBqasG76aZPi9z+GEJMFaPZdO5yF35VIyvZxSyDJd7SYGgMZq+ftazRUJ9UOwyy2WykJOs/m8mG6DJQEiYwOmsX2KMiO9VFprQFN4dVpXfeXhgw+QlQFK9TSiAhom1Yg7XgESy9g+gNJCHMEk5J+Kkwu925nVJ2N6ZY2XQWorvaIdKTeFPQ+a6VVvxROFiVgZKYNMPrk4Ld7oyX3SVJ2d3ozA4jZzw4B5/emT1zF8UDpSlrwxrhRbOy8ayY7jxeP30+NeTXa5oWbORgdH2SlN2NI1YaDUFUVzu4lchthg5Tk01+/LQTueuFSn7qFJPS5/PT4x1/BmBP+WVsisLO1blomkZVnR5Gc2e52VvRgKpp7CrJm/Ba+VJ2NzYzw+jo7/RFuIkZ0F4PLRfh/EFYvh1OvwqaCmvvDv/8URxGoM/cebD+HkuPl+L16h252rva6erpoup8FcWLi6mqrkLVVDas2mDJteWJkpjuQpnAG55NV9r7aO/xoigwKyXeUDZJSfg4zMqmQC4tuVn/2NMOPS16Jvn69f2VJpNLENWTeJF6olR6vBSbYhuxfUVPbw+V5yrx+Xw4HA7Lcgn0bMpUMi07fzjkiZKYlFDCyKYo7ClvYG9FAw1tvXT1+gC9HnxPeQO2EGfipAZ8HGbWgSs2OPoU+Afb6rZfhmNPw7Hf68eVSX7biOIwgsgtmrUpNipOV6AoCqqq0tzWTNmJMsqOlwXDyirRumhWCLM0h9AWfHg2BcruNA1erbwScjYlOu2kuWTOeUxmDZQCuXTmVX0/Jc0PbfV6Nh1/dvK5BOCP3tK7OOJwRODZhk2xUXq8lMbmRkCfxOvp7aHsRBnlp8otzSWIzmwK6V+9s7PT8IlTUow9uhaxqSWEMNq5OheAPeUNvHNlqINK6bkWdpXkBj8/njSXU8ruxmPmE6U179d/P/qU/nvfYKOBUy/D2nuGPh8uf6/+00iUlqpEauZu/cr1gD6DB9Dl6QKgsrqSDas2BD9vhXba8Wk+HEpsf01JNomxhDKJNzybMpKGvocePNMccjbNkbK78ZnVaGh4LjnjwdunZxLA8h2TzyWI6kk8RVFIJJEOrG38c20udXZ3UnmuEoDiRcWW5hLoeylFm5BSMi0tzdA3AkVROHv2LAsWLAj7xkRsCLWr0MYlWXR4vBw8MzRbsKIglaL8VOqaPaS4naS4x/6GKk0cJmB217tl2+BCGbRcgKqX9GPz1sLcEmiuAXfaUPchozQ/qANgN9bII1ISlcSIbexXtKiIk+dP0t3TzRtlbwAwf8585s2ZR1NrE4kJiZZsRKuh0Uor2WSbfu5IkmwSo+n3q3QN+EJ67cYlWbR2DXC4eugHNGPZJGV34zJ7Es/bqz9BAj2jALLm67kEk8umKB4ogZ5NHZr1HVLXr1xP/0A/Facr9OUS1VUAzMqcRVNrk34vFmVTs9aMpmlRNfkQ8nTi7373OzIyMiZ
8naZp7N69e1I3JWKDpml09oe26/mBM1dHDJIATl7q4OQl/Yt+5+qccWvBZyWavCB0ulHs+i+zOsac2qcPkoarPar/AljzgcmvU4rSgZKbyC2arTxXSXfPyH0qauprqKnXQ3/9yvWWrlPKVmJ7oASSTeJ6oeYS6Nk0fJAEoWeT06aQKmV34zO7mYNjlNx486dDf55MNkVx6R1ENpuczusnB14tfTX4Z6uyaYABuukmmWTTzx2ukL7C582bx0033URmZmgLrBYsWDDqP7KYXhRFwe2w0z1BMweAzUtn0dXru+6J0q2DpQ3jzdiBvsN6erwMlsalOMwbKC3fDo1n4fKJoWPz1uohBPqs3WT4+yf3fgu5iNwArnhxMZcaLgXrwUF/orR+lV7eYMWMXUAkZiatJtkkRpPotIf82s1LZ9HWPUBZ9VAXtVCzyatq9PlVEhyhX2/GsZk8kPSNkh03Pqg/VYLJZZPmA9UPtuj87xnJbPL5rn8iu23DNmZlzAKsz6ZkJXoGSiGtyqqpqQk5iAAqKyspKCgI+6ZE7EhxhfZDx6GzzRw800x+5tCMyMlLHVTVdZCf5Z5woGR048AZycxAOv3q0CApebb+e+1RuFiuB1K4pQ0BavT+94xTIjcgr6quCg6SstKyAP2JUm19LdkZ2ZaGUSfG1/dEG8kmMZoEhx2HLbTSnUNnmymrbiUhbuiHYyPZ1OKJ3u9lUcHMdZDHfq+X3c1eon+cPvi13Fyj55Ip2RS9k3hxRCabAo0bZqXrg6LA4Ohqy1WyM7JnXDZJ1zsxKaGUHeytaGBPeQO7SnLZvCwreHzT0qxgx6GJSBiFwKxACnS3W75D/9g7WLe9fId+/NjvJ38NeaJE2Qm9u13RwiIAevv1so/iRcWUHi+l7ESZpdefDk+UhBiNoiikhND8Z3g2LZ0z1OTDSDbJJN4EzJrAC+TS2ntg7hr9WLL+AzynXjYnlyCqJ/FcivXZFMilDas2UJhfCECyW3+6U1ldaXkuQfRlU1j/Bx8+fJjXXnuNpqYmVHXkhm7f/e53TbkxERtCeaKk70WhdxC63Kr/0G23wS035JDqdqJqE6+c7/b66fP5iZcSh7GZFUiaqofR4hv1ABro1Uvulm/XZ+u00DdxHFM0h1GEBkqBfZKWzl9K1fkqevt6WV+8nuIlxSS6E1HN+HceRyedUbdodrIkm0RAqstJa9/4a5WGZ9NrlVeoqGkjO8XFratzQ86mZpnEG59ZE3iBXFrzfji9Tz/m9+nZ5Os3J5dgxk/iBXJp/cr1wW53A74B1q9cj8/nszyXIPqeKBn+P/ib3/wmX/rSl1i6dCmzZ88eEbLTKXBFaEJ5ojR8IezstAScdgWvX6Pf6w+p/WpAc++AdBgaj1mBFFgIOzC4sFX1wQ13giPOnBasENXlDZEaKAUWwvr8ei24qqncsOwG4l3xlrdgBfDho5feiC4QtpJkkxguxWA2FWTpXwcDPpUUtzPkbOoc8DHgV4mzS4HOqBTFnEZDwxs0uJL03339k99k9lpRPIkXidK74Q0aAuV1/QP9lm4ye61OLcYHSt///vf5z//8Tx544AELbkfEmkSnHbui4A9h5g3AblPIz3JTc6WHi1c9zE4LfeDT4pGB0rjMXjTrjB8KuP5ucEzcWSxk/ugNIwcOFBS0CPUId9gduOJc9A/009PbQ7wrcq3wO+mcNgMlySYxXGqI62cD8jPdKAq0e7x0erwTrk0arqV3gNwk2cJiTGY2GoKhgVJ/9/ivC4dM4gUFBko9vT0RvW60VTsYngKx2Wxs2bLFinsRMUhRlJBm7oabm6V/8V1sNrZngdSCT8DszUMVBeIHF2yaHUhRHEaKosyYQIq2WvDJkGwSwxnNJZfTzuxUfbBzsdnY16GU303A7Em84EDJgu+XUTyJF8lGQwCJbj2Xevt6rytltpIPHx6iZ08rwwOlz33uc/zgBz+w4l5EjDI+UNJnsC8ZDKOOfr3EQYzB7IESDAV
Sn8kDpSgOI4hcd6GAQCD1eCI8cxdlJQ6TIdkkhouz20hwGPsRZ+4s/evwkkzimcvsbAoOlLogxGqWkEXxJF6kJ/ASXAkoioKmaXj6IjtwiaZ1Sob/733ooYe47bbbWLhwIUVFRdftSfH735vUeUTEDL3EIfSN2goGnyjVt/bi86s4DNR2S4nDOMyetQPrShw0r774VonOuv6Z8kQpmsJosiSbxLVSXE56R9t3Zwxzs9wcPtfCxavGvg7b+7z4VBWHLTq/n005058oDVY6qH59nZLTxJ8JongSL9K5ZLPZcMe76entoae3hyR3UsSu3al1kquEvobdSoa/qv/2b/+WV199lSVLlpCZmUlqauqIX2LmMbozeWZyHG6XHb+q0dBmbCfsFpm5G5uVT5QsqQWP3v+WkWjDOtyUDZSm0RMlySZxLaPZVDCsLFwz8KRCA1p7x++wN6OZnU0OF9gHJ0JmUFl4pCsdYCibPL0RfqIURdlk+P/en//85zz99NPcdtttVtyPiEEpccYWzSqKQkFWImfqO7l41RMMp1BILfg4LHmiZNEaJdDbsNqj8+lgxEvvpmqNEtNnjZJkk7iW0YYOuenxOOwKvQN+mrv6mZUS+ven5t4BshMjO8ESM6xYP+tKBE+7nk1JWRO+JWRRPFBSFIU44hggcj8HJboToXVmZ5PhJ0oZGRksXLjQinsRMcrlsOEy2Bo1sE7J6KLZtj4vPjUy3chijiVPlPSN5ixZNBvNT5QiXXrnnpqBUj/99GvR+4OBEZJN4lpG18867DbyMvTOqkbXKUm1wzisLAs3e/2s6jVvTyYLzJiy8Ch6omR4oPTVr36Vr3zlK3g80dORQkw9oyUOQw0djP1/pAFtfRJIo4rFJ0pRaqqeKE3F99Xpsk5JsklcKznOgdEGw4GurOEMlELZoHZGsrQsfGZN4k1ZtUOkGw1FUS4Z/r/3X//1Xzl//jyzZ8+msLDwugWzx44dM+3mROxIdTlpMlAWFyi3u9LeR5/XT7zTHvJ7mz0DzHJLicN1rAijeItm7SCqw8iluIjQNkrAsDDq64n4/hEdWgezlFkRu55VJJvEtWyKQnKcg84BX8jvCVY7GGzooGp6xUNmQuTXkUQ9SxsNdZl/bnUgasvCpyybpqDaoU/rI16Z+v8Ohv/vveuuuyy4DRHrjJY4pLidpLmdtHu81LV4WJSTHPJ7pRXrGGKp6x1EdS14pMsb3An6D2eqqtLX30dCfOQ2Vo6mmbvJkGwSo0l1GRsoBSbx6lo8+FUNuy30SYtmz4AMlEajhD4RGjKrqx2MLW+LmJmyfhb0bIonBgdKX/nKV6y4DxHjUgwumgUomJVIe207F68aGyi19npRNQ1blOzaHDVireudlN4F2W12EuIT6O3rpae3J7IDpSiqBZ8MySYxmhSXE7r6Qn79rFQX8U4bfV6VxvZe5mS4Q36vrFMag82CUUe8rJ+NhKlaPwt6NmUr2RG/7rWk6b8wRUqc8R/Sw9141q9ptPdJK9brWDJQsnDWTsJohKmqBe/Qoqe7kBBmM7p+1jbYlRXCW6dkpK34jGFlNllRFh7Fk3hT1cyht68Xv+qP6LWjpdohpIFSRkYGzc3NIZ907ty51NbWhn1TIvbYbQrJccYer88dtmeFUVJ+NwrFBoaXLk/A0gWz0RtGccrU7Vchm86GTrJJTCSsaocw1yl5VY2O/tDL/GaMmCsLj96fLyKdTfGueGyDGylHei+laJnEC+n/3vb2dl544YWQN+1raWnB74/syFNMvRSXk66B0P+75w+GUVv3AN19XpLiQw80KXEYhaLoM3eaiU/bAmHk6wffADhM/CYtO6CPMFUDJQ8evJoXpxKlRfnjkGwSE0lw2HDaFLwGtpUItysr6NmUZiDLZgRL1ijJ+tlIUBSFxPhEujxd9PT2kJwY+jKJyYqWsvCQh/n333+/lfchpoFUl4N6Aw1oEuLsZKe6aOro5+JVD0UFof2wA/qi2Uh3B4s
JNjv4TRwoxbn1J1WaqgeSI8O8c6sDoGn6AC/KTMlAaQprwbvoIgMT/9tGkGSTGI+iKKS4nIYm1+bO0r8WG9p6GfCpxDlCX6XQ3DvAwvTQN1GfEWJu/Wz0TuJFev0sgNvtDg6UIilaqh1C+upXVdXwrwULFlh97yLKpMQZn0UbKr8zXuJgpJPRjGHVDuhgQfmdpm/uF4WmIoymsrtQtJQ4GCXZJEJhdJ1SqttJcoIDVYP6FmNPlQKTeGIYK5o5WLp+Vp4oDTdV62cD1Q5TTZo5CNMYDSMYqgUPp8Sh2cC+TTOGJYE080oc7Iodh/GmoJMyVWEE0TNzJ4QVjG5foShK2BvP9vtVerxS3jmCJXv8Det6Z/bANIqfKLmUmVMWDtGRTZH9SUBMa26nHYei4Avxm9ae8st0evTZgotXPXT0DHDwbDObl87i0NlmVE1jV0nemO9vkRKH65lZC370d3rZXWCg1NkIl0/C8u1w+lW9HG/t3ZO7RjQvmiUOH9Y/tSw9XopNsTEvbx6gh1FPbw+V5yrx+Xw4HA42rNpg6T1ESy24EFZINdDQYU/5ZWyKwtwsNycvdXCxuYdOj5cDZ64Gy/DGyyXQy++SwugEO20pJs7JB3Jp5W79Y78Xuprg3Jv6WlqHy4Rc6o/asvBIVjsEsmn4QGkqsilTybT0GhORJ0rCNHoteOjhYFMUDp1tQQF6+n3UtXjYW9HIixUN7ClvmHCfpGZpxXo9M7sLKTY4+hT0DS4862qGY0/Dsd/rx80IP2nDik2xUXq8lHO15wDw9Hno7umm7EQZ5afKsZn5Q8YYomHWTgirGNm+wqYo7Clv4Gqn/r3pUrOHTo+XvRWNvFbZFNL+fVLtcI1AoyFTzjWYSyee09fkArQ36Nl0/FmTBmUaaNFZ2h/J0rtANjW1NgFDA6WZlk0y5SFMleJy0BriHkc7V+cCsKe8AYDGdn1TwINnmtlVkhv8/Fj6fCoer59EmbkbYmaJw5r3678ffUr/3dur/37qZVh7z9DnJyOKnyhFKpDWr1wP6LN3AJqmcfzMcQCKFxUHP2+lWF2jJEQonHYbbocdj2/ikrhrc+lqZz9vntJ/UNy0NGvCXALpyjoqmwP8Jgw+hueSwwWqH868ph9bvsOcXAJ9Es+KUvZJiuQTpWuzqcfTQ9W5KmBmZZM8URKmMlLiALBxSRazU+MBeO7oZQBWFKRSlJ9K3eBM3nhkP6VrmF0LvmwbpOXrf67co/8+by3MLYHmGvC0Te78UfxEKZL7VaxfuZ6S5SXBj89cOAPArMxZNLU20dTaZGl9eDfd+DVZVyGmLyPVDjtX57L1/2fvz4PkOtPzTvR3cquqrH2vAgr7DgIgFlaDS3NBk42mZcnTYkt956plaaRWz3hCtjxhK+6M584mXTvadxxaRprQ+LrbrVZYdmvci622LLG5gWyuIIiFAAgQIJba933JPc93//gysypRW56sc/JkIt9fBKISWVV5kmBVPvm+3/M+75G2zN8v3JkC9EztwERoQ21ajCcJy5xSNnY38Y79rLbaAfToN/K07NK6ZIc2Fen8rA8fngK+de8+2s3B3QcBmJqd4vqd60DhtKlkT5Tu3r3Ln/7pn3L37l3+j//j/6CtrY2XX36Zbdu28cgjj9j9HIUSotpvbUbmvVvjjM5Gsu77pH+WT/p1F+Hs8Y51/eAzkTg7ck8Vf/ixe7HfzddhZiD1l5TNsfei/gNw8iub84MX8YlSoZPvfL6V/+/OnT+Xud19tNsxP7hCscAC9ZT2L5Nok7AWNQEfLOb+5ne1SPB//25f5vaG2hSNU2VRDx9q7G7i+VY58X/7W0u3H1JtMgyDAAEiRDb+YpuoqqhacV+htKkY5mct/+S+9dZb/K2/9bd46qmn+OlPf8o/+2f/jLa2Nq5evcq3v/1tfvCDHzjxPIUSIWFhqR/AkwdauT04R8/4UrLQI9vq+VLK3lAXXP+EKhe/eHlhc6fp0PPQ/zGM31m6b8c
pLUIAwYbNPX6R+sAB/BTWdpFIrPy3OHP6DK1NrcBS8pBTzKt56o3SLZREm4T1iJumpa+PJVZ+/Vef2k5Xk05qFW2yiN3zLIlVit6nv6FPlWDz2mQW74mgH39BC6XVZsELpU2LLGIqsyDzUGth+cr/w//wP/BP/+k/5dVXXyUQWOq4njlzhvfff9/WJyeUHtGkNTH64PZEpkg6trMB0CdKNwZm6WoJbihGPo+IURZ2i/On55aKpK1H9cfei9B3WQtSsHFzj1/Edq9CFkrp4djmBp3u097cDsD45DhtTW20NbU5Xigt4ED8ewERbRLWI2ZBm165Msyb18doSOnPgS06irp/IkRXS1C0KR/s1KZLP9LBDfWpebGOQ/rjxH2tS7ZokzTxQGvTlU+v4Pfpa+7ZtgconDaZmIQJO/b4uWC5ULp27Ro///M/v+L+1tZWJicnbXlSQuliVYxevjzM9tQupYqU1eGJAy28fHmYV64Mb/gYIkYPYGfXJZ1ut+OU/nsy5ck/9IK+/9KPNn+NIu7aFWqP0oVrFzh/9Tynj51mW8c2ABpqGwC4fuc6F65dKMjzKPVCSbRJWI9ctSmtSy+e6CTg16+nx3Y0ADpoKBddAtGmldikTWldOvWL0LRd39e2V3+8+Zo9ugRF3cRzQ5tqq3WzYGvHVqCw2jTPfEGusxaW/7UbGhoYHh5m165dWfdfvnyZrVu32vbEhNLESqGk9yR1MjEXpW8iRH0wwNnjHTx5oJX6oB8zh+hvn0fySLKxUZyVqcWotjU1k6S05e7Q87pbp6ydHq5+jSLu2hn+zFiWk5jK5PSx03Qf7ebiJ3r2K2km6T7aTSKRwLTj3zkHFlRpF0qiTcJ65KpNaV06e7yTdz8dB6CproKzxzuIJcycdAnAL4VSNnY18dK6dPIlePNP9H0en9amRNQeXQLRJrK1aWB0AGYBhTva5OKvk+VC6Zd+6Zf47//7/57vf//7GIaBaZq8++67/PZv/za/8iu/4sRzFEoIK4VSehD2269pa1djTYAnDrQA5BTBCiJGK7DzRCk9CHs/lSiklt1nVwRrEXftCmVvWD4Emx6ajSfiji/ye5BSP1ESbRLWI5rM7Z3l8oCGcEy/PrXWVXBgS52l60kT70Fs0urlAQ3elMXW612am7WLInY7uKlNSqmy0ybLv8n/7J/9M7Zv387WrVtZWFjg8OHDPPPMMzz55JP8T//T/+TEcxRKiFzFaDlpMQpWWE8IEnvDgzggzmkxSjqQAlTMXbsChzkAVFboqPxItHCDumlK/URJtElYC6WUpSYeQDxhkkjpWTCPXX2iTQ/gxDC+L6VNifLSpkJZ75aTLpTC0cLPC7mtTZb/tf1+P//23/5bfvd3f5fLly9jmiYnTpxg3759Tjw/ocSwKkYA4agulKoC+RRK0rXLwomkJSfFqIi7dq6IUaWLYsQCSimMEk3rEm0S1iJuMY0Vlhp4hkFmVilXPIak3q3ASW1K5rbk3hLidsiislI38cIRd7TJTfJ+J7Bnzx727Nlj53MRHgJiFiNYYUmQqvLo2on17gGc6Np5Uy/KjohR8Xbt3BCjTNfOBTFKkiRChCpW7swoJUSbhAfJq4EX069NVQGv5aLHLw28VXBQmxxp4ok2LUdOlDbgH/2jf5TzA/7+7/9+3k9GKH1W2z2xEUuFkljvNk+J2RtQevjWxR0Ja+Gze0FiDqRPlOKJOIlkAp+3sM9hgYWSKpREm4RcsLq2AiC0KaeD6NIKHGniOWkLL94TJTfdDpGIC7bwUjhRunz5ctbfL168SDKZ5MCBAwDcvn0br9fLqVOn7H+GQsmQNBWJHBOBln9PuriqymtGqfjeYLuKE/YGJ8UI9KmSEdj46wqMG127gD+Ax+PBNE3CkXAmkrVQzKt5Wo3Wgl5zM4g2CbmQ34lS/k4HKZRWo8Rs4cXsdihQ6t1y3DxRihIlpmIEXHqfkNMrwLlz5zK3f//3f5/a2lr+7M/+jMZGvdB
renqaX/u1X+Ppp5925lkKJUF+trulF6NKv3TuNo+DJ0pOWO9AzykVYb3rRqFkGAaVFZWEwiHC0cIXSm537qwi2iTkwuYKJWng2YKjJ0rlNaNUbvOzoLWpiSZXrm35J/f3fu/3+OY3v5kRIoDGxkb+6T/9p/ze7/2erU9OKC3ysd2l7Q0Vfg9ei0WPx8Dy9zz0OD2j5MTehCLt3LkhRuDunJLbXvDNINokrEU+1rvNFEoyO7sKjoQ5pLWpvIKG3E5kNfNoim8WN7XJ8ruqubk5RkdHV9w/NjbG/Ly723MFd9lMkIPEr9qFg9Y7KKvOnRtiBEuFkisR4SV2orQc0SZhLTYV5iBrK2zCwROlhAQNOU26UAKIxqIFv76b2mT5J/fnf/7n+bVf+zV+8IMfMDAwwMDAAD/4wQ/4+te/zksv2bSEUihJ8unaRVKFUqXYG+zByV0VUFZecNdOlNyMCC/hEyXRJmEtCr+2QgqlFTipTU6FOVicuS4UbmiT1+OlIlABlJ82Wf7X/pf/8l/y27/92/zyL/8y8biu4n0+H1//+tf5F//iX9j+BIXSIR8xCkX1m+R8ls2KvWEVnLA3eLxgeLVwlNEuJY/hwYuXJIV9funOXTnuq9gMok3CWmxmRikft4PEg6+Gg24HpxJZMQHr702cxm+453aIxqJam+oLe203tcnyK0AwGORP/uRP+Bf/4l9w9+5dlFLs3buX6upqJ56fUEIUfmBWCqWVOCTQvgDEw2VlvQNtcSh0oeTmiVKYMAmVcCUafbOINglrEU1aPxkIiTbZi6MnSg4GDXmLr1By0+0wMz/jijbNK/fs03n/a1dXV3Ps2DE7n4tQ4sTyECNJFrIZp/YRef2pQql8rHfgUrpQhXv7KkB37hpocOXadiDaJDxIPk28tC1cZpRswpHVFQ4unIWUNsnqijSuBg2V0onSmTNnMNb5gX/jjTc29YSE0mVzyUIS5mAPDv2bOLqvorhPlAqNm/sqQHvBG4wGV669GUSbhLXYjC1cmnh2UWILZ6FotcmtQiljC3dBmxZZxFQmHheW01t+d3r8+PGsv8fjca5cucL169f51V/9Vbuel1CC5CdGYm+wFcdOlBwUJLN4T5RcSReqdG9GCUp3Tkm0SVgNpVTBbeEyP7sKTlrvHD1RKj5cDxpyQZsUihAhaqgp+LUt/2v/wR/8war3/2//2//GwkJpCqxgD/nZG/KPYJWB2VVwqlBK76twJIa1OLt2gJ7VKaMN6FC6yXeiTcJqxE2V16+wuB3sxsE9SmZC7/izW/+KNGjIbeudG6srQDfx3CiUbPup+uVf/mW+853v2PVwQglS6KV+Ikar4dC/iZMnSkXatQOXrHeprl00FnVlsd88D9fOIdGm8iafBp6p1NKMkljv7MGRZehO7/grTm1KJ7IWGjeDhsC9Jp5tP7nvv/9+xjIilCd5We8yEaxSKNmCk2EOUFbx4OCOxaEysPQ6KktnN49oU3mTjy5FY8nMKZQ08ezC4WXoZTY/64o2ubi6AtzTJsv/0g8u7lNKMTw8zEcffcT//D//z7Y9MaG0MJUiYeZmcHj58hAew+Ds8c5M1+5q7wzbWqr54PYEplK8eGLLho8jYrQaNv6bXPyBLrxOvrTkBQ/N6PsTUfBVwKlf2Px1irRrB4U9UTp/9Twew0P30W4qKyqJRCNMzU5x7bNrJBIJfD4fp4+ddvx5lKr1TrRJWA0rToe0Nj22pwkArwdevzbCkwdaLWmTzCitgp1NvOXa5PHqZtv8OHzyk7LSpijRglwrrU07tu4A9InSYniR659dL6g2uRURbrlQqqury0oW8ng8HDhwgN/93d/l7Nmztj45oXSw0rXzGAYvXx4GlsIcLtyZwuf18P6tCV480ZnT48iM0ioYBrpYsmGwxvDAxe/r2+lCKTwLV/+Tvn3qFzd/DZCuXQqP4eH81fMAmUJpZm6GC9cuABREiECnCyml1k2QK0ZEm4TVyEeb5kLaxlX
p9/HKlRHmwwlL2iTWu1Wws1Bark3eAJhhWJyESz/U99mlTeJ2AJa0KRrThVkkGmExtFhwbSqZE6Xvfve7DjwNodSx0rU7e1yLzcuXh7POP9JClP78RsiJ0hoYHnuKj5OpDv3F70PTdn175Kb+eOiFpc9vliIulAp5otR9tBvQ3buaoB5YvdN/B4Aje49kPu80SZKECRMkWJDr2YVok7AaVgql5doEUOH3sBgVbbIHG/9NlmuTr0LfvvOu/mirNhX3iVKhWK5NAKZpcu32NaCw2lQyM0q7d+9mcnJyxf0zMzPs3r3blicllB5WfeCP72/hc3ubs849HtlWz+GuegYmQpmO3nqIGK2FzYJ07Gdhqk//fUy/cadlF0zc139C05u7RjHHgxuFDXPoPtrNiUMnWAhpQRgYGQCgtbmVsakxxqbGWAwvOv48SnFOSbRJWI18tOnAFt2omFrQcy9WtMkAvKJNK7F7fjatTYmU/ey+fhNvqzYVcxPPJW1Kc/OebpoWUptK5kSpp6eHZHLlD080GmVwcNCWJyWUHotxay8o790a58M72W9qPumf5ZP+WQDOHu9Y1wtuANV+d3YJFD82i3S6Y7ect7+1dPvkVzbnBy9iMXJjYNbnW3nNc+fPZW53H+123OqwoBZoM9ocvYbdiDYJq5GPNt0ayn5DZkWbavOIEy8PnIgHF20q6DVd1qYYMWIqRsAIbPzFNpLzv/SPf/zjzO2f/OQn1NfXZ/6eTCZ5/fXX2blzp61PTigd+matpaA8eaCV9z+dYD6ydJrwyLZ6vpSyNtQF1++W7GmsJugvfDxmaWBzpHRilYHRp7+hO3cAwYbNPX4Rz8IYTsWtr0MisfKE7czpM7Q2tQJQXVXt+HOI4M6ejHwQbRLWIpY0GVqw9rP86M5GXvt4BFMtTXta0aYjrbV5PtuHHCeKDqe1yYXX/2KmWLQpQJEWSl/+8pcBMAxjxZZzv9/Pzp07+b3f+z1bn5xQGsxHE0yErUVz/vWlQeYjCQwDfuOFPXzr1bt80j/Ltpbghj7wgNfDwebCLx0rCZSyV5Au/Qiu/hU074TJHmjdC+N3tK3h4Bfsu44AwIVrF7h88zJb2rYwNDZEY30j07PTjE+O88jeRwr2PEqpUBJtEtaify5MjmGsGX74fh+mgroqH19/YQ9/8J9u5axN7dUVdNRIFP2q2F0opbXJXwXxMOz8HPR8WDbaVOgmXlqbqquqWQwvsr1zO33Dfa5oUx11BbseWJhRMk0T0zTZvn07Y2Njmb+bpkk0GuXWrVv87M/+rJPPVShSemZDlr7+lSvDfPjZFABPHGihttKfuf3y5WFeuTK87vc/0lJLwCupQqtj42nSpR/pYdlTvwgNW/V9Hfv1x5uv6c/bQvF27QopRheuXeD81fOcPnaaHVt0DGt9jT4duX7neiZhqBCElTt7MvJBtElYDaUU92esadN//miQe6N6zuKlJ7Znfv9z0SYDONZW2DdwJYVySJvSO/52P64/ijbZznJtaqhrAGBLm7afloM2WTY53r9/34nnIZQoSVPRO2dNjKYW9HG5x4AvHG3H5/Fw9ngHTx5opT7ox1RrtwDrK3zsrK/a1HN+qLEzzlSZWohOvgSv/aG+r6JW+74TURuFT8QIwFQmp4+dpvtoNx/f+jhzf/fRbhKJBKadbzQ2oJROlNKINgnLmY7EmYtZC4rpGdNFUkdDJUe217MQTuSsTXsbq2U+aT3sPFFark1X/0rfV91kvzaJLRzI1qbRyVFAr18oF23K6bf6j/7oj/iv/+v/msrKSv7oj/5o3a/9rd/6LVuemFAaDC9EiCWteRvmQlq8uvc201SjhzHTw7EbWRsebasruf0uBcVOMVo+BJtOpquqs9/WIP87gexdFH6f7pIqpQq2o2I5pVIoiTYJa3HfotMhEksyNK271V98tAOPYVAX9OekTRViB98Yp7WpptmeJbMlQiELpdW0yePxlI025VQo/cEf/AFf+9r
XqKys5A/+4A/W/DrDMESMygyrYtQ/EeLTwTk8Bjx/rMPS926traQluErKjbCEUyk9yVQkrseJjmnxVkpuhDkA+FN2knhi45h8J4io0iiURJuE1YgnTQbmrP0Mv/vpOOFYkrb6Ch7d2Wjpew+31OIXO/j6OKVN6UKpzLTJLdKF0mrBDoXADW3K6SdruaVB7A1CmoVYgvGQtRCHVz/WHu+Tu5toqcu96PEYcFTShDbGqSPwZOpF0VteYuRaoeR3t1AKUxozSqJNwmr0z4dJrmOTe5BoPMmb18cAeOFYBx4Le5DEDp4jThRKpqkDjKDsCiW3tCkdEV5O2mS5BfK7v/u7hEIrTxHC4TC/+7u/a8uTEkoDqyEOQ1MhrvfNYmD9NGl/Uw1B2Zu0MY517VKP64gYFS9ui5FrXTsiKAtvNIsB0SYhjdUQh/dvTbAYTdBcW8GJ3U2WvvfRtnqxg+eCI4XSstdHJ5p4Rfy/1bUmns9lt4ML1jvLhdLv/M7vsLCwcjtuKBTid37nd2x5UkLxYypFr8XdSa99PALAozsbaG/IPUK1yudhf5P4v3NC7A22Uq5ilCRJAneKtHwRbRJAhzjMRnP/2Y0lTM5d1wPqzx9rx2vhNKmrtpKWYGF3upQsTrgdlhdKZaZNblGO1jvLhZJSatXuyccff0xTk7VOjFC6DC9EiCZzf+EbnQnzcc8MAC88un5gw4Mcaa3DZ0G8yhrHZpQctN5JN3YFbhdKUDqBDmlEmwSwfpp0/vYE8+EEjdUBHtuT+8+J19DaJOSIE9qUXF4oObGAvni1yW23QzmdKOX8rqexsRHDMDAMg/3792cJUjKZZGFhgb/39/6eI09SKD7uz1g8Tbo6igKObK9nS1Pufu7mKj9dtbLAL2dK8kSpeHFNjLzuihFoL3gtxT8XKNokpEmYJgNzuWtTImly7po+TfrC0XZ8FgIZtB3ciTfnDylOWu883rJruJWr28GNGaWc3/X84R/+IUopfv3Xf53f+Z3fob6+PvO5QCDAzp07eeKJJxx5kkJxsRhPMBaK5vz143MRLt3TC2a/aPE06Zj4v63hdKEkYQ4FIS1G6cWpHk/hE7UiKlLM/2syiDYJafrnIiQszNZduDPFTChOXZWfz+1rzvn7qnxe9okd3BpOnig51cCT9x4rcLtQihEjqZJ4jcI1KXL+6frVX/1VAHbt2sWTTz6ZSWUSyo8ei7NJb1wdRSk41FXHtpZgzt+3o76Kxkr5ObOE09Y7J+wNIkYrSIsRaEGqCBQ+Fr9UrHeiTUIaKwFDSVPx+lU9N3vmaDt+X+7NiKOttWIHt4qTJ0qONPCgmDtFbjfx3JpRAogSJUju7yU3S04/XXNzc5nbJ06cIBwOEw6v/ma5rk48uw8zOsQhdzGaWohy4c4koJf45YrPY/BIS/HbfooOp+LBxXpXULxeL4ZhoJSSQmkdRJuENDORONOR3Lvcl+5OMbUQo6bSxxMHWnL+vuaqAFvFDm4dR06UnNzvV9yU64wSaG0qukKpoaFhQ/tTepA2mXSooy0UBSOLUSKJ3N+Mv3FtFFPBvs5adrblblU41FxDpU/835YR652tuCVGhmHg8/qIJ+Kude7Cqvh3KYk2CWmsnCaZpuK11GnSc0faCFg4TXq0rU7s4PngZOqdY4VS8f5/dvtEydX5WRUu6P+anH66zp075/TzEEqEHguJQjOLMc7fTp0mHc/9NKnG72VPY7Xl5yZQAOtdeRVKbuL3+Ykn4mWVLmQV0SYBIGEq+i2EOFzpmWZ8LkqwwsuTB1tz/r6d9UEaxA6eH45Y71KP6ZT1rogLYrcLJTetd4XWppx+up599tmcHuzKlSubeS5CkROKJxlZzD3E4dz1UZKmYnd7DXs7crfRHW2rw1PEL1BFjaTe2YpbYgTuC1IpFEqiTQLA4HyYuJlbiIOpVGan37OH26jMMbnO7zF4pEUCHPKmFMMchBUUw4lSobVp01FKs7Oz/Mmf/AknT57k1Kl
TdjwnoUixMps0H47z/q0JwNpsUnt1BZ014v/OGyfESClnO3dFXBS7WSilveCxRMyV67ux2M9ORJvKByu2u2u9M4zMRKj0e/j8odxPkw4211AhdvD8cTQeXKx3hSKtS4lkAmUhYdJOSqZQeuONN/jlX/5lOjs7+eM//mN+5md+ho8++sjO5yYUEUopS2L05vVREknF9tYg+7fkdppkAMdkgd/mcNLeAOB1wnZSvGLkJm6fKLmxr8IORJvKi7lonMlwbt1ttew06enDbVRV5PYGuyYgdvBN4+SJkqTeFYwHE1ndoNDzs5Z+ugYGBvjud7/Ld77zHRYXF/nqV79KPB7nhz/8IYcPH3bqOQpFwOhilHCOIQ6LkQTvfpo+TerMefB1T2M1tTkKl7AGTg7MQtlZHIrBeiczShsj2lS+WFlXcWNgjsGpMBU+D88cbsv5+46JHXzzlOKJkvwvX4FvWVGaSCQI+AMFfw5Fe6L0Mz/zMxw+fJgbN27wx3/8xwwNDfHHf/zHTj43oYi4b+E06ac3xoglTLY2VXG4K7cTooDXw8Fm8X9vGie7dlB2YQ7FUCi5daIUJYrpVNy8jYg2lS9JU9GXozYppXj1yjAATx5spboyt9eyjuoKOqrFDr4plHK2iScnSoW7biqRFcqniZfzT9crr7zCb/3Wb/Hf/rf/Lfv27XPyOQlFRjiRZGQhtxCHcDTB2zfGAD2blOtp0iMttQS8mx6ZE5zs2hkGeBz4f1TEndpimFGKJ90bmo0SpYoq166fC6JN5cvQQoRYjiEOt4fm6ZsI4fcaPHckt9MkAx0uJGwSpxoujoc5iDatht/vJ5FMuFcoFXh+Nud3PW+//Tbz8/M89thjnD59mv/z//w/GR8fd/K5CUVC72yYtaTo5ctDvJLq0gG8enWESNykta6C4ZkIL18e2vDx6yt87Kwv7jdjJYOdhdLFH8ClHy0t9TO8+r7QtL7/4g/su1aR4oYYnb96ngvXLmROlBbDi5y/ep7F8CIXrl3g/NXzBXsupTCnJNpUvtxfZ13Fcm1SSvHXlwYBOLm7ifdvTeSkTXsbq6kNlJfd2BHsbuCltSndxFOq7LSp0KR1CZbcDvOhec5fPc+7l959qHUp50LpiSee4Fvf+hbDw8P8N//Nf8Nf/MVfsHXrVkzT5NVXX2V+ft7J5ym4xEYhDh7D4OXLw7xyZZhIPMkHqaS7hmo/P7k8nJOvWxb42YidgmR44OL34dpf6797vHDphykh+r7+vD0XsulxHg48hofzV88zOaN3kIXDYS5cu8CFq7pI8tj2774xpTCnJNpUnszHEkyE106EXK5Nd0cW6J/Qb64SpsnLOWhThdjB7cPuQimtTT2pkBZlOqNNRfy+pNBNvLQuXbh2IWO9W1hc4MK1C1y+ebngulTIxD3L/2XBYJBf//Vf55133uHatWv843/8j/nn//yf09bWxt/5O3/HiecouMhYKEYovvaL3Nnjnbx4opOXLw/z3TfuEYnrI/bPhhd48UQnZ493rvv4W2sraQlW2Pqcyxo7BenkS3DqF+GTl/XfPalo3Juv6ftPvmTThUSMltN9tJvTx04zMqHTuZJJ/f/0+p3rnD52mu6j3QV7LqUUES7aVF5stPx8uTb9xTu9mfsv3p3OSZseaanFL3Zwe7C7UEprU/9l/XfRJsdJ69L5q+eJxvQoxr3+ewAc2XukoLpkYhKncLa/Tb0KHDhwgP/9f//fGRgY4Hvf+55dz0koInKJBH98fwun9zVze2ipc/vItnoOd9UzMBFiLrT6D7THgKOtuS+iFXLAbi/4wTOw83P6diz1s7DjFGw/ARP3tdVhsxSvFrnmAz+89zDtze0A3Om/A8CurbvYsXUHY1NjLIYXC/I8SuFEaTVEmx5ukqaid25j+83j+1s4ur2eqYWlk6dctKmhwscOsYPbhxOzswfPQOtefXvgY/3Rbm0qYtxq4p04dCKjP/0j/QC0NrcyNjX20GqTLeZbr9f
Ll7/8Zb785S/b8XBCETER2njZ5Xu3xjn/2WTWfZ/0z/JJ/ywAZ4938OKJLSu+r6WqgqBf/N+2oVR2lLcd3Hwdej7Mvq/3ov4DcPIrcOoXNnmRIu7aulTEXf/sOqOTo1n33R+8z/3B+8BSd89pSrVQSiPa9HAyH0sQS27cFHrv1jjX+maz7stFm7bVVYkd3E6cKJRuvg7jd7Lvs1ubCmgnKxXSIUPLOXf+XOZ2IbWpjsIErci7VGFdmqsCDC2s/2bpyQOtzIcSvH97InPfI9vq+VLK2lAXXH1J6XgoSjiRpEq2nduDSgI2nygdeh7G7ix17EB37U5+Rd8ONmz+GkW8m8mtzeNH9h2hf7g/Y78DfaLUfUzbG6qrCrP8MunEGxxB2CR1FT78HoP4Bol3Tx5oZXQmwsc9M5n7ctGmvrkwexurpViyCzO31FxLHHoe7p2HmQF0R0vZr01GEWvTmhFbzrLauoozp8/Q2tQKFFCbKJw2SbksrEt79cbzQx/cnuD92xPsbF36Bfmkf5YbA7N0tQTXFCPFxj5zwQLmxqd/lvn03FKR1JayOfRehL7L0LILgo2bv4Zn9Z+PYsAtMbpx50amSNrathXQJ0q9g720NbU9lGIkCLniMQzacpht/eD2BB/3zFCzbGdSLto0G00wFXEvlv+hwyltmhnQt4+8qD+WkTa5QTq4obFO/9t2tuqGw/jkOG1NbYXVpgI28aRQEtZlo0LplSvDvHx5mBdPdPLzj3dl7v/c3uZM4tB63J8JYbrUtX/osFuM0glCXcf03wOpF8BDL+j7L/3InusYIkbLSUeA7+raBZBZ+npk75GsiNZCIIWSUKxY0aZnDi/tTXriQEtO2nRvujCzFmVB0iFtqtVznASC+qPd2lTEhVKhm3hpXTp97DTNDc0AdLR0ADpoqJC6BIXVpuI9VxSKgqDfS23Ax3xs9dkXU6lMgpBSiqaaAFMLMbqaq2iq7dywCIokTYbmI3TVyeDspknabG9Qpk4QSsZg4Kru0J38irY8BBvtC44QMcrCVCanj52mOljN/YH7eDweuo92c2TfEaqD1ZnCqRAksHnmTRBsom2DQmm5Nk3OR/nrS3pv0pMHWqgP+jfUpoH5CEcTSSrFGr557G7ipbWp9yOYB2rbnNGmIm7iFVqb0rrUfbSbn7zzEwAC/gDdR7tJJBIF1SWQQkkoMtqrK9YslJYPwhqGwWN7m3jlygg3B+f4xhf35vT4d2dCUijZgd1ilB6Effvb+mNN89J9tsWvUtwzSi4USulB2Jv3bgLg9Xgz9xUyghV0DKsgFCNBv5e6gI+5HLSpubaCHa3V9I4vcndkYcNocEhZw2dDHGyWZNZN45Q23X5Lf6zvgP3P6NuiTY6wPKAhPbvn9/k5fuh4QZ9HGplREoqKXOaU0pzY1QTArcE5FiK5daMnwzFmxQ++eZzwgQNEF/THSofeMEjXblXS8a9uBUqAnCgJxY0VbTq5W89VXLo/lfP33BNruD04pU2R1EqSCgcWAxveok69c1WbUoVSoU+RliOF0hp885vfxDAM/rv/7r9z+6mUFS1VAbw5hv+0N1SytakKU8HVntz3GNyVUIfNU4piBGK9W4O0GLlZKMmMUm6INrmDlULp+K5GDAP6xkNMzOVmU44kTIY3SH0VcsBuWzjoVRjx1C6tSge0qYh1CUSbCtnEK5lC6cKFC/yrf/WvOHbsmNtPpezwegxackgYSnNytz5VunQv90Kpfy6c014MYR3sHphNkz5RkkKpoHhS3cxy6dqVKqJN7tFsoYlXW+VnX6c+Fb98z9qpkrBJnGjiRVK6hAEBJ06UileXoDi0qVyaeCVRKC0sLPC1r32Nb33rWzQ22hD5KFjGkv1udyMGcG90gemF3F4gk0rRN7vxpnVhHZzYVQHLrHdOFUriA18Nw2Okn4RryB6l9RFtcpfNNPFyfZM3HooxFxVreN4oBaYD/36ZBl4QPA68lS3iBp7bFMOJkhRKD/C
bv/mb/O2//bd54YUXNvzaaDTK3Nxc1h9h81gplBqqA+xq12+qr9zP/VTp3syiq794JY/j1jsnZpQ82gsurKDcfOCliGiT+3RY0KajOxrweQ1GZyMMTefemJNTpU1gxnGk25M+UXJElyjqBh6I9U72KC3jL/7iL7h06RLf/OY3c/r6b37zm9TX12f+bNu2zeFnWB7U+L0E/bm/oc0MzlqwOCzEk4yFHHqzXw44USglopBMdQPFB15Qys3eUGqINhUHVpp4VQEvh7rqAbhswRreNxsmLtbw/HAsZCjVwHPM6SDatBZFUSjJiZKmv7+ff/gP/yF//ud/TmVlZU7f80/+yT9hdnY286e/v9/hZ1keGIZBuwWLw6M7G/EYMDgVZnQm92HYu7LkLz+UcmZGKd21M7zgdyDCXcRo4+dQJmJUSog2FQ/VeTbxLt+bzjnRLqEUfXNiDc8Lx5wODs/OyozSmpSb26GoC6WLFy8yNjbGqVOn8Pl8+Hw+3nrrLf7oj/4In89HMrnyH6qiooK6urqsP4I9WOncVVf6OLhV/9tfthDHOrIYZXGNvRjCOqgkOLHzZnnXzshxatoKUiitiZwoFS+iTcWDYRiWtOlQVz0Vfg/TizF6xnJvzIk1PE8cm5110hKOaNM6yIlSEfH8889z7do1rly5kvnz2GOP8bWvfY0rV67g9cpsQyFpDQaw8lb5RHpw9m7ug7MA92fFD26Zku3aiQ98LdJhDm4+BymUVke0qbiwUigFfB6Obm8ArKXfzceSjIs13DpOa1MZhgyBFEqF1Kai/kmora3lyJEjWfdVV1fT3Ny84n7BefxeD81VASbCub3wHdlej99rMDEfZWAyxLaW6py+r2c2xKHmWrweB04wHlac6tqlgxycWjYrXbs1ydgbTPfsDbJwdnVEm4qLdBMv19/Wk3ua+OjuFFfuz/Dl09ty1pp7M4u0WSjKBEp3bYVY79akGNwOskdJKFqsdO4q/F6OpDp3VnYqxZKKgXnxg1uiVMVICqU1KYaunemEnVMQbMbv0U28XNnXWUtNpY/FaILbQ7mnDw4tRAnF5ZTVEk6nsZZpmIOblJs2lVyh9Oabb/KHf/iHbj+NssVKoQR6pxLA5fvTmGbuv1R3p0PiB7eCY8lCaXtDeUawuomB+2KUICG/hzki2uQuVrTJ6zF4dOdSqIMV7s9I4JAlnNYmmVEqOMUQ5iAnSkLRUl/ho8Kb+4/Nwa11VAW8zIXi3B1d2PgbUsxE40xHZMlfzpTsjJKI0Vpk7A0uJ+/JqZJQClht4qXT7671zhBL5P4z3jMbJmmh6Vf2OO12kBmlgpMulMplGboUSoIlrCYM+bweju1sAKztVAJZ8mcJ2VXhCEUR5uDyiY4EOgilgNUm3s62ahprAkQTJjf6Z3P+vmjSZFCs4bnj2PysNPHcohhOlCT1TihqrHfudPrd1Z4ZEhaW9g3Mh4kk5E1aTiSdFiOxNxSajA/c5e61FEpCKWC1iWcYBid2WV+MDnBXmni540QTT6llTTzRpkJTDGEOUigJRU1bMPehWYA97TXUVfkJx5J8Opj74KypoHdWOnc54fiMktgbCk0xdO1ACiWhdMjXfndzYI5wNPeZh+lInOmIRIVviFJgOmChj0fATL0uOXKiZOgl60VMMWiTFEqCsAYVPi+Nlbl3WzweYynUweLg7L2ZxZy3p5c1TicLOXWiVOT2Bjcphq4dSKEklA5Wo7s7G6voaKgkaSqu9s5Y+t6703KqtCFmHEcGWdINPK8ffA7EtXt8zixYt5FiKJTKxXpX3O1coWhpq67IOWzh5ctDxFIWuut9M0TjSaJxk/dujRNLmAR8Hl48sWXV7w0nTEYWomyprbTtuT+U2FkoXfwBGB44+dKSIN19F+rb4dNzoEw49Qv2XKvI7Q1uBBmcv3oej+FhV9cuQAviYniR659dJ5FI4PP5OH3sdMGejxRKQqlQ4fXQWOnPWZt+cmWY2io/IzMRLt2b5lB
XPe/dGufJA618cHsCU6k1tWlgPszRtjpLc1Flh90NvLQ2bTuu/x4IwqUfwqHn7dUmaeCtSlqbfD5dOiTiCc5fPc+RfUe4cecGpjILpk1SKAlFT0ewgluTuaXYeQyD929NEgx4CcWSXO+bpb2+kleujADw4onOdb//7syiFErroZS9yUKGBy5+P+UDT0Xh3nxt6eOpX7TvWkVeKLmBx/Bw/up5QhHdsVZKF0oXrl0AKGiRBFIoCaVFu4Umnscw+GxYn5rfGZlnaCrMK1dGmA8neP/WxLraZCronQmxv9khW/LDgN2FUlqb5vR7B/yVulAKz9qrTSWgS2408dLatH3LdgBiiRgXrl0gHA5z/c71h7aBJ4WSkBeNVX78HoN4DoPmZ49rsXn58jAAl+9NUV+t55yeONCS+fxajIdizEXj1FUU/4uXK6gk2PmiefIl/fHi97PvTwtR+vN2YBT3S5Ab9obuo92A7t6BLpRufHYDgCN7j2Q+XygKua9CEDZLe3UFn+bYxFuuTUqRWT6bLpI20qZ7syH2NVUvxSUL2didePegNgWq9Ee7takECiU3WKFNKX1MF0mF1CaZURKKHo9h0BrM3Rt89ngnn9ur0+9uDMzx/q0JALa1BBmYCDEwEWIutHYXUKLC18GJ+NWDZ2D3E9n37TgF20/AxH0IWZs1WxVDfOBr0X20m0N7DgEQjUW5fuc6AK3NrYxNjTE2NcZiuDCLLwu5r0IQNktjpW7i5crj+1vY2VYNwJufjAHwyLZ6DnfVb6hLoXiSkUWHEkcfBpzYoXTwDLQf0LcnevRHu7WpyEOGwD1tOrz3MJ2tuoEwMDIAwK6tu9ixdUdBdamQy9CL/6dBKFoaKv0MLURy//qalWl5//7dvszts8c71vSDixitgxNidPN1uPd+9n29F/UfgJNf2bwXvAS6dm4uW/V5V748nzt/LnO7+2h3QawObi+8FQQreAyD+go/E+HcXhffuzVOz1j2m7tP+mf5JLVbaT1dAhheiNJZI9bwVXGiiXfzdRi9lX2f3dpUAjNKbgUpXP/sOsPjw1n33R+8z/3B+0DhdKmQSKEk5E3StPaLutr2868+tZ2upiAAdcG1X5ysdAjLjqQDEeqHnoeR2zB0bem+Hae0CAEEGzZ/DW/xv7mIKweibXMkFl/5Ru/M6TO0NrUCUF1VXZDn4S3ymFxBeJCEhU7zkwdaGZ2J8HHPTOa+R7bV86WU7W49XQLRpnVJ5t5IzZlDz8Pd92B2GDAAVZ7ahDvadGTfEfqG+hidHM3ct2vrLrqPadtdwXQJb8Esr2K9E/Iml/mkNK9cGebN62OkNeXErgYA+idCdLUE6WoJblAoyY/qmjhRKH16bqlI6jqmP/ZehL7L0LILgo2bv4bHgVhXm3FLjC5cu8Ct+7prWl9bz5G9RwAYnxynramNtqa2ggmSn+LvrgrCcqwsNv/g9kSmSGpIadAn/bPcGJjdUJcAApJ6tzZOadNs6kTjxM/rj3Zrk1e0aS1u3LmRKZL2btsL6BOl3sHeguqSr4DnPPIbLuRNIsdC6ZUrw7x8eZizxztIf8sTB1oAPTT7ypXhdb5bI2K0DnaL0aUf6WHZtn3675X1+uOhF/T9l35kz3VEjFblwrULnL96ngO7tA/f7/NzeN9hQA/NptPvCkUhBUkQ7CDXJl5am9KLZysC+vT0iQMtvHx5WLRpsyQc0qbKOv33Koe0SZp4q5LWpo6WDgC8Xv37cmTvEc5fPV9QbSqkLokCCnkTz9F6p3dRdPL4/hZeuTKCAbTUVXL2eAexhJnTQlkRo3Ww296gTJ0gNN0PY5/p/Uknv6ItD8FG/Xk7kEJpVdK7KJrqm7h1/xZ+n5/qqmq6j3aTSCQK7k2XQkkoNaxqU2NNgEv3pqmu8HL2eAdPHmilPujPUZvEercqSjmnTdf+Wv+9sUu0qYCktWkhtMDIxAhVVVV0H+3myL4jVAerC6pNUigJJUE8mVvXLj0IOzqju0u
VAS8N1YF1B2QfRMRoHezu2qUHYX/8v+qPDV2wOzWcaWc0uHTtViU9CPvpvU8B8Pl8VFdVuzYgK4WSUEqYSpGrKzytQT9Npd3VVfkz920UDZ5GmnhrYMawdW0FaG2KR5biwVt2whZ92m6rNhX5jJJSylVtevXdVwE9j3Ti0AmAgq+tEOudUBLk2rVLE47pmOGqgPXhcBGjdXDCBw6wOKU/Vjc58/hFLkYAMeVAomCOJBJ6f5Hf5+6MkBRKQikRtzCflCajTRXWf9YDMj+7Oo7pUir+218J/ipnruFZmdBbTLg1n5S5flJf3+91T5ukUBJKAithDgChqBajYIUUSrZhxkE5sBBUmUuC5FShJCdK6xJL6CLN7ULJi6TeCaWDVV0CCMX0a6g08WzEsUJpUn+sbnJmD58nAEZx/z91vVCKpwolv4uFUgGX1Rf3T4NQ1CTyPlHKo2snYrQ6TsSvAoTnQCW1EAXrnbmG+MDXpRhOlLx48RT5mwZBWE4+hVI4Km4H27HbEp4m7XQISgPPtesn9PV9PvfcBnKiJBQ9SqmcZ5TShKKb6NqJvWF1nLbdVTU4tKXcKHp7A7grSOUmRoJgB1YbeLDUxAtatN55DfDKHqXVcaqJF3LaEi6F0obXT2mTm008KZSEoiepwGrfLpLxgefTtRMxWhWnu3aO2e4CztgmbKYYCqVyESNBsAOrDTzIf35WTpPWoWRnZ6VQ2ohicDtIoSQUPVaDHABC6a6d2Bvswykxkq4dSZXEtDu1yQJSKAmCdfLSppTbwer8rOjSOjgd5uBYE6/4Q4biSk6UpFASip7Eprp2MqNkG0537ezYcr4aJZB453bXrtzESBDsIK8ZJTlRsh+nrHfLwxycoASaeMWiTeViC5ffciEvNtO1s2q983kMPCVg03IFx8QofaLU7Mzjy8DshpSbvUEQ7GAzM0pWm3gyO7sGZiK1R8kBnD5RkkJpXZRSZdfEk99yIS8207Wzar2Trt06OO4Dd+pEqfjFKIZ7O5SgSLp2BYxgFQQ7sDqjlEiaxBK6uLLaxBNtWgOnGnhmAsKz+rasrXCFZDKZue1qoSTx4EKxs6muncVkIRGjNVCmgydK6a6dQydKJVAouX2iVG5dO0Gwg3wXoQNU+a0WSuJ0WBXHZmdnAKWTWCtrnblGCdjC3WzipXUJwOcV650grEleyUJ57qoISPzq6iSjzjyuUs77wGVgduPrS6EkCJax6nZIF0qVfg8ei1ojTbw1cNoSHmx0bilsKZwouahNGaeD14fHReupFEpC0ZNf6l1+e5REjNbAqa5dLASJVBEmPnDXkBklQbCO9f1++TkdQLRpTZzSpgWHG3iGDzzWU3kLTTGsrXDTEg5SKAklgNWuXdJUROO6uJIIVptwej6pogZ8Di2FLYWuXZFY78olWUgQ7MCqLTycauDJ2gobcWq/X0iCHKA4CiU3G3gghZJQAiQsFkqR5T5wq8lCIkarU6pBDlASgiTJQuCl+LurgrCcvK13+RRKknq3Oo5pk9OW8OLXJXBXm4rB6QBSKAklQDxprWuXtt0FfB684gO3B8e6dk5Hg/ud85fbiJtiZJomSuk3fGK9E4TcsRzmEJVF6LbjeMiQnCi5du0iaOCBpN4JJYDlrp2Ikf0UYmDWCUqkaxdT7iULxRJL13ZTkPyGu2IoCFaxugw9Mzub14ySBA2tQKkCuB2cKpSKP2QIiiTMQWaUBGF98o1gtbqnAiT1bk0cEyOnu3YlIkZFYG/weDxlkywkCJtFKUVC5We9y6eJ55cm3krMKGA9FTcnnC6USqSJJydKhdUmUUEhL3KZUXr58hAew+Ds8c6MGPm9Hl6+PEQsYRLweXjxxJYNH0dOlFbB7q7dxR9oO9zJl5Z84BP39fDsp+f0zqZTv2DPtUSM1uT81fN4DA97tu8BtBgthhe5/tl1EokEPp+P08dOF+z5SKEklBK5Oh2ytCnldjAMLGmT32PgMaSJtwK7G3hpbTrx5SV
b+L0PoLbVfm0S692qpHWp+2h3polnYHD+6nlXdAmkUBJKgFxmlDyGwcuXhwGoqdQ/aj6vh1eujADw4onOnK4lhdIqqDio5MZflyuGBy5+X99Od+36LsGlH8HN1+DUL9p3LRGjNfEYHs5fPc9CaAFYKpQuXLsA8FCLkSBsllwT75ZrUygdNGQYlrRJdGkN7J6dTWtTPAJm6v/V9b+BZFy0qUCkdQnASDcHDFzTJZBCSSgBcuncnT2uxebly8Ps36K3aM+H9S/4EwdaMp/fCBGkVUjYPJ908iX98eL3wbssEjwtROnP24GI0Zp0H+0GyIiS3+fnxmc3ADiy90jm84VCCiWhlMh1h9JybWqq0a93/eOLQO7aJLq0BnbPzi7XJoDKGogsOKNNJbAIXSlVcG1arktbWvVJ6+z8LOCOLoEUSkIJkOuM0tnjnUTiSd68PgbA+JxeZLqtJcjARAiAuqCfuuDafle/zCitxIn5pINnYGECbp1bum/HKdh+Qtvwgg32BDyUgBiBewOz3Ue7GZ8a597APabnppme0zNjrc2tjE3p36Pqqmqqq6odfy5SKAmlhJWQoQe16c6IPsXNVZv8Eg2+Ok5p0+gtGLiqiyRwRptKoImXIIFyagZsHbqPdhOLx7h88zIAU7PaeeKGLkFhV1eICgqWMZXCSuhdwLdSUP79u32Z22ePd6zpBw94jKWjXmEJJ8To5uvZRRJA70X9B+DkV+zxgpdImEOUqGvXXk0Iz51f+n/TfbS7IHaHgOHQwmFBcACrIUOb0iZJvFsdp7Rp4Gr2fXZrk+GFAkZO54uburRa0p0rukSgoO8Li/+nQig6rC6bjSVWitdXn9pOV1MQYN3TJJ/YG1bHCTE69DyM3YWBK0v37TilRQh0184OfIXpOG0GpRTzzLt2/XB45f/fM6fP0NrUClCwrl0ttQW5jiDYQbKA2iQnSmvgxH6/Q8/D/Q9huh8wAGW/NvmqdaJHkTPHnGvXTgc5LKccdEl+0wXLWCmUXrkyzJvXx2it00fauztqAOifCNHVEqSrJSi2u3xwQow+PbdUJHUe1h97L0LfZWjZZZPtzp89A1WkhAiRxMawDAtcuHaBkUk9VP74o49zZO8RAMYnx2lraqOtqa1gtrtKSuP0TxAgP21Kvzc+uVu/vuWsTXKitDpONPE+PZcqkoBHf05/tFubSqCBBzCv3GngXbh2gcs3L2diwXd37QYKr0sAtYYUSkKRk2uy0CtXhnn58jAvnujMCM7BVKjD+7cmeOXK8IaPIV27NbBbjC79SA/Ltu3Tf0/vqTj0gr7/0o/suU6JiJFbXbsL1y5w/up5aqv170ltdS2H9+mi9fqd65mUoUJQS63YXoWSItcdSmltOnu8g/S3PL6/Gchdm3zSxFuJGQe18tRhU6S1qTL15rha/38qW21ShdemtC51H+nO7FE6uv8oUHhdgsKfKIn1TrBMrl07UylePNHJ2eOdXO+bAaChOsDZ4x3EEiZmDqImYrQGdhdKytQJQuN39d8bu7St4dDzulunrHn/16RExMitrp2pTE4fO82NOzrprq6mjuqq6sz+CtOu/w85UOiunSBsllybeGlteupgayYSvLm20pI2SRNvFZw4TUrvSbryl/rvLTsd0qYaex7HYdywhKd1ae+OvVy4fgG/z09jfaMrugSF1yYplATL5FooLR+CjcT0L1JTbQWP7W3O+Vqy+XwVVBLMmL2PmR6E/f5v648tu6DrmL5tZ/xqiYiRWydKp4+dJmkm+fDah8BSoeTGnooaSuP/lSCksapNk/N6MN7vNWisCeS0AD2NNPFWwQlL+Klf0Lv90otnW3dD+379OVu1SZp4a5HWn96hXkDrUk2wxhVdAplREkqAXO0Ny4km9LxHhd/aj5zMKK2CE2IEujM3r2M+qWt35hoiRhuysLiAUgqv10uwMuja85ATJaHUsBo0FI2ndcl61LCcKK2CEydKAHOj+mNNC3gc6u+XiDa5GeY
wt6CvnbaGu4XMKAlFj9VkIYBoXJ8oVVoUJOnarYJTYhSa0dvODQ/U5H7qZ4lSESMXfOCZa6fEqK66ztUZIUm8E0oN64WS1qW8CiUJc1iJ04WSUw08T4VzBZiNJFSCECHXrp/Rppo6154DFN7tIIWSYBmrYpQ0VSaG1aogSdduFUq6a+feCYkV3IwGn1ssDjGSEyWh1LCqTZHUiVKlRacDgE+0aSVOuR2cLpRKxBLupi5BcWhTgAAVRmEXA8tvumCZXAdm08TiSzHLVgVJrHerUKpi5A3qpX5FTkIlWGTRtesvP1FyEzlREkqNgp4oiTatxKkm3rzD2uQXp0MuzC/oQs1NbXJDl6RQEixjvWunxcjrMSwvkJWFs6tQqvaGErHdLbDg6vUzPvAa9woV2aEklCJJi+lbmzlRkkJpFRzTptTsbG15a5OcKLnjdJB3oYJl8h2YFTGyiVLt2pWIGLndtSsKMZIdSkIJkneYQ8D6iZJY7x7AiTTWNJkmXpszjy/atCGxeIxINAK4r02FRn7TBcvke6Ik9gabkK6do7jdtSsKe4PMJwklSN7a5LOmTR5DOySEZThlCY8uQjR1yl/mTTxXZ2dTToeKQAUBf8C15yEnSkJJYDUefDMRrNK1ewBlQjLizGM73bUTH/iGJBIJQhGdauRm1052KAmlSN5uh4DV2VnRpRU4bQmvqge/E3ZgQ8/PlgBuatP8YqqB53bIkJwoCaWA1TAH8YHbiFNFknTtMri6pyJluwv4A1QECpvssxw5URJKEcsnSrH83A6ytmIVSnl2tgRsxkqpojhRcr1QkhMloRQo7K4K+RHNwrH5pJTtzqmuneEFT2mEA7i5bHb5Qj/ZoSQIuaOUImnV7ZDIr4knDbxVcFqbytwSHiFCnLhr1y+WNFY33A7yLlSwTCHDHKRz9wBOd+1qHRyWla7dhpRz104QNoNVSzjkbwuXBt4qOL62oryDHNyenS2GkCE3diiBFEpCHiQLdKLkNQw8JfDmuqCU6g6lEhGjKFFiOJTclAPFIEYgJ0pC6WG1gQdL2lQp1rvNU8rWuxLA9TTWIjhRckuXpFASLJPv9nPxgduAiJGjuN21K4bEO9mhJJQi+RRKkVhamyTMYdM4bb0TbXLt2kqponA7uOV0kN92wTJWwxzyThbySqG0AimUHMX1rl0RnCjJDiWhFJETJRdxKo01GYeFSX3bMVt4aSR8uqlNkViEeELPR9VWu+c2kBMloWSwHg+e364K6dqtglPWO8e7dqUhRm6fKC0Pc3ALmU8SSpGkxQYeLIU5WD9RkkIpC6fSWOfHAQW+Ch00ZDeGH7zu7QSygqtprCldClYG8fl8rj0POVESSgJTKaw27pasdyJGm0KpEu7ayYnSRkRjUaKxKCA7lATBKpuz3kkTb1MUwungxCl3iez2A3fTWDOW8DKdnZXfdsESm7I3BKzaG+THMwszBljvmm6I0107TwV43OtCWcHNE6X0Qr/Kisqy23wuCJvFqjYlTUU8qb/HsvVObOHZiCXcUZIqyQILrl2/GCzh4J42lca7F6FoyFWMXr48hMcwOHu8M3Oi9EnfLHs7avng9gSmUrx4Ysu6jyEnSg9gpxhd/AEYHjj50pIY1bTApR9CIqqLplO/YM+1SkSMoPAnSuevnsdjeOg+2p2xN1QHqzl/9TyJRAKfz8fpY6cL+pwk8U4oRaxq09OHWjP3vfXJKJ8/1GZBm6SJl4WdlvDl2jSf0qbQDISm4dNzeh6qzLRpkUUU1pvUm2E1baoMVLqqTW65HaRQEiyRa5CDxzB4+fIwsBTmcPn+NJUBL+/fmuDFE50bPoZ07R7ATjEyPHDx+/p2IKg/VtXrQgng1C/ad60SESNTmQXv2nkMD+evngfA7/MDUFVRxYVrFwAKLkQgJ0pCaZLr7Gxam8Ip253XA69dHWUxmsxdm6SJl42dTbzl2jSXmp0d+wwu/QhuvmazNpWGzdgNS/hybUoXShWBCte0ya0
dSiCFkmCRXLt2Z49rsXn58nDWbFJaiNKfXw/p2j2AnWJ08iX98eL3oW2vvh1NFQmHXlj6vB34S0OMFlnEdMLauA7dR7sB3b1rb9b2kkhEz6Ed2Xsk8/lCIidKQimSaxNvuTYB+L1ekmZStGkzOKVNlctei9JFkp3aVCJNPDcs4cu1qbJCr4sYnx4H3NEmN3VJCiXBElZ84I/vb2E2FOf9WxOZ+x7ZVs/hrnoGJkLUBf3UBf1rfr9Y7x7Abh/4yZcgHoarf6X/PtWnP7bsgon7+nawAYKNm7tOqYiRS8Oy3Ue7icVjXL55GYCJGf370trcytiU7qhWV1VTXeX8v6PsUBJKFavaNDgZ4lrfbMYaLtq0CexOYz14BkJTcPP1pft2nILtJ7Q22aFLAL7g5h+jALgVMtR9tJtoLMqVT68A0DPYA7ijTW46HaRQEixhJRr8vVvjWUUSwCf9s3zSPwvA2eMd63rBJczhARIh+x/Tt8pR9tvfWrp98iub94OXSKE0xZRr1/Z5V74Unzt/LnO7+2h3QawODTTIDiWhJLFSKL13a5xrfbNZ91nSJrGFL+FEGuvN17OLJIDei/oP2KNL3iowrIV4uIWb2pRIJlbc55Y2uYUUSoIlTAti9OSBVmYW4nx4ZzJz3yPb6vlSytqwXscOpGu3gqQDhVJ8FYF7+hv6VAl0525TGFqQSoBBNejatRfDiyvuO3P6DK1NeuC8EB07gE5jY9uRIBQjSQtNvCcPtNI7tsitoaVTZGvaJE28DMkItqexHnoexu9B/+Wl+3ac0gUS2KBLlMx8UlIlGVbDrl1/Zn5mxX3lpk3y2y5YwsqJ0ge3J7KKJNBduxsDs3S1BDcUIxmYXYZS9p8oXfoRXPvP+rbXr8UJtLWhZZf+Y4ftzij+lxlTmQypIVeufeHaBW7cvQHAltYtHNl7BIDxyXHamtpoa2ormBh1GB0FuY4g2E3SQhPvg9sTmSJpR4u2X4k25UlyZZNn03x6bqlIaj+gP/ZehL7L9ugSlIzTYZxx4sRdufaFaxcYGBkAdHiDm9rUbjgUEZ8Dxf8ORigqchWjV64M8/LlYZ45rLsO/pRV4YkDLbx8eZhXrmzcIZGu3TKSYbAzHvTSj/Sw7N6n9d/r2uFgqlC6+Zr+vB2UkBjFiBX8uheuXeD81fM0NzQDsLV9K4f3HQbg+p3rmYShQiEnSkKpkuuJUlqbDm/TO2H8Pq0zuWqT19DJeUIKJxp4F78Pbfv032ta9MdDL+j77dKmElk265bTIa1NPp82nrmpTc00u5Z4B2K9EyySqxjpXRSdHNlez09vjBPwezhztJUnD7RSH/Rj5vA44gNfht1ipEydIBQIwp23oa5D2xlOfkXvUVI2WSlKpFByS4xMZfK5o5/jkzufAFqMqquq6T7aTSKRwLTr/0MONNBAlVEaNklBeJBcm3hpbfJ7PdzonyNY4ePs8Y6ctUlmZx/AKW0av6v/3rQN6r+iHQ/BRhu1qTSsd4Ome9p0dP9Rrt2+hs/ro725nUgs4oo2ud3Ak0JJsESuYpQehL0/qiOnK/2+zH25xK+C2BuysNvekB6Efe+7+mN9pxYhuxb5pSkVMXKpUDp97DQzczN8eO1DPB4PHS0drizyA7HdCaVNrk28tA69fFlbbWuqrGmT6NIDJBzSpn//j/XH1j2wVVu+yi0aPK7ijDLqyrVPHzvNtdvXAOhs7cTr9VJdVV2W2iStEcESVgZmAWIJ3XVYvkspV8R6twwnEu8AZlM2k3qHXohKwN4QV3FG1Ihr1x8c00VaukhyC7fFSBA2g5XUO4BYPKVNPms6IyFDD+CENplJmEsVCE5ok+EDj3tWrlwZVsMF3+23nIFRPZ+0tX2ra88B3NcmeScqWMLKwCxANJGfGIF07rJwrFBKFQj1Dh1tl8CJ0ogacVWMBkd1oeS2GLltbxCEzZCLnXs56SZewG8tIlqsd8tQypk01oUJUEkdMlTdZP/j+6qhBObM3Ex
iVUotaVObe9pURx3VhrsNV/mNFyxhJfUOIJZa5mdVjDwyMJuN3fYGgGQCFvSmbUe6dp4AeNZPjyoG3BajYujaBQm6uvlcEDZLwmKvI98mnjTwlmFGdUFjN2mnQ12HM6mpJWC7A3e1aWp2ikg0gs/ro625zbXn4fZpEkihJFgk3xOlgGV7g/xoZnCqazc/qh/bXwlVDfY/vojRhszMzxAKh/B6vHS0uCcInUanLJoVShqrtvBouokn1rv8KVmnQ/FrU1iFmWRy4y90iPRpUno+yS2Kwekg70YFS1gXI+nabRrTxhS65WR17Rz49y4RMZpgwrXrp8WovaUdn1fmkwQhX6w28ZbmZy1a77zytilDqc7OloAl3M0GHoglfDnyGy9YwroY6a6d1TAH6dotw/GuXfmKkVtLZtOkxairvcvV51EMYiQI+aKUKlgTT7RpGU4sm4Ulbaor35Ahty3h6ZAhNwulKqqoo86166eRQkmwhOXUu3jaeicDs3njxHwSiL2BIhCjIujaBQjQhAMD04JQICz274ClJl7AYhNP3A7LcKqJN1fe2qSUYkANuHb9yZnJophPKhZLuLwbFSyR94ySiFH+OG1vcKprV+RiBEUwnxTR80ntLe2uPY8Oo6MoxEgQ8sVqAw+WTpSsNvFkfnYZjoQMxZ0NGfJWgeHezE0uzDHHAguuXT99mtTZ1onX496/VbFYwuU3XrBEvgOzYm/YBE4EOYDDXTsDfEEHHtc+5tQcc8y5dv3BkdT+pNYOV+eTxHYnlDpWdyhB/jv+pImXQilnmnhzY6mQoSqoqrf/8aWBt/H1xRKehRRKgiWsRrDKwKwNONG1S0RhcUrfdqJr5ws6E+tqI66LURF4wKF4unaCkC/5nSjl18QTW3gKMw4qYf/jLg9ycCRkqPhnZ8USXlyWcPmNFyxhdanfkr1BTpTywqmuXXo+qaIGKh3YnyNitC7FsszPi5dWWl27viDYgVVLuGkq4kn9PVZ3/Ik2pXDc6VCelnCllKvaNDkzSTQWxe/z09rknja0G+14iqTZWhzPQigZrFocYrLUb3OYMYe6diJGborR9Ny0nk/yurs/qY02vEXu1xeEjbAcMpRcskZYbeKJNqVwLGQoPTtbnkEOE0wQJera9bP2J8l8EiCFkmCB/CJY80sWkoHZFI6lCpW3GE0xRYSIa9fPiFGLLPMThM1ieW1FyulgGOD3Wit8RJtSlOraiiKPBnfdEl4EtjsoLm2S33ghZ/KLYM1zRkm6dhqn7A1lfqLkZvQqFI8YFVPXThDyZTMhQ1YTH0WbUji+bNaBN8qGFzyV9j+ujbhuCS+C2VkPnqKyhEuhJOTMZiJYxXqXJyW7Q6m4Z5RcF6MiKJQMDNoN92LJBcEu8l9bYf0012fxBOqhxYlls/EIhKb1bSfWVviqnQmIsImESjCiRly7/vL5pLYm9/YntdGGz3AvCfZBpFAScsaqGAFE00v9LIc5yI8mUICunQNi5PGDN2D/49pEUiUZVsOuXX96bppwNIzP66O92b1CpZlmAkbx/n8ShFxJ5LkI3WoDD8BXxG+0C4oj0eDLQ4YcaLYVudNhVI2SwIGZ5BxJN/C2tG3B4+J7sGJzOsi7USFnrJ4omaYikWeykJwopXBCjKKLEEntD3Kka1fcp0mjuCtGAyPa9tfR2uHqfFKxiZEg5Iv1E6X8Gng+jyHLmUFHg5sx+x9XnA6uXn9gVGuTm0msUFzzSQDFc7YlFD25Jt69fHkIj2HwzOGlo9uffjLK5w+18cHtCUylePHElnUfQwqlFHbNKF38gd5rdPKlpa5dZR1c+896p5KvAk79gj3XKvKu3aBZWDE6f/U8HsND99Fuff2UB1wpxbuX3sXn83H62OmCPicoPjEShHzJtYmX1qb2Bj2n4vUYvHx5iCcPtOakTaJLKexs4C3XprTTobpJ319u2lTgQmm5NimlGBobAmBmfsZVbSo2S7gUSkLO5CpGHsPg5cvDRFIDswb
w2tVRFqNJ3r81wYsnNn6DJtY77O3aGR64+H19uy71IlTdBJd+qG+f+kV7rgMiRg/gMTycv3oegMeOPJaxNwyODjI4OuiKEIGcKAkPD7meKKW16cj2+szfX7kywnw4kZM2iS6lsDNkaLk2zY3qj5V1DmlT8Z4oRVWUccYLes3l2rRz606isSg+r48bd28AuKJNzTRTYVQU/LrrIYWSkDO5itHZ41psXr6su0N+n0EsoTJClP78esjALPZ27U6+pD9e/D50Hk49fqoIO/TC0uftoIjFKKZijDFW0GumT5LOXz1PKBIiEo1gYKBQHNl7JPP5QlJPPUEjWPDrCoIT5NrEW02bgJy1SU6UUtgZMrRcm6qb9O20Bc92bSre17whNYQij2jhTbBcm4bH9e9EZUUlC6EF17SpGBt4UigJOWNlRunx/S0MTYW52jtDLKG/75Ft9RzuqmdgIkRd0E9d0L/m98vALPYn3p18CeJhuPpX+u+z+pidll0wcV/fDjZAsHFz1yniEyU3xAi0IMXiMS7fvAyQeQ6tza2MTenCrbqqmuqqwvzbie1OeJiwMqP0+P4WbvTP0jcR4rPhBSB3bfJLoaSxe3b2QW0auqY/2qlN3krwFO9bXrfmkx7UpoWQ/p0QbVqieH9qhKIj1xklgPdujXO1dybrvk/6Z/mkfxaAs8c71vSCy8BsCieCHHyrHGm//a2l2ye/sjk/uOEp6q5dj+px7do+78qX23Pnz2Vudx/tLpjVYZexqyDXEYRCYFWb+iayX1tz1yax3gHOrK1YrRFrpzb5avP/XocxlUmv6nXt+mqVf3s3tMmPny6jy/HrWEUKJSFn4qaZ89c+eaCVvvFFPh2cz9z3yLZ6vpSyNqx7miRdO01iwf7HjK9SfD39Dd25A9212wz+Bl0sFSFRFeWuuuva9afnp1fcd+b0GVqb9GK9QnXsmmhim7GtINcShEJgVZuu9swwMhPJ3CfaZBEnCqX5VeZz7NSmik06JRykX/WzgAN6nyMj4yt3N7mhTYeMQ0U3nwQSDy5YIJ7MvWv3we2JTJG0vUWfMHzSP8uNgVm6WoLripHYG1LYXShd+hFc+xt9u6IGDj2vb0/c12LUsmvztrtA8YrRZ+oz12LBL1y7wJ3eOwAc3nuYI3uPADA+OU5bUxttTW0FE6PjnuNyYis8VMQtnCh9cHsiUyQ9fUi/ERRtskAyZn80+KUfQc+H+vaeJ/RsEpSNNt1UN1279vmPzzMyqQulF59+0TVt8uDhmOeY49fJBymUhJzJtWv3ypVhXr48zKGuOmBpV8UTB1p4+fIwr1xZf9mn2BvQNgQ7u3aXfqSHZXec0n9v3gkHU4XSzdf05+0g0GDP49iMUoob5g1Xrn3h2oVMshDAowce5fA+Hahx/c51Lly7ULDnUkste4w9BbueIBSCWNKaNrXW6a51RWq/n2iTBew+TUprU0PKctW8Ew5+Qd+2TZsM8Nfb8Dj2s6AW6FN9rlz7wrULXLiu9ac2WMvurt2uadN+Yz/VRnHON4v1TsiZXE+U9C6KTjyGwc2BOWqq/Jw93sGTB1qpD/oxNwiFEHsDkIyAStr3eMrUMavhGf33lp3aynDyK3pXhcrdurIuRdq1G2WUaVZa3wqBqUw6WzoZnhhmW8c2mhuaWQwv0n20m0QigWnXv30OHPMcw1Ok1khByJdcT5TS2vTZ8Dzjc1Hqgz7RJqvY7XRIa9Nnb+u/N++0X5v8tUUb5HDTvOlKwBCAaZoEK4OEIiGOHjiKx+OhuqraFW161PNowa5lleL8yRGKklxPlNKDsH/1kU5xqavyZ+7LKRpcxMh+MUoPwf7l/6I/Nu/UVga7FvmBTrvzBux7PBtx6zQJ4MShE3z86ccAHDugrQXVVdUF31FRSSUHjAMFvaYgFIJ4jidKaR26lgoaaqqt4KlDejF6Ltok1juc0aZYaGmXUstOvUfJTm0q0gaeqUw+VZ+6dv2tHVu5cP0CPq+Pw3v0SZI
b2rTL2EWD0VDQa1pBWotCzsQszCgBRGL6RKQyYO3HTJb64cywrGnCVOqIv3mn/Y9fpGIUURHuqXuuXf/W/VvE4jHqa+vZuXWna8/jqOcofmPt+QtBKEWUUpZmlIDMMvTKlPUuV6SJhzPaNJnSpeomXSTZTZFqU5/qI4QD6bY5cvXTqwAc3H2QyopK157Hcc9x166dC0X9jvSb3/wm3d3d1NbW0tbWxpe//GVu3brl9tMqWxIWkoUAwiJG+eNE4t3csLYy+Cqg3oFdBUU6n3Rb3SaJjTZGCyilsk6T3ApR8OPnEeMRV679MCLaVDwkLOz3S7PUxLOoTd6ifstUGOIOaNNkj/7oRAMPirZQuqHcczrMzs9yb0A3EB894J7tbYuxhTajzbXr50JR/9a/9dZb/OZv/iYffPABr776KolEgrNnz7K46EBHQ9gQKxGsANF8xUgKJWe6dhM9+mPTdnDi1K4IxUgpxU3TvUShvqE+ZuZnCPgDHNp9yLXnUayxq6WKaFPxYCWNFfRrQiSutcxqE6/srXcqCUkHTkDShVLLTvsf21Ohl80WGfNqnn7V79r1r97Wp0nbO7fTWO+edh83jrt27Vwp6hmll19+Oevvf/qnf0pbWxsXL17kmWeecelZlS9WrXfpE6Uqi4WSWO9wuGu3w/7HNnzgq7H/cTfJMMPMMOPa9T++pU+TDu05RMDvzvxWMceuliqiTcWD1QZePKlIpqx6VrWp7FPvnFiCDktNPKcs4UW4DsHNBl4sHuPmXX39Rw+6d5rUQktRLph9kKIulB5kdlZvzm5qalrza6LRKNFoNPP3ubk5x59XuWBVkDL2BrHeWcOMgxnd+Ous4mTXTsRoBVOzU/QN92EYhqvWhmKOXX1YEG1yD6snSmldMoCA31rhU/ba5IQlPBmH6QF924lCqQgXzSZVklvKPavuzXs3icVjNNQ1sL1zu2vPo1R2+pVMe0QpxT/6R/+Iz3/+8xw5cmTNr/vmN79JfX195s+2bbKB3g6SpsLivOySvUGsd9ZwwnanlMNduwb7H3OThFXY1RCHq7e0tWHX1l3U1TgwoJwjxRy7+jAg2uQulht4KadDhd+Dx+KbtLK33sUd0KbpAW3pq6iGmhb7H78ItalX9boW4qCUymjTowceda1QqaOOXcYuV65tlZIplP7+3//7XL16le9973vrft0/+Sf/hNnZ2cyf/n73PKAPE1bFCPI/USp7650TXbvFKYgugOGBRgfeoBXhfNItdQuTwu2BWE4kGuHTezr21U1rQ7HHrj4MiDa5S67R4GnyDXIAaeI5ok3LG3i2v2n3gN+9JtVauBni0DPYw+z8LBWBCg7uPuja83jU82jJ7PQrCevdP/gH/4Af//jH/PSnP6Wra30/Y0VFBRUVMrRsN1bjV/XAbH7x4GUvRk507Sbv64+NW8HnwKxMkXXt3A5xuHHnBolkgpbGFra0bXHteRR77GqpI9rkPoWKBgfwloBNyFGcKJScTLwL1INh/f+zk8yqWQbVoGvXT8/NHt5zGL/PnXURVVSx39jvyrXzoagLJaUU/+Af/AP+w3/4D7z55pvs2lUax3QPI1a7drGESTq1VWaULOJ0185u/HVFt/V8UA0yhzszIKZpZhKF3LQ2lELsaqki2lQ8xAp0ouT3GCUxT+EYSjm0Q6lHf3RqdrbIcLOBNzkzycDIAIZhcHT/UdeexzHPMXxGcb1nWI+ifqa/+Zu/yb/7d/+Ov/zLv6S2tpaRkREA6uvrqaqqcvnZlRdWu3bhlBh5DAj4ZOGsJRwRo179sUzmk24q98ToXv89FkILVFVUsW/nPteeRynErpYqok3FQ8LyiVJ+0eBl38AzI3qWyNbHNMtKm9wOcUjv9Nu9bbdrc7MBAhwy3FuVkQ9F/Y70//q//i9mZ2d57rnn6OzszPz5v//v/9vtp1Z2WPaBZwZmvZa7cD5vGQuSMqVrt0lCKkSP6nHt+lc+vQLAkf1H8Hnd6UWVSux
qqSLaVDzErC5Cz3u/X1G/XXIeJyzhcyN6Cbo3APUOWJSLTJvuq/tEiLhy7XAkzK0eXaS5mcJ62Dhccjv9ivpESeWxcVtwBss+8JgWL6t7KqDMO3eJEGDzz31kHhYm9G2n9lQUEW6GOIxOjjIyMYLH4+HIvrUT0JymVGJXSxXRpuLBcjx4njNKZZ945+h8kgNL0L1B8BbXG3I3nQ6f3PmEZDJJa1Mrna2drjwHL16OeNzTxXwp8xaJkCv5nijllSxUzm/wnLTd1bZBIGjvY3sC4C0eq5HbIQ5pa8O+HfuornJnd1Epxa4KwmbJd79flYQMWaPUZmeLzHY3o2YYUkOuXDtpJrl2+xrg7txsqe70k0JJyAmr9obNLJst6064k127Mlg0O6AGmGfelWsvhBa403cHcNfaUEqxq4KwWfJdOGtdm8r8d8pJS3gZOB3cbODd7bvLYniRYGWQfTvcmZs1MEp2p1+Z/+YLuZJ3BKt07axRcl274hIjN/dTXP/sOqZp0tnaSVuzO2lzpRa7KgibJd+Fs7II3SJxm7VJKWebeBXFo00JlSiKEIcj+4/g9boTl77L2EW9Ue/KtTeLFEpCTuS91E984NZwZIdSj/74kBdKi2qRXtXryrUTyQTXP7sOuLtgttRiVwVhs+RrvcsnHrxsMeNgRu19zMUpPT/rxBJ0wwu+WnsfcxPcU/eIYvO/X46MTIwwOjlaFHOzpYoUSkJO5BsPLslCFlDK/hOlRBRmU75o27t2HggUz9bzT9WnKLuDMHLkds9tItEItcFadnftduU5lGLsqiBsBqWUZetdOM8wh7LWJidtdw0OLEEPNBSVJbwY5mb379xPsNLmGeUc6TK6aDVaXbm2HUjrUciJXE6UXr48hMcwOHu8M9O1M1L3xxImAZ+HF0+sHwFa1vYGMwYqsfnHufgD3aU7+RJM9ukCrLIWbr6uCydfBZz6hc1fx19XNFvPTWXyqflpwa53/up5PIaH7qPdKKUyYlRfV8/7V97H5/Nx+tjpgj0fKM3YVUHYDEmVW2tkNW261jvDjtZqPrg9ganUhtpU1idKdhVKWdrUk7rTgNA0fHpOr8ewQ5uKyOkwpaYYYaQg11quS6DnZj/r/QzQTYXzV88XXJeg9Hf6SaEk5EQuJ0oew+Dly8PAkg/cMOCVK/pF4sUTG0dSlnWhZNdpkuGBi9/XtytT9oO6Drj0Q3371C/ac50i8oD3q34WcGC+aw08hofzV88D0NnWyeTMJF6Pl4GRAQZGBgouRqUauyoImyHX06RsbdJNv4/uTuH3eXj/1oRo00bYNZ+0XJvSs7PTfXDpR3DzNfu0qYgKpUKeJi3Xpe6j3ZmkO4Bb92+5UiS10soWw4EdWQVECiUhJ3LxgZ89rsXm5cvDtNXrzvbgZBiAJw60ZD6/Hv6ytjfYJEYnX9IfL34fWlIx0cm4/njohaXPb5Yiil8t9H6KdMfu/NXzNNQ1AFBXU8f03DRH9h7JfL5QlGrsqiBshlznk5Zrk3dZwZMuknLRJp9XtGnTLNem5asq0kXSQ6ZNcRXntrpdsOst16WkmczMzQKu6BI8HDv9pFASciLXzt3Z451E4knevD4GwP0xfWS/rSXIwEQIgLqgn7qgf9XvL++unY0+8JMvQTwMV/9K/z2TLrQLJu7r28EGCG6i81YkXbsFtUCf6iv4dbuPdjO7MMun97Tlb3puGoDW5lbGpvTPf3VVteP7lEo5dlUQNoOV+aTH97cwuxjn/dsTmfse2VbP4a56BiZC6+oSlLk22TmjdPAMzI3BZ28t3bfjFGw/obVps7rkqwHP2v8fC8k9dY8YsYJes/toN7F4jI+uf5R1f6F1CaCeenYaOx2/jtNIoSRsSMI0SVrYRB/wrey8/ft3l97Inj3esaYfvKKcu3bxWZsfcBVhf/tbS7dPfiV/P7ivBryV+X2vzVwwL7gS4pBIJOgdXJmyd+78uczt7qPdjtsdHjUeLdnYVUHYDJFkMue
vfe/WeFaRBPBJ/yyf9OvX3fV0CcpYm8y4vYXSzdeziySA3ov6D2xOlwAqWvL/XhuJqziXzEvuXDsRX3FfoXXJwODzns8/FDv9pFASNmQxnrsYAcQSK+0QX31qO11N+qh9va5d0GIS0UODGYfYjL2POd2/8r6nv7Fkxws25P/YVR35f6+N3DPvFdTasJx3Lr1DOKqtpYZhoFLNhDOnz9DapBN+nO7abTW20u0pvJ1CEIqBkAVtevJAK0OTYa73LzWkHtlWz5dStrv1dAnKWJuiU2BnI+rQ83DnXZgbQTfzlD5ROvkV/fnN6BIUjTa9b77PHHMFv248EedO750V9xdSlwC6Pd10ebocv04hKP1ST3AcK4XSK1eGM7Y7gNP7mgHonwjR1RKkqyUohdJq2C1Gl34E/Vf07eP/hZ5NAm1taNml/2zG3lC1saffaRbVIm+bb7ty7Tu9dzL+7wO7DvCbv/SbHNmrwxTGJ8dpa2qjranNUUGqoYbnPc8/FB07QcgHK9r0we2JTJG0takK0CdKNwZmN9QljwGV5XqiFJ3Y+GuscPONVJEEfP7r+mPvRei7vHld8lQUhSW81+wt+Nxsmh+9+iMisQh+n59ff+nXC65LADuNnSWfdLecMv3NF6yQa9fulSvDvHx5mCcO6KPv2iofTx3UHYz3b03wypXhDR8j6CvXQslGMbr0Iz0s600J//aTcPAL+vbN1/TnN4OvWlvvXEQpxVvmW0SIFPzas/OzvPreqwBsad3CF5/8IgCH9x0G4Pqd61y4dsHR5+DFy1nvWaqMKkevIwjFjFVt2rdFp4Cmi6InDrTw8uXhDbWpyuct+YH0vLFbmy79QN8OBKF5h7596AWtWZvVpqoO1/cnhVWYt8y3Nv5CB/ibt/+G8alxAH7m2Z8hWBUsqC4BNNDAGc+Zh+r3Rax3wobkKkZ6F0Un7Q2VvH9rgqaaCuqCfs4e7yCWMDFzmHOqKtsTJRvFSJmw/1m4/ZaOB2/dC5FZbW1IRPXnN0MRiNENdYN+tYq10GGSySQ/eecnJM0kNcEavvzClzOfq66qpvtoN4lEAnOz/8Yb8HnP50t6gZ8g2EGuJ0ppbZpZjPMZ87TVV7CtpYMnD7RSH/RvqE1l63RIhO2dT1ImdByEkU9h26NQ06x16dDz+iTJDm1yEaUUPzV/Sphwwa89MzfD/X4d1NR9pJttHduAwuqSHz9nvWcJGDYvEHYZKZSEDVmM57YENT0I++b1UQCaagLUBf0bLvJLU+Xz4HmIuhA5Y7cYnfoF+ODf6NvbjoPHo0XIjkV+AJXu2u5m1AwfmB+4cu33rrzH2NQYFYEKvnL2K3iWxdlXV1UXZE/FIeMQBz0HHb+OIBQzSqmcm3hpDfr//UQv3+xsDPK5lC08l2jwsi2U7LbdnfoFuP+hvr39ZLYubTYa3BOAQNPmHmOT3FK36FE9Bb9uuoFnKpMtbVuyYsALpUsAz3meo9Fw3/poN2K9EzbEysAswNSCjsNsrLHWVRAxspG+y/rj9lP2Pq43CP5aex/TAkmV5I3kGyTIrXi3k/sD9/n4048BeOGJF6itLvy/QxttPOV5quDXFYRiI5q0lsYKm9AmsYTbw/y4DhkyDOg6bu9ju+x0mFNzvGe+58q13738LuPT41RWVHL2qbNZDbxCcdw4zm7P7oJftxBIoSSsi1LKcurd1EIU0CdKVhAxsomZYZgdBo8Xuo7a+9gui9Fl8zLjjBf8uvOL87z2/msAPHrwUXZ17Sr4c6iiii96v4jXKNPfE0FYhtUGnqkU04u6ULKsTeXYxFMKopP2PmZfKi67/QBU2jznWume7c5UJueS54izMpbbae723+XqrauAbuDVBAs/P/ywp69KoSSsS9xUJEyLXbv5lBjVVlj6vrKcT3JEjFL7KDoPZW8/twMXPeCjapRLqvB7KZKmtjVEY1Hamtp48viTBX8OBgYveF6gxnA3REMQigWrDbyFcIJEUmEY0FAthdKGxOf
AtHlZarpQ2n7S3sf1+KHCPdvdx+pjRhgp+HXnFuZ444M3ADhx6AQ7t+4s+HMoh/TVh/e/TLAFq2KklGJ6Qbp2OeOIGDllu6sCvzuLTeMqzrnkOVcWy3549UNGJkYI+AN86fNfwust/M/p457H2eLJbdZPEMoB65Zw7XRoCAbweqydipel28Fup0MsDEM39O0dNhdKlR3g0hv1CTXBR+ZHBb/u8gZee0s7jx9/vODPoVzSV6VQEtYllGOQQ+bro0miqYWz0rXLAbvFKLqgE4UAtp+w97FdtN19YH7ALLMbf6HN9A71cvETfUL3hdNfoL628IXiHmMPRw2bLZSCUOJYt4TnN58EZep2sFubBq+DmYC6dqi3uenjktMhoRK8kXwDE2fT5FbjgysfMDo5SkWggi899SW8nsL/jJZL+qoUSsK65CtGtVU+Aj5rP17VvjIMYbRbjAau6ojVhq1akOzEJTHqNXu5oW4U/LqL4UVee0/PJR3Zd4S9O/YW/Dk00cSznmcfqp0UgmAHVpt4U3k6HcoyjdVMQnTa3sdMW8K3n7S34Wb4oaLZvsezwHnzPNPY/O+UAz2DPVy+qZ0jX3j8C9TV1BX8OZRT+qoUSsK65GtvaKqxNp8EZdi1Uw6IUa9DHnBvJfgb7H3MHHBreZ9pmrzy7iuEo2GaG5r5/KnPF/w5BAhw1nsWv+Ev+LUFodix3MTLzM6K02FDYlNg5ymJMqE/bQm3WZuq2lyx3Q2YA1xX1wt+3YXQQiZY6NiBY+zZtqfgz6Hc0lelUBLWxaoY5TufVOH14LPoGy95ojaLkZmEgSv6tiMe8ML+/3Fzed9Hn3zE4Oggfp+fF59+EZ+38KedZzxnqDfcmQkThGLGyg6lNNN5NvFkPskGxu9BeA78VXrhrJ1UFX6vX0RFeNN8s+DXNU2TV955hUg0QmtTK0+dKHyxUkll2aWvSqEkrEuhdiiV3WkS2C9Go7chuggVNdC2z97HdsF259byvoHRAS5cuwDAs93P0lhX+AV6J42T7PTsLPh1BaEUCCdMy7Eust/PAhGbtSmddtd1DOxsOhk+V2x375jvsIiNS+Jz5MK1CwyND+H3+fVcUoGDhQwMvuj5Ytmlr0qhJKyJ7tpZ9YHLDqWcsbtQSovRtuN6h5JdeCogUNhiwa3lfeFImFfefQWlFAd3H+Tg7sJ7sLcZ23jM81jBrysIpUJhdyiV2exsMgqJeXsfM20J32FzEmtlGxT4ZOOOeYe76m5BrwnQP9LPheu6gXfm9Bka6hoK/hzKNX1VCiVhTfTmc2vfk+8OpbLr2iWjELdZjJzaUVHgtDu3lvcppXj1vVcJhUM01jXybPezBb0+QB11fMHzBQlvEIR1WLTYwJMdShawu4G3MAlTvVpDtj1q72MX2Ha3oBZ423y7oNcECIVDvPruqwAc3nOY/Tv3F/w5lHP6qhRKwpoUcodStYjR5pgdgZkh3V2zXYwKa7tza3nf5RuX6Rvuw+v18qXPfwm/r7AhCj58nPWepdKoLOh1BaHUKOgOJdGmzZFu4LXth0ob09kML1S2ue6xXgAAU/pJREFU2Pd4G6CU4px5jhg27z3M4bqvvvcqoUiIpvomnn7s6YJeH6CRxrJOX5VCSVgTq2K0mR1KZTej5JQYdR6EQNC+x/UEIFC4jeduLe8bHh/m/Y/fB+CZx56hpbFwApzmac/TNBvuxNwKQilRyB1KZWULV8q5+SS7nQ4Ftt1dU9cYUkMFu16ai59cpH+kH5/Xx4tPv1jwBl6AAF/yfqms01elUBLWJN/Eu3x2KJWfGE3a+5iOiVF7wWx3bi3vi0QjvPKOnkvat2Mfh/ccLuj1AY4YR9jvKbydQhBKEeuJd/mnsVo9gSppEgtgRu17vHgEhj7Rt21fgF44292UmuJD88OCXS/N0NgQ56+eB+CZ7mdoqi9c0zKNpK9KoSSsQ/5BDtZ3KJWVvSGxCGbEvseLhWD4U33b9vmkwonRh+aHBV/ep5T
i9Q9eZz40T31NPWdOnym4vaCDDh73PF7QawpCKZPviZLsUNoAu50OQ9chGYfaNmjssu9xDS9UtNr3eOuQVEneSL5BEms/c5slHAnzk3d+glKKAzsPcGj3oYJeHyR9NY0USsKa5BsNbrVr5/MYBLxl9KNotxj1f6yX19ZvgXob54k8fqgoTAdrwBzgmrpWkGst5+qtq9wfuI/H4+FLT3+JgN+6NWczBAnygveFstpJIQibwVSKcCJfbZIdSutit+0uswD9hL3OhMpWe5Nd1+Ej8yMmsdkBsgFKKV57/zUWw4s01Dbw7OcKPx+0zdjGKY/NKYUlShm9OxWsUigfeNmJke3zSamN57YvmW0vyMbzqIq6srxvdHKUdy+/C8BTJ5+iramtoNf34OGL3i9SbVQX9LqCUMqELeoSLC2blR1K66BMiE3Z+3j9KW2y3RJeGKfDsBrmirpSkGst58qnV+gd6sXr0cFChW7g1VLLFzxfwFMA/S8FymxBgJAruW4+f/nyEB7D4OzxzowPfHg6zFwozge3JzCV4sUT6+ful50YRTfZnbr4A13AnHwJzGViFJ6D8/8WfBVw6hc2/1wLZLt723zb8eV956+ex2N46D7aDUA0FuVvfvo3mKZJfU09kYiNVsgcecLzBB1G4Rf5CkIpk2sDL61NX3y0I9PEu947Q3t9pWjTasRmtDNhMyzXpon7EJrRJz/1nXDpR1r/Nq1NHn2i5DAxFeON5BuOXuNBXQLoGezh3Uu6gdfV0UVrU2Eshml8+PiS90uSvroMKZSEVcl187nHMHj58jCwNKN0c2COn1wZ5v1bE7x4YuM32yJGFjE8cPH7+vaWRyC6AL5K+Oyn+r5Tv7i5x4eCbTwv1PI+j+HJDMU+duQxzp0/x0JoAYDZhVk8nsJ2zvYb+3nEeKSg1xSEh4FcC6W0NkXjSRKphYBv3xwnYSrRptWww+mwXJvSOmcm4eMfw83X7NGmylbwOP/W9V3zXRZYcPQay3Wp+2g30ViUNz5YKs7am9sdvf5qSPrqSqRQElYl1yCHs8e12Lx8eTgrHSgtROnPr4eIkUVOvqQ/Xvw+DF7Vt6vqYT4Ch15Y+vxmqHLedlfI5X3pjt35q+cZnRylZ7An87kje49kdfScpplmnvY8XbY7KQRhM+Q6O7tcmwBqK33MRxLWtKmcbOF2zCct16Zgw9L96SLJFm1y/hT+nnmP2+q249dZrktKKSZnJglFQgAc2n2Izx37nOPPYTmSvro6YkAUVsXKfNLj+1s4tqOBpLl0BvXItnoOd9UzMBFiLhRf9/vLqlCya1j24Beg4yCM3NJ/nx/VH1t2acvDxH0IbSJBrtJZMSrk8j6lFBPTE/h9fmqra7OKJIDW5lbGpsYYmxpjMeysBbCCCs56z+IzpEclCPlgJY318f0tbG/Re+XmI/r7RJtWwYxDfMaex2rbBw1d2naXZscpHeiwWV3Co/cnOciiWixYAy+ZTNLZ1kl7czsfXvuQu/1L7oqO1o6C6RJI+up6iFoLK4glTe5M5/6L+Z8uDHC1dybrvk/6Z/mkfxaAs8c71vSC76yvoqP6IffCKqXnkhbub06MzAT0XYHbb+oAB7XKvqG3v7V0++RXrPnBPX5dIAW3OLJk1lQmI4zQa/bSq3qZZdb2a6SZW5hjYHSA/uF+BkYHCEfCa37tufPnMre7j3Zz+thp256HBw8ttNBpdNJhdNBhdIj3WxDyZCocY3gxtz0/Sin+zVv36ZsIZd2fizZ5DDjWVof/YU9jVUkIDWlt2gzRRbj7Htw6p4uhB+m9qP+AdV0C8FXrmdmqLVqnbCamYgyoAXpVL32qjwjOzKymm3b9I/30j/QzPDZMIrl64e+kLoFeJNtutGd0qY02SV9dAymUhCzipsm7A1PMRnPr2n1we4JL95Y6RIah64JHttXzpZS1oS648oXN5zE42V5PV12VPU+8GFkuQolNeJ1nBuHWm/DZ2xBeVlxUNUB4Ru+USPv
Bn/6GPlWCbOvDWhg+bbOr2qJnkmy228VUjH7VnxGgKDYuM1xGOBpmcHSQgZEB+kf6mZ3PLsJ8Xh9b2raQSCYYGhvCMAyU0iegZ06fyQzMVldtLoHuQfFppbWsN5oLgl3MRuO8OzBFwtx4ejaRNPn+e33cHVl63c1Vm2oDPj63pYH6iof49zYZhcVeWOwDM89TfWXC0A3duLv/od6XBFpDqltgYUzfVqY+UTr5Ff35XHQJwFu1VBz5a21ffL6gFuhVvfSoHobUkGOLzmfnZ+kf6WdgZICB0QEi0ewiLFgZpCJQwfTctGO6BFBNdVbDrpFGSbXLESmUhAxJU/H+wDTTkfXtCKB3Wfz1xSHeuDaaue/s8Q6ObGvg9//Tp3zSP8u2luCqPvDGSj+f62ygOvCQ/vjZIULxCNx7XxdIo8u80lV1sO8ZSMTgxitLvu93/rX2gU/c17a89TC82r5QtQUqW/TfbWRezdOr9KmRUwKUSCQYGh/KFEbjU+NZnzcMg/bmdrZ1bKOro4uOlg4u3bjE+avnOX3sNN1Hu3nz/Jtcv3Od8clxHtmbX7BCNdUZ4ek0OkV8BMEB5mMJ3umfIp5DkRSOJvjTN+5xZ2QBA1DAiyc6OdxVv6E27ayv4lhbPT7PQzo/GJuDxfsQGoZ8X5cXJuH2W/rP/NjS/Y3b4MBzEJqFqz/W2rT9BPyH/1GfJrXs3nhGyVOhi6PgFvDX21ocKaUYZzzjaHBqN1IoEtJFUUqb5hfnsz7v9/nZ2r6Vro4utnVs427fXT689qGtugTQRFNGmzqMDmqN2s3+p5UtD+k7VcEqplJ8MDTNRHjjN/bxhMn33unlyv2lk6T0cOxAyubwxIGWzBDtckHa31TN4ZZaPA/jIPtmRUgpXRTdelMXSYnU6YvhgW3HtQhtPwFXfgxX/yp7OPbgF3ShdPM1CDauIkipSNXgFqhos3VZn1KKMcYyAjSFjbs4UpimydjUWEZ8RsZHSJrZc3RN9U0Z8dnavjVr98SFaxeyiiSAw/sOc/3Oda7fuU51sDqnQIcHxaeGGgllEAQHCcUTvNM/STS58Wvq1HyUb716l9HZCF6PQdJUOWnTQ+1wUAoiY9rZkO+epGRcFzu3zsHANUhn4vqrYM+TcPCMLoQu/4elIikdEQ46ZCidhvegNnkCOqChagsEGm0tjhIqwaAapEf10Kf6CBHa+JssEovHGB4b1qdGowNMTGfPIXsMDx0tHXR1drGtfRttLW14U/p74dqFrCIJ8tMlDx7aaMvSpgrD2nJlYW2kUBIwleLC0AyjOXi/FyIJvvP6XXrGFvF6DA5traNrWXeuLujn7PEOnjzQSn3Qj5k6Rq7weniss4H26ofsl9cOEQrN6GjvW2/B7NDS/XUdcOAM7Ps8VC+bGVLmygShYIO2NiSiy2aXDF0cVXXqEyQbvd1xFWdQDWZOjsKsPQOUD0opZuZmsiwLsXh2EV8TrMkqjGqCNWs+nqnMLDECbWfoPtpNIpHAXGXe60HxaTfaZb5IEApIOJHk7f4pwomNi6Te8UX+9Wt3WYgkqA/6ObytjvpgYENtemgdDmYCQgOw0APJPAuEyV5trfvsHb2GIk3nYd242/U5vbcvzYPalNalQ8/rBl76ddbwp4qjTqhostXyHVKhjC4NqkES5B7+kQtJM8nY5JjWpuEBRiZHMM3sn8/mhma2dWxjW8c2Ots611wYm48ugQ4FajfaM1a6FlokIMhBDJU2RD6kzM3NUV9fz+zsLHV1dW4/naJDKcXFkVn65jZ+ozs+G+Fbr95lYj5KZcDLr31hN/s6Nz7ObQsGeKyzgcqHKWp1syJkJqD/ij49Wh7M4KuA3Y/D/ueg40B+3bWKlpS3u11362xiUS1mCVCSTe6DeoCF0ELmxGhgZGBF0k/AH8gURl0dXTTUNth6mhMgkNWRa6VVxGeTyOvv2si/zfpEEyY/7Z9kPrbxG92rvTP827fuE08qtjZV8fUX9tBQvfFr30P
pcEiEUtbvflB5FAmZYIY3YeLe0v3VTdr2vf9ZqM8jFdXwQWU7BDu1RtlUHCmlmGJKa5PZyxhjG3+T1cefncpo0+DoIPFE9nhCbXVtRpe6OroIVgZtfQ411GTs3en5InEybA4rr7/yLqCMUUrx8dhcTkXSvZEFvvPGXULRJE01Ab7xxT20N6xvUzCAwy217G+qfnh+qTcrQjNDy4IZZpbub9unO3S7H4dAHi+ygaZUcdQBXntO7ZRSTDKpB17NHiawKdo8RTQWZWhsSCcADfczPZcdG+v1eOls7cwUR61NrbYuhhXxEYTiJJ40eXdg4yJJKcVbn4zxny4MooCDW+v4lTO7qNwg1vuhczgopZeZL9yHyEge32/C8E1trVsezODx6iCGA2dg6zGw+vpreHRxVNWp3Q02zcMmVZIhNZRp3Nm9GHZ+cX7JzTAykNltlKYiUJEpjLZ1bKOups5W7WimOdvibaztlhCcRwqlMkUpxScT89yb2fg05OLdKf7inV6SpmJ7S5Cvv7CH2qr1bVxBn5fuLQ00V9l3ouEamxWheATufZAKZri1dH9lHex7WhdIjV3WH9ffoLtzVZ3gtccSllCJLAFaxL79DclkkuGJ4UxnbmxyjAcPtFubWpcsC62d+Hz2vUSl54s6jU7ajXYZbhWEIiRhmrw3OMXMBsmrSVPxH8/38+6nuoHz5MEWfv70tqzF56vxUDkclAnhkdTqiTzWLawZzNCli6O9n9cBQpbwPGD5tuc1PKzCmQTVftVPnI1Dp3IlEo0wODqYKY5m5meyPu/z+uhs68wUR62NrbYVRl68KyzeMl9UXEihVKbcmlrg9tT6b4KVUrx2dYS/uaQHX49ur+drz+4i4Fu/q7S1ppITHfUESn0HxWZESCkY+2wpmCGeigQ1DNh2Qlvrtp8Ar8VfQX9d6uSoE3z2HO+HVZg+1UeP6mFADdjm6V6+M2JgZIChsaEVOyPqa+uXLAvtXVRW2FPwifgIQumRNBUfDE4zGV7/TXA0nuTfvHmfGwNzGMDPdW/l2Ufa1n3z+lA5HMyYdjUs9IJpcedPMg69l/Tp0eBVrVWwFMxw4Dlo3WPR9m08YPne/DysUooZZjKWulFGUdgzKZJIJhgeH9Z79kYGGJvKtusZhkFbU5vWps4uOls68XrtKawrqFhh8Zb9RcWNFEplyJ2pRW5MrH9UnTQV33+vjw8/0xGazz7Sxs89thXPOt06jwGPttWzs76qtIVoMyIUmtG2uttvaptdmroOLUD7ns4OZsgFX81SceTf/BG8UoppprMEyC422hlRVVmVZVmorbbnVEfERxBKG1Mpzg9NMxZaP3l1NhTj26/eZXAqjM9r8LVndvLozsZ1v+ehcTjEF2CxR8/HrjHovyZTfUu276xghkP69OjBYIZcqGhOnRx1gHfz/7amMhlRI5n9RnPMbfoxQaemjk+PZ9wMw2PDK1JTG+sas8KBKgL2NNbqqMvSpgbsna0VnEcKpTLj/kyIq+Prv/iEowm+e+4+nw3PYxjw0ultPHWodd3veSiW9OUrQmbygWCG1AuwrwJ2ndYiZDWYwRtcstX5Nr9sL6mSjKiRTEyqXQIUjoQz4rPWzogtbVvY1qntdE31TbaIRC21WfuLRHwEoXRRSvHR8AwjGySvDk2F+Pard5kJxamp9PHrz+9hZ9v6yzi31lZyor2EHQ5KQXRCBwdFxzf88ixiIbjzrrbWjd9duj/YqEMZ8glmCDQuNe5smIeNqmiWpc6OpeRKKWbmZ7ICGKKx7MetrqrOCgdaLzU1VwyMFfNF1cbml8UK7iKFUhnRPxfm8uj6FrKphSjffvUuIzMRAj4Pv/LcLg5vq1/3e3bWBznWVleaS/o2I0IzQyl/908fCGbYmwpmeMJaMIO3ctkm8rpNF0dRFaVP9WUEKEaey2+XEU/EGRodon9UnxqtuTMiJUDLd0bki4iPIDy8KKW4NDrLwPz6p/efDs7xZ+fuEY2btNVX8I0
v7qW5du036iXvcFBJCA1p63fCQliBMmH401Qww/mlYAYjHczwHHQds7ZLz1+/zPK9+V1Tc2ouc2o0okZsWUq+GF7MSk1dCGX/mwX8Aba2b80URo11mw/v8eGjzWijgyWLd8Ao8VNLYQVSKJUJQ/MRPhqeWfdr+icW+fZrd5kPJ6ir8vMbX9xDV/Pab/R9HoOTHfV01Zbgkr58RWjdYIbP69mjpm25P156E3lVJwQaNl0czarZTBDDsBretKc7a2fEyAAjE2vvjOjq6GJL25Y1d0bkioiPIJQHSimujs3RO7t+8ur7tyb44ft9mAr2dNTwa1/YTbBi7bcvdQEf3aXqcEhGYLFP/zEtNLcWJlP7+N7MDmZo2Jrax/e0tWAGX+0yV8PmGlOmMrOWkk8zvfE3bUAsHmNwdDBTHE3NZu8x9Hg8dLYuBTC0NbVtOjW1ksqspNRmmsXiXQZIoVQGjC5G+XB4et23zNd7Z/jzn/YQS5h0NlbyGy/spbFm7TenJbukLx8RWi+Yoeu47tBtP5l7MIPHrz3dwS061nsTxZGpTEYZzQjQDDN5Pxa4szMiLT7pPy20iPgIQhlwY2KBu+skr5pK8Z8/GuLcdT1H+dieJr761HZ869joStbhEJvVzobwEOTa4EomoPeinokd+HjzwQy+6mWuhs1Z0eIqzoAayNi9I1ic932AZDLJyMQIA6MD9A/3Mzo5umpqald7F9s6dWqq37e5Qjk9X5QujOqpL83TSWFTlNi7XMEqE6EYHwxOYa7zuvvTT8b4yw8HUMCBrXX86nO7qAys/Ua1JJf05SNCoRm4844ukGYGl+6v64ADz+rle7kGMxg+nQZUtUUPwG5i2V5MxRhQA/SqXlsEaH5xPsuysNrOiLSVzo6dESI+giDcmlzg1tTap/mxhMn33u7h454ZAL50vJOzxzvWfK0oSYeDUhAZ1doUm9rwyzNM9WtduvM2RJbNhXYcXApm8OeYIOqt0sVRcMum52EX1ELG0TCkhja1lFwpxeTMZEaXBkcHV6am1tRrberUAQxVFfn/vzcwaKElq2kXNOxdHCuUJlIoPcRMR2K8NzhFco26wDQV//HDAd65qWdzHt/fwleeWHsPRckt6ctHhMwk9H+s/d3Lgxm8AdidDmY4mJuYGF69R6JqC1S2bGrZ3ryazxKgzXi60zsj0sXRgzsjvF6vDmBo19Gom9kZsXy+KF0YifgIQnlzd3qRTybm1/z8QiTOd167R8/4Il6PwVef2k733uY1v77kHA5mQocGLfRAcuNdhoAOZrj7ni6QsoIZGpYFM3Tm9lieSr2cPLhFzx/l+fqulGKCiYyjYbNLyecW5jKFUf9I/8rU1IqqrACGuhqrO56W8OGj3WjXRRHa4u03StCqKThOibyqCFaZjcZ5t3+KxBpHSdF4kj9/q4dP+nW4w88+toUzR9rXfENcUkv68hGhmWFtX/jsp/okKU3bXj13tCfXYAaPLo6CnVDRZm1gdhlKKcYZzwjQJJN5PQ48sDNidIDxqfEsy0LWzoiOLjpaO/BZ3e+UIiM+qfmiNqNN5osEQcjQOxvi47G1UzfHZiN869U7TM7HqAp4+bUv7GZv59prBErK4ZAIwWKvXj+hcthXpxSM3IRP30wFM6Ts4plghmeh69HcdMYTWDYP25h3cZRQCQbVYKZxFyJHjV2FcCTMwOhApjCaW8j+uUinpqaLo+aG5rybdlVUrZgv8mzC2SGUD1IoPYQsxBK80z9FbI0iaS4U59uv3WVgMoTPa/BLT+/k+K7V91AYwCMttewrhSV9VkUoHtHic+tNGPl06f7KWj34mnMwg7FsE3l73pvI4yqeEaA+1Ze3AK3YGTE+TDLpzM6ItPikBaiJJpkvEgRhVQbmw1wcWTt59e7IPN95/R7hWJKmmgDf+OIe2htWt1OVjMNBKYhN68ZdZCS371mc0mmqt9+EuWV77jLBDJ+HqvXTaAEw/PrkqKoTKprytnyHVCiToLq
ZpeTxRJyhsSG9Z29kgPHp7KRZwzCyUlPbm9vzXvTaQEOWja6OzVnGhfJFCqWHjFA8wdv9k0STq1uzhqfDfPvVu0wvxqiu8PH1F3azs231oc2g38vnOhtoKuYlfVZFSCkYu6MF6O77EE+lLRmG7swdeA62n8ohmMFYWrZX1ZH3JvJFtZglQPl4ugu5M6Ke+qzCSMRHEIRcGF6IcGFoZs3PX7w7xV+800vSVGxvDfL15/dQW7X662pJOByUCeFhrU3x9ddyADqYoe+ibtytCGZ4Qjfu2vZufBJk+HTDLtgJFS15FUdKKaaYyiwlH2Ns429aBdM0GZsao39Y79lbLTW1qb6JbZ3b6GrvYmv71rxSUz14VswXVRklNKsmFDVSKD1EhBNJ3u6fIpxYvUi6ldpDEYmbtNbpPRQtdat344p+SZ9VEQrP6o3kK4IZ2rUA7Xsaatb2wGcINC0VR3ks20sLUI/qodfsZRyLu5tS5LozIl0c5bMzQsRHEAQ7GFuMcn5o9eRVpRSvfTzC31weBuDYjgZ+6ZmdBHwrtackHA7JGIT6YKEXzByWp64bzPCcXlq+UTCD4dHFUVWndjfkcaqfVEmG1XDGUjfP2jNka6GUYnpuOiuAIRbPTpetCdZkpaZWV1mPHvfjz5ovajPaZL5IcAwplB4SokmTd/unWIyvfiLxwe0JfvCe3kOxu72GX3t+N9Wr7KEo+iV9VkTITOrO3K03ofdSdjDDrtNw8LlUMMMGxaC/YWmfhDfHJKHlT1klGVJDGQFawMLephSF2Bkh4iMIgt1MhmO8Pzi9avJqImny/ff6uHBHv549d6SNn31s66rzRkXvcIgv6L184UHdyFuPWEg7Gm6dWxnMsO8Z3bxr2CiYwbPM8t2Wl+U7oiJZjoZ8lpIvhBayAhhC4VVSU9u7Mk27+lrrKadBglnzRU00yXyRUDCkUHoIiKeKpLnYSt+wqRR/c2mI169qn/PJ3Y38l5/fseoeirqAj89taaCuGJf0WRGh2WG4/Zb2eIeWLbZr3aM7dHue3DiYwV+3bBO59ZS2sApnCVCc+MbftIxkMsno5Cj9I/2O7YxIi0/6jwy3CoJgJzOROO8NTJFUK6ukcDTBd8/d57PheQwDXnp8G08dbF31cYrW4aAURCe0syG6gTtAKT0Le+sc3HswmOGkLo62bRTMYGg7XTA9D2tdq2fUTMZSN8KI5aXk0ViUwdHBTHE0PZe9PNbr9bKldUvmxKi1sdVy066RxixtqqW2OBu3QlkghVKJkzBN3hucYia68o14PGHyvXd6uXJfv5B98dEOXjzRueoLzq76IEeLbUmfFRFaL5hh79O6QNoomMFXs1QcWVy2p5RihiUBGmXUkgA9uDNiaGxoxaLXzM6IVABDVaU1G1x6uDXdlRPxEQTBKeaicd4ZmCK+ylHS1HyUb712l9GZCBU+D79yZheHulaGExStw0ElITSotSmxgUNgcUqnqd56C+aWzdE2bNW6tPfz+iRpPdLzsJUd2hFhAVOZjDCSSVCdJQer+jISyQQj4yMZbRqbGluRmtra1JrZs2c1NdWDh1ZaswqjSsO6c0MQnEIKpRImaSo+GJxmMryySFqIJPjT1+9yf2wRjwFffWoHn9u3cgbH7zE4UWxL+nIVIaW0beHWufyDGbzBlK1uC/jXjqBdjaRKMqJGMpa6OdaOvF2N5TsjBkYGCEfDWZ9P74xIF0dWdkak54vSRVG70S7zRYIgFITFWIJ3BqaIrRIq1De+yL9+/S7z4QR1QT/feGEPW5tXntoXpcMhGYHFPv3HXMemlkxA3yWtTVnBDJWw+wmdXLdRMEOgcalxZ3EeNqqiWUvJo+QwK5XCNE0mpicyVrqh8aEVqakNdQ2ZPXtb27ZSWZF7YRMgsGTxNjpoow2fIW9FheJFfjpLFFMpPhyeZiy08sV6fDbCt169y8R8lMqAl187s5t9W1YWAUW3pC9XEQrPwmfv6OS66YGl+2vbdHG075n
1gxm8lSkB2qItdhY6lVEVpV/1ZwTIiqc7HAlnLAt274x4UHxaaZX5IkEQCk4onuTtgSkiq4QKXeud4c/fuk88qdjSVMVvvLCHhuqVJyRF53CIzerGXXgI1nMKTA/o4uizdyCy7PW9/QAcPLNxMIO/fpnl21pja07NZZp2w2o456XkSilmF2YZGB6gf1Q37h5MTQ1WBrMCGGqrc28qVlOdadh1GB000igWb6GkKJJ3yIIVlFJ8NDzD8MLKLtG90QX+9PW7LEaTNKb2UHSssoeiqJb05SJCmWCGt6D34spghgPPQec6wQyeimXL9hosFUezajYjQCNqJGcBcnJnRDXVWTHdIj6CILhNJJHknYFJQg+ECiml+OmNcX784QAKOLi1jl85s4tKf/brXVE5HJSCyKjWptjU2l8XC8G997Xte+zO0v25BjP4apfCgny5J8AppRhjLGOpm2Kd5/gAoXCIgdGl1NT5xeyEO7/Pz9b2rdpO12ktNbWJpuz5IsOaU0MQig0plEoMpRSXR2cZmI+s+Nzle1P8u7f1HoptLXoPRV0w+1ShaJb05SpCsyP65CifYAaPX3u6g1t0rHeOL/SmMrMEaJrpjb+J7J0RA6MDDI8P27Yz4kHxqaGmuDz7giCUNbGkybsDUyzEsoukpKn4yw8HeOembhQ9eaCFn398G94HTouaKv10b2mg2u/y2xIzDqEBnayaXGPpdyaY4U09G5tINS0NL2w/oa116wUz+KqXuRpyn4eNq3iWpS5MeONvQqemDo0NZQqjyZnJrM97PB46WjqWUlOb2/CuGyqR+j48tNGWpU0VRpEvABYEi0ihVEIopbg2Pk/PbHjF/a9fHeWvLw0BcGR7Pb/87K4VeyiKYklfLiKUiOpUoNtvwvDNpfsravS+owPPQdP21b/X8C3bRN6c87K9uIpnWeoirCxEH8SpnREPik+70S7DrYIgFC1xUxdJs9Hs5NVoPMm/ees+N/q1De3nHtvKc0faVjR5isLhkAjpxl1oANTKBFkgFcyQ2seXFcywRRdH6wUzeKu0LgW36FOkHP9bF9VixtEwqAZzWkqeNJOMToxm5oxGJ0YxH0iLbWlsybgZtrRtySk1NUAgKxCohRaZLxIeeuQnvIS4ObnAnenFrPuSpuIH7/Vx/jPdIXr2kTZ+7rGteJZ164piSd9GIpQJZngT7r63FMyAAV3HtAjtOAneVV7MDe+yZXstOS/bW1ALWQKUi6VuIbSQEZ+1dkZkLAs57oxIi8/y+SIRH0EQSoGEqXh/YJrpSHao0GwoxrdfvcvgVBif1+Brz+zk0Z2NWV/jusNBKYhN69UTkdHVvyaZgL7LunHXf3mVYIbnoG3f6oWPp3LJVuevz6k4UkoxyWRmKfkEE7l9z8zkUgDDKqmpdTV1ujBq1427XFJTa6jJKowasb64XBBKHXk3ViLcnlzg08nsBLhwLMmfnbvH7SG9h+LnT2/j84ey91C4uqQvFxEKz8Gdd/QA7IPBDPuf1X9WDWbw6CV7wU6oaNtg90T66SgmmKDH7KFX9TLJ5Ibfs+HOCI83E8CQ684IER9BEB4GTKU4PzTNRDj7JH1oKsy3X7vDzGKcmkofv/78Hna2ZZ+mu+pwUCaEh3XzLr5GXPb0gG7cffb2ymCGA8/B7sdXD2bwBJbNwzbmVBwlVCJrKfkiixt+z9zCnJ4zGu5ncHSQUCS7aVdZUZnZs9fV3kV97cr49Qdppjnb4m1YW5MhCA8jUiiVAHenF7k+kT1sObUQ5duv3mVkJkLA5+HvPreLR7ZlvxC6tqRvIxEyTR3McPtNHcxgpoMZ/MuCGQ6tYpszlm0ib89pE3lCJRhUgxkBCrGG3S/99RvsjABoa27L2Ok6Wzrx+dZ/Hun5ok6jk3ajXYZbBUEoeUyl+HBohtHF7FChW4NzfPfcPaJxk7b6Cr7xxb001y6dGLnqcEjGINSnrd/mKpHZsRDc+yAVzPDZ0v1VDbD/Gd24a9iy8vs
M/zLLd1NOlu+wCmd0aUANkGANu1+KSDTCwOhA5tRodj5bW31eX1Zqaktjy7r/vl68KyzeMl8kCCuRQqnI6Z0N8fFYdox0/0SIb792R++hqPLzGy/soatlKdDAa8AxN5b0bSRCc6OpDt1Ptdc7TcvupWCGigdneIylZXtVHTltIg+pEH2qjx7Vw6AaXFeAlFKMT4/raNSRfobHh0kks7++obZBF0Y57IwQ8REE4WFHKcWlkVmGFrJnOd+/NcEP3+/DVLCno4b/6gu7qa5YepvhmsMhvqCdDeFB3chbjlIwcks37u59sCyYwQPbT2pt2vboysac4dMNu2AnVLRsWBwppZhmOmsp+XokEgmGxocyhdH41MrU1Pbm9kzTrqOlY93U1AoqVli8vTna1AWhnJFCqYgZnA9zcSS7a3S9b4Y/f6uHWMKks7GS33hhL401S6LjypK+9UQoEYX7H2pr3Ypghs/r6NTmHSsfM9CkBaiyY8Nle0opppjKCNAYY+t+7ezCbEZ81toZke7KbbQzQsRHEIRyQinFlbE5+uaWQoVMpfjri0O8cU2/+T+1p4n/x1Pb8S1zM2ytreRkez3+QjkclILohHY2RMdXfj40rdNUHwxmqN+S2sf39MpgBsOrLd9VndrdsMFrfVIlGVbDmZOjeebX/FrTNBmfGs/o0vD4MEkzO7ihqb4po00bpabWUZelTQ00iMVbEPJACqUiZWQhwodDM1n3/fTGGH95Xu+hOLClll89s5vKwNIL9a76IMfa6lbErjrCeiK0YTDDc7Dj1MpgBn/D0uCrd/2Ut7QA9Sg9b7TAwppfa2VnRFdHF031TWsKSi21WfuLRHwEQSgXlFJcH5/n/syShTmeMPne2z1c6ZkB4OzxDr50vDPzulhwh4NKQmhQa1PiAV0wU8EMt96E/itLjT1fhXY0rBrM4Flm+W7b0PIdUZFMgmq/6l9zKblSipm5maXU1LHBFU276qpqtnVuyxRGNcHVZ4YMjBXzRdVG7juZBEFYGymUipDxUJQPhqYzq1dNU/GXFwZ4+4YuSB7f38xXntieKYj8HoOTHfVsLcSSvvVEKDKnN5LfehOm+5fuXy+YwV+3bBP5GvuQ0g+vIvSpvowAxYmv+nV27YwQ8REEQVji08kFPluWvLoQSfCd1+/SM7aI12Pw1Se3071v6TW+oA6HZAQWe2GxT6+hWM70oLbWffZTHSCUpv0AHHhWp9dlBTMY2k4XTM/Drv/800vJe8weRhhBrbE4PZ2amg5hWAxnhzYE/AEdDJQKYWioXb0R58NHm9FGB0sW74DhQmCTIJQBUigVGVPhGO8NTGOmXmej8SR//lYPn/RrC97fPrWFLxxtz7x4FmxJ31oiZJoweFUXR70fPRDM8DltrdtyONu/7atZKo42WLY3o2YyMamjjK4qQHbtjBDxEQRBWJ3Ppha4uSx5dWw2wrdevcvkfJTKgJdf+8Ju9nUu2ZQL5nCIzaas38OwXB9iYbj3/irBDPWw7xldIDVszX6s9DxsZQd4137tN5XJKKOZpeQzzKz6ddFYNKtpNzWbvVzd4/GwpXUpgKG1afXU1Eoqs5JSm2kWi7cgFAgplIqImUicdwemSKZS1uZCcb792l0GJkP4vAa/9PROju9a2kNRkCV9a4mQ1WAGb1Av2qvqBP/aMz+mMhlhJCNAs6xMzctlZ0Rtda22LKyzMyItPuk/LbSI+AiCIDzA/ZkQ18aXLMv3Rhb4zht3CUWTNNUE+MYX99DeoF9jC+JwUEqvnFi4r1dQLL9/9JbWphXBDCdSwQzHs+1zgcalxt0687AxFWNADdCjeuhX/asuJU8mk4xMjGT27I1NrkxNbW1qzezZ62xdPTU1PV+ULozq2XgfnyAIziCFUpEwH03w7sAU8dRR0vB0mG+/epfpxRjVFV5+/fk97GrXpy8VXg/dnQ20ObWkby0RSsTg/nktQsM3lu6vqNEbyQ88lx3M4K2EqnRxVLfmPomoimZ
5uqOsTMybX5zX4rOJnREiPoIgCNbomwtzeXSpYXXx7hR/8U4vSVOxvSXI11/YQ22VPqF33OFgxvXS8oUeSC6FSehghre1vW52eOn++i365GjfM9nBDP76ZZbvtQu6eTWfCWIYUkMrlpIrpZiYnsicGA2NDa1ITa2vrc/YvLvau1akphoYtNCS1bQLGuvb0AVBKBxSKBUBi7EEbw9MEk3qF+HbQ3N89417ROImrXUV/MYX99Bap19c24IVPNZZ78ySvtVESCmYuLcUzBBLFygGdB3V1rqdjy0FM3gqli3ba1izOJpTcxkBGlbDKwRoszsjls8XpQsjER9BEITcGZqPcHF4BtBFwWsfj/A3l3UhcnR7PV97dhcBn7aKOepwSIS0LoUGQKUKETMBfVd0ouqDwQy7n9CNu/b9Sxrkr01p05Y152GVUowznllKPsXUiq+ZnZ/NFEYDowNEotknS1WVVVmFUV1NXdbnffhoN9p1UYS2ePuNAqbUCoJgCSmUXCYcT/L2wBSRhH6RP397gu+/p/dQ7G6v4de+sJvqSp9e0tday75GB5b0rSZC6WCG22/C1LJghppWLUD7n4GaFn2fJ5DaJ7FFx3qv8vxMZTLGWMZSN8101udz3RmRLowe3BmREZ/UfFGb0SbzRYIgCHkyuhjlw2EdKpQ0Fd9/r48PP9PBOM890sbPPrYVj8dwzuGglHY0LNzXDoc0M4Mp2/fbEF7WQGvfr7Vp1+MQSJ0S+aqXiqM15mHjKp5ZSt6n+lYsJQ9HwkvrJEYHmFvI3mvo9/nZ0rYl42ZobmjO0ugqqlbMF3lyWEgrCEJxIIWSi0QSSd4ZmCQUT2IqxcuXhnjtqhaEk7sb+S8/vwOf1+PMkr7VRGi9YIadn9MilA5mMHzLNpE3r7psL67iDKiBzMnRck+31Z0RW9q2UBFYEuK0+KQFqIkmmS8SBEGwgYlQjA8GpzAVhKMJvnvuPp8Nz2MY8NLpbTx1qBVwyOGgTD0Tu3Af4qmiJBbWM0e334TR20tfW1WXCmZ4bimYwVulC6NgJ/hqV23cLarFjC4NqkGSLGlPPBHPCmCYmJ7I+l6P4aG9pT0zZ9TWkp2a2kBDlo2ujjqxeAtCCSOFkkvEkibvDkwxH0sST5j8xTu9XL6vT1m++GgHL57Qeyi6ais5YeeSvtVEaG4Ubr+l/2QFM+xaFsxQk1q2155KBWpZddneglqgT/XRo3oYUkMZAVJKMTM/Q/9wfjsj6qnPKoxEfARBEOxnKhzjvcEpkgqmFqJ869W7jM5ECPg8/Mpzuzi8rd4Zh0MyBqE+WOgFM5oKZritrXUPBjNsOw4HzsD24zqYwVO5tIPPX7+iOFJKMclkZin5OEuOhaSZZGxyLHNqNDIxgmlmW8GbG5qzmnbpRa8ePCvmi6qMAqzpEAShYEih5AJx0+S9gSlmowkWIwm+88Zd7o8u4jHgq0/t4HP7mvEa8GhbPTvsWtL3oAglYtDzIXx6bo1ghmeheSd62V6bFqGKNnhg35BSigkmMpa6CZa6b4vhxYz4rLkzor1LC9CynREiPoIgCIVnNhrnvYEpEqaif2KRb792l/lwgrqgn994YQ9dzUH7HQ7xBd24Cw0CJoRmdJrqrbdgdmjp6+o7deNu39MQbNSW78w8bOOK4iipklmWuvRScqUUU7NTGW0aHB1cmZoa1Kmp6TmjYJWeafLjz5ovajPaZL5IEB5ypFAqMElT8f7ANFOROONzEb796l3G56JU+j38V1/Yzf4tdfYu6VsuQiq5djDD1qNahHac0sOwmU3k7Ss2kSdUgiE1RI/qoU/1sYgugPLdGSHiIwiC4C7zsQTv9E8RMxXXe2f4N2/dJ55UdDZW8Y0v7qGhOmCfw0EpiE5obYpOLAUz3H4T+i4/EMzwuD49at+fKo7Slu+mFZbvsApnlpIPqIHMUvL5xfmlOaORgRWpqRWBiowudXV0UV+jE1GDBLPmi5pokvkiQSgzpFAqIKZSfDA
0zUQ4xv3RBb7z+l0Wo0kaawJ844U9dDRW2bOk70ERiszDnXd0gTTVt/R1Na365Gj/s/p2etleVceKTeQhFcoSoASJrJ0RAyMDjE6Orrkzoquji87WTvw+f0Z80n9kuFUQBME9QvEE7/Tr5NWffjLGX344gAIObq3jV57bRXWF1x6Hg0rqpt1CDyQWUsEMb+kTpOXBDG37dHG0+3GoqE2FBXVCRUtWcaSUYoYZelUvPWYPo+h520g0wuDYIAPDujiamZ/Jehper1cHMLRvo6uzi9bGVgzDoJHGLG2qpVYs3oJQ5kihVCBMpbgwNMPoYpTL96b43ju9JJKKbS1Bvv78HpprAptf0rdchGJzMHhN+7t7L+qOHaSCGbq1CG05rIUnmN5EvhSWoJRimml6VA+9Zi9jjOW9MyI93Jruyon4CIIgFAfhRJK3+6dYjCX5jx8O8M5NPb/zxIEWXnp8G42V/s07HJIRbfsO9UF0Hu69rwuk0VtLX5MOZtj/HDRt15bvqk7tblg2D5tUSUbUSCaMYY45EskEw+PDWampy5t2hmHQ1tSW0aaO1g4C3gCttGYVRpVG9o4jQRAEKZQKgFKKSyOzDMyHef3aKH99Ufuuj2yv52vP7KSztpLPbWkgmO+SvuUiNDO4LJhhculrWnZpAdr7JNR0LQ2+epeEIamSDKvhjADNM8/s/CwDowM6hGGNnRHLF7021DTQQkumKGo32mW+SBAEoQiJJkze7Z9iKhTjz9/q4ZN+farzs49t5cyRNnY3VnOsdRMOh9hsyvo9BGO39UzsvfdXCWZ4DrafWtKlyrYsy3d6KXmP6qFf9RMxI4xPj+tdRiMDDI0PkUxmp6Y21jVm7HRb27dSG6hdsngbHbTRhs+Qt0CCIKyPvEo4jFKKj8fmuD8T4gfv9XE+tYfimcNt/J3urRxqqeFQvkv60iI036uDGW6dg6FPlj5fUZ0KZngOOo4t20S+tGwvoiJZlrrZyKzuyo3qU6M1d0ak7XQNnXR4ljpyrbTKfJEgCEKRE0+avDswycBMmG+/doeByTA+r8EvPb2T7j1N+TsclNIrJxbuw8x9ve/o9pswsyyYoa5Duxr2PQ1N+1OuhvYsy/esms007YbMIZ2aOtKfCWBYLTV1+ZxRe7A907DrMDpopFEs3oIgWEYKJQdRSvHJxDyfjM3zZ+fucXtI76H48ue6eOFoR35L+tIiNH8Phi5pAbrzHsTSiXIGbD2iRWjPs1C7M7VPojrzEDNqJhOT2p/oZ3BsMKedEV0dXexu3s1W39aMlU7ERxAEobRImCbvDU5xY3ieb792h5nFONUVPr7+wm5Obm/Mz+FgxvXS8rm70POettb1XVolmOE52P4kBLfq4sir0/NMZTKmRugxe/R+o/Bg5sSof6SfhdBC1uUC/gBb27dmiqM9dXvo9CwVRrVGrQ3/UoIglDtSKDnIrakFzvdN861X7zCS2kPxd5/dyZmD7daX9KVFaOIq3Ho9FczQu/T5mhYdynDoRWg/ntonoYXCVCYjaohes5f7yfvcnryd886Iw22H2RHYkenM1VAj80WCIAglStJUfDA4zXt3Jvmzc/eIxE1a6yr4xhf38tTOJusOh0RIz8UOnYdPX9cnSOGZpc+37dPF0cG/BfV7UpZv3SCMqRgD5j16VS93Yne4O3o3Y/VeLTW1s7Uzs+j1SNMRtnq3ZgqjCsNi01EQBCEHpFByiDtTi/zk0zG+/dod5sMJaqt8fOOFvbx4qN3akr5ESHfo7rwMn74GPR+tDGY4dBb2fkl36Px1YBjEVIx+8y49Zg+XZy5zb+TehjsjtnVs40T7CfYG92bmi2S4VRAE4eHAVIoPh6f58ZUhfvBeH6aC3e01/L0v7uW5XS25OxyUgtg0TN2Amz/WjbvlwQyVddpW98jPwdbTKcu3tvHNq3l6zc+4m7jL5YnL9I306dTUiVFMld20a21spauji12duzjZdpId/h10GB200CLzRYIgFAR
5pXGA+zMhvnexj3/zVg+xhElHQyX/8Gf286V97bkt6UuL0OB7cP2HcPunsLDMEte8Ew6+AEd/ARoPQqABDEMLkPqEK/NXuDh8MSNAa+2M2Nm+k1NbTvFI7SN0ejpppVXERxAE4SFEKcWHQ9N8+617vH5Vx2if3N3Ib31pP49vbczN4aBMHcxw92/gk/+sgxniqYAfw4BtJ+Dwi3Dw70DNDvAFUUoxzjj3E1f5aPojro1cy6SmPti0q6+pp6uji30d+3is4zH2Ve3LzBeJk0EQBDeQd8U20z8X5o/OfcZ//HAApWD/llr+x587xFPbmzde0qdMmLsP174HN/4Ghq4vfa6iGvY+A49+FXY8C4EmFDDGGDfCb/LO6DvcHL659s6I1i3s6djDqc5TPNb8GFs8W0R8BEEQygCltN3u//ufP+XK/WkAzj7awT8+u5/9TTnYqZMxGL8MV/5c2+tmBpc+V9ehXQ2P/j+h9Rj4a4irOINqkEuzl3h/+H3ujtxlYGSAcDSc9bBVFVV0dXRxsOMgn+v8HEdqj2iLt1Fj9z+BIAhCXkihZCP9s2H+3395nZ/eGAPgif3N/H/+iyPsadrAapeMwf2fwKU/hztvrwxmOPoSHPkqVG8hTpL7ifucG/oBF4YvcH/k/po7I/Z17ONU5ymebHuSbb5tMtwqCIJQZiileKdvkv/lh9e5P7aIx4C/+8wu/uFzezd2OESn4fpfwNUfQN9lvasPUsEMT8Kj/yXs+1vgryNEmGvha7zZ/yZXhq/QP9LP7MJs1sP5vD62tm/lcMdhTnee5lTjKTo9nTJfJAhC0SKFkk30TIf4+9+7xPU+LQwvfa6L//VnDlFfuY4QzfXBxX8N1/8jTPYs3V/TAod/Fk7+CrQfZ85c5K2pt3j77h9xfeT6mjsjDnQc4FTnKZ7peIY9FXtEfARBEMqcV++M8z/++6tMzEepDHj5f/3tg/zdx7av7XBQCoYvwEffhps/yQ5maN+vG3eP/jKqeitDyWFeG/2PvD/0PrdHbjM+PZ71UIZh0NncyeHOwzze+ThPtj7JFu//v717D4uyzPsA/p2BYTiDATKDIATiAQ+ooHKIAFO8zFfz2oOWratGu+Ie0kxbrd5M3fd1yzc3dbPWUqwN081DeZWptAuE4ll0t0VBUfEQqCjKQUBgfu8fxOQAAsNhDvL9XBfX1dw8z3N/b5l7ft0zz/OMD2wURtzIiIjIjLhQ6gRnrpfhVx8fw+Xiu7C1UWDuuL74zWNBzX9Jn64OyN0FnNgE5O//8cYMSlsg6HFg2LPQBU/Ev+6exr7v9+FYzps4f+18s98Z0U/TDyO0IxDnE4cBjgNYfIiISG/7qav47x3/xt3qOjzibIdVTw9FbJBn82c4VN0BTn0EZH8KFOX82G7vCoRMAIbPRLVmKL69mYn0/Pdxsugkrty40uSuqV5uXvqFUZx3HHrZ9eIp3kRktbhQ6qBjl27h1x8fx63ye3BS2+D/poZifIi26Ya3LgDH/lp/CkP5fe+6efYBhk5FUf8J2HfnOPYX7sN3n69C2d0yg93VKjWCvYMRrg3HaO1ohLqFQqnk9xcREVFTHxw4jz99dQZ1OkGAlxOSZ4bjUY9G1/6IAJf2A0c/AHL33ndjBiXgHwEZ9ixO9xqMfdfTcDh3NfK+zcO9mnsGh3B1dMUg7SCM0ozCE9on4O/kb6IREhF1PS6UOmDf6SLM/fQkKu/VwdvNHptmhWOAxu3HDWqqgJwdwPFk4NJRAD9cR6R2RsWA8cgKCMc/qi/ieFEqir76m8GxlUol+nj1QbgmHKN9RiPMMwy2Sv65iIjowUQE/7PnND7MuAAAiOjjgQ9/EQ5n+/vqR/kNIDu5/rrYkvu+j8+tF4oGTUK6JgDpt0/iX7nrUHbS8E07ezt7DPQeiAhtBMb4jEGQaxA/MSKihxb/z7ud/naoAEu++A90IhjYyxUfzxoJD+cfrgkqPFV/fvd3O4Dq+m8TrwFwqvcwZPo
EYX/dLZy7eRS6U4cNjtm7R+/6U+m0cRjpPRKOKkcTj4qIiKxVTZ0O8/5+El+dKgQATB3ph/+dPLj+NPC6WuBcav11sef+WX8aOIAylT2OBo1CukdPHCwvQNH3XwHf/3hMW6Ut+vXsh0htJOK18RjoMRA2Sp7mTUTdAxdKRhIRvLknF+9n5AMAEgZ6Y83Tw2Bfcwc4vKn+06Prp6EDcFalwiEvH+z31CK75g6q624C127qj9XTuSdGaEcgVhuLCG0Eetj3MM+giIjIqpVW1SDxo2M4euEWFArg1QkD8PxjgUDxOSD7Y+DkZqDiBu4BOGmvxiGvQOx3ccaZyluQ6gvA9/WfQCmgQKBHICK1kXhc+ziG9RwGe1t+8TgRdU9cKBmhurYOL/39FL78V/27dUmPB+Dl4GtQfp4InPkKVxV1OGxvj4M9vXDIyRm38cOd6arqr0lyVbsiXBuOGG0MIrQR8HXxNddQiIjoIXGl5C5+ufEIzt+ogL1KiXd/3g9P6A4BG5Kgu3wYZ+xUOORgj0M+PjihtkM1dACqgcr6mwT5uPogUhuJGG0MwjXhcFO7tdwhEVE3YRULpXXr1mHlypUoLCzEwIED8c477yAmJqbL+lucPBlKKPE/s3Yg90I2NqUvxU8iXsGbGbVwrFiGsT2rMdc7Ar55LyP1u5s47GCPQ1oPXFap7jtKHdQ2agzXDEe0NhoR2ggE9wiGUsEbMBARPQwsoTY9PuglvLa3CgMd3kaI910s9R6Au1/vxt9tdTjkYI+jvXvhts39p8rp0MOhByI0EYjyiUKENgIaJ02XZSYismYWv1DaunUr5s2bh3Xr1iE6Ohp//etfMX78eOTk5KB3795d0qcSSuxSngWSf4LH+/8MXyrzcXHX1/BR7UGaZzmGVVZhWcUOnHFXQRReP+6nUGKw52BE+kRilGYUQr1CobJRtdATERFZI0upTWf2fIXHXb7BNz2qMaC6GtPu3sD3GneD/RxVjhjhPQIR2ghEaCMQ5M4bMBARtYVCRMTcIVoyatQoDB8+HO+9956+bcCAAZg8eTJWrFjR6v6lpaVwc3PDnTt34Orq2uZ+X03+CXYpz+LxO1741u0GBpU64DvXyibbBbkFIvKHd+XCvMPgbOfczNGIiLqf9r7+WgNz16bokkdwoMct9C91wJlGtclWYYNQr6GI8KlfGA30HAiVkm/aEREBxr3+WvQnSvfu3cPx48exaNEig/aEhARkZWU1u091dTWqq3/8ctY7d+4AqP9HaauzF08hzO9J3DyRgmKUoc6uDrpKgbbaHs5KW/h5ByN60H8h3Dscno6e+v10VTqUVrW9HyKih1nD666Fvx9nNHPXpqvHPkSJ8i7qKuug/KE2edg6ItA3FI8PmoBQr1CDu6ZWlleiEk3f6CMi6o6MqU0WvVAqLi5GXV0dvL29Ddq9vb1RVFTU7D4rVqzA0qVLm7T7+fl1KMtpg0eHsAZ/e8CWRER0v7KyMri5PTw3CLDc2vQt/hdrO3Q8IqLuoi21yaIXSg0an0stIg88v3rx4sWYP3++/rFOp8OtW7fg4eHRrnOyS0tL4efnh8uXL1vtqSPWPgbmNz9rH4O15wescwwigrKyMvj4+Jg7SpdgbWo/a88PWP8YrD0/YP1jsPb8gHWOwZjaZNELJU9PT9jY2DR5h+769etN3slroFaroVarDdrc3d07nMXV1dVqngAPYu1jYH7zs/YxWHt+wPrG8DB9ktSAtanzWHt+wPrHYO35Aesfg7XnB6xvDG2tTRZ9r2o7OzuEhYUhNTXVoD01NRVRUVFmSkVERN0ZaxMRUfdg0Z8oAcD8+fMxffp0hIeHIzIyEuvXr8elS5eQlJRk7mhERNRNsTYRET38LH6hNHXqVNy8eRPLli1DYWEhBg0ahN27d8Pf398k/avVaixZsqTJKRPWxNrHwPzmZ+1jsPb8wMMxhocJa1PHWHt+wPrHYO35Aesfg7XnBx6OMbTE4r9HiYiIiIi
IyNQs+holIiIiIiIic+BCiYiIiIiIqBEulIiIiIiIiBrhQomIiIiIiKgRLpQArFu3Do8++ijs7e0RFhaGzMzMFrfPyMhAWFgY7O3tERgYiPfff99ESZtnTP4dO3Zg7Nix8PLygqurKyIjI7F3714Tpm2esX+DBgcOHICtrS2GDh3atQFbYWz+6upqvPrqq/D394darUZQUBA2btxoorTNM3YMKSkpCA0NhaOjI7RaLWbNmoWbN2+aKK2hb7/9FhMnToSPjw8UCgU+//zzVvexpHlsbH5LncfUuVibzP+cZm1ibeoI1ibLmMcdIt3cli1bRKVSyQcffCA5OTkyd+5ccXJykoKCgma3P3/+vDg6OsrcuXMlJydHPvjgA1GpVLJt2zYTJ69nbP65c+fKm2++KUeOHJG8vDxZvHixqFQqOXHihImT/8jYMTS4ffu2BAYGSkJCgoSGhpombDPak3/SpEkyatQoSU1NlQsXLsjhw4flwIEDJkxtyNgxZGZmilKplNWrV8v58+clMzNTBg4cKJMnTzZx8nq7d++WV199VbZv3y4AZOfOnS1ub2nz2Nj8ljiPqXOxNpn/Oc3axNrUUaxN5p/HHdXtF0ojR46UpKQkg7b+/fvLokWLmt3+5Zdflv79+xu0zZ49WyIiIrosY0uMzd+ckJAQWbp0aWdHa7P2jmHq1Kny2muvyZIlS8xajIzN//XXX4ubm5vcvHnTFPHaxNgxrFy5UgIDAw3a1qxZI76+vl2Wsa3a8mJuafP4fm3J3xxzz2PqXKxN5n9OszaZH2sTa5O5detT7+7du4fjx48jISHBoD0hIQFZWVnN7nPw4MEm248bNw7Hjh1DTU1Nl2VtTnvyN6bT6VBWVoZHHnmkKyK2qr1jSE5ORn5+PpYsWdLVEVvUnvy7du1CeHg43nrrLfTq1Qt9+/bFggULUFlZaYrITbRnDFFRUbhy5Qp2794NEcG1a9ewbds2TJgwwRSRO8yS5nFnMPc8ps7F2mT+5zRrE2uTOVjSPO4M5p7HncHW3AHMqbi4GHV1dfD29jZo9/b2RlFRUbP7FBUVNbt9bW0tiouLodVquyxvY+3J39jbb7+NiooKTJkypSsitqo9Yzh79iwWLVqEzMxM2Nqa9yncnvznz5/H/v37YW9vj507d6K4uBi/+c1vcOvWLbOcC96eMURFRSElJQVTp05FVVUVamtrMWnSJKxdu9YUkTvMkuZxZzD3PKbOxdpk/uc0axNrkzlY0jzuDOaex52hW3+i1EChUBg8FpEmba1t31y7qRibv8Gnn36KN954A1u3bkXPnj27Kl6btHUMdXV1mDZtGpYuXYq+ffuaKl6rjPkb6HQ6KBQKpKSkYOTIkXjyySexatUqbNq0yWzv3AHGjSEnJwcvvPACXn/9dRw/fhx79uzBhQsXkJSUZIqoncLS5nF7WdI8ps7F2mT+5zRrE2uTqVnaPG4vS5rHHdGtP1Hy9PSEjY1Nk3cmrl+/3mRF30Cj0TS7va2tLTw8PLosa3Pak7/B1q1bkZiYiM8++wxjxozpypgtMnYMZWVlOHbsGLKzs/G73/0OQP2Lu4jA1tYW+/btw+jRo02SHWjf30Cr1aJXr15wc3PTtw0YMAAigitXriA4OLhLMzfWnjGsWLEC0dHRWLhwIQBgyJAhcHJyQkxMDP74xz9a/LteljSPO8JS5jF1LtYm8z+nWZvqsTaZliXN446wlHncGbr1J0p2dnYICwtDamqqQXtqaiqioqKa3ScyMrLJ9vv27UN4eDhUKlWXZW1Oe/ID9av8mTNnYvPmzWY/b9fYMbi6uuLf//43Tp48qf9JSkpCv379cPLkSYwaNcpU0QG0728QHR2N77//HuXl5fq2vLw8KJVK+Pr6dmne5rRnDHfv3oVSafjyYWNjA+DHd78smSXN4/aypHlMnYu1yfzPadameqxNpmVJ87i9LGkedwpT3jnCEjXcenLDhg2Sk5Mj8+bNEycnJ7l48aK
IiCxatEimT5+u377h1o0vvvii5OTkyIYNGyziFqxtzb9582axtbWVd999VwoLC/U/t2/fNkt+EePH0Ji57yxkbP6ysjLx9fWVn/3sZ/Kf//xHMjIyJDg4WJ5//nlzDcHoMSQnJ4utra2sW7dO8vPzZf/+/RIeHi4jR440S/6ysjLJzs6W7OxsASCrVq2S7Oxs/S1kLX0eG5vfEucxdS7WJvM/p1mbWJs6irXJ/PO4o7r9QklE5N133xV/f3+xs7OT4cOHS0ZGhv53M2bMkNjYWIPt09PTZdiwYWJnZycBAQHy3nvvmTixIWPyx8bGCoAmPzNmzDB98PsY+ze4n7mLkYjx+U+fPi1jxowRBwcH8fX1lfnz58vdu3dNnNqQsWNYs2aNhISEiIODg2i1Wnn22WflypUrJk5dLy0trcXntaXPY2PzW+o8ps7F2mT+5zRrE2tTR7A2WcY87giFiBV8FklERERERGRC3foaJSIiIiIiouZwoURERERERNQIF0pERERERESNcKFERERERETUCBdKREREREREjXChRERERERE1AgXSkRERERERI1woURERERERNQIF0pEFiA9PR0KhQK3b9+2yOM1Pq5CocDkyZM79dit2bRpk77vefPmmbRvIqLuiLWpdaxNDzculMhivP/++3BxcUFtba2+rby8HCqVCjExMQbbZmZmQqFQIC8vr9XjdtULMwBcu3YNKpUKn3zySbO/nz17NoYMGdLp/bYmKioKhYWFcHNzA1D/Qu7u7t5px8/NzcWmTZs65VgFBQVQq9UoLS1tcbupU6eisLAQkZGRndIvEVFbsDZ1HtYmsjZcKJHFiI+PR3l5OY4dO6Zvy8zMhEajwdGjR3H37l19e3p6Onx8fNC3b1+T5RMRg0IJAN7e3pgwYQKSk5ObbF9ZWYktW7YgMTHRVBH17OzsoNFooFAouuT4PXv27LTi9sUXXyAuLg6urq4tbufg4ACNRgM7O7tO6ZeIqC1YmzoPaxNZGy6UyGL069cPPj4+SE9P17elp6fjqaeeQlBQELKysgza4+PjAQCffPIJwsPD4eLiAo1Gg2nTpuH69esAgIsXL+q369GjBxQKBWbOnAmgvri89dZbCAwMhIODA0JDQ7Ft2zaDPhQKBfbu3Yvw8HCo1WpkZmY2yZ2YmIi0tDRcvHjRoH3btm2oqqrCL37xi1b7as727dsxcOBAqNVqBAQE4O233zb4fXV1NV5++WX4+flBrVYjODgYGzZsMMh++/ZtpKenY9asWbhz547+9IA33ngDy5Ytw+DBg5v0GxYWhtdff73FbI3FxcXh97//PebNm4cePXrA29sb69evR0VFBWbNmgUXFxcEBQXh66+/brLvF198gUmTJulzjxw5Ek5OTnB3d0d0dDQKCgqMykJE1JlYmwyxNrE2dStCZEGmTZsmCQkJ+scjRoyQzz77TObMmSOvvPKKiIhUV1eLg4ODfPjhhyIismHDBtm9e7fk5+fLwYMHJSIiQsaPHy8iIrW1tbJ9+3YBILm5uVJYWCi3b98WEZFXXnlF+vfvL3v27JH8/HxJTk4WtVot6enpIiKSlpYmAGTIkCGyb98+OXfunBQXFzfJXFtbK1qtVpYsWWLQHhcXJ1OmTDGqr5KSEhEROXbsmCiVSlm2bJnk5uZKcnKyODg4SHJysv74U6ZMET8/P9mxY4fk5+fLN998I1u2bGlyvOrqannnnXfE1dVVCgsLpbCwUMrKyuTy5cuiVCrlyJEj+mOeOnVKFAqF5OfnN/v3aZyzQWxsrLi4uMjy5cslLy9Pli9fLkqlUsaPHy/r16+XvLw8mTNnjnh4eEhFRYV+v5KSElGpVHLp0iWpqakRNzc3WbBggZw7d05ycnJk06ZNUlBQ0KSvuXPnNpuPiKgrsDaViAhrE2tT98OFElmU9evXi5OTk9TU1EhpaanY2trKtWvXZMuWLRIVFSUiIhkZGQLggS+YR44cEQBSVlYmIs2/gJa
Xl4u9vb1kZWUZ7JuYmCjPPPOMwX6ff/55q7n/8Ic/iL+/v+h0OhEROX/+vCgUCtm7d69RfTVknDZtmowdO9Zg+4ULF0pISIiIiOTm5goASU1NbTZP4+MlJyeLm5tbk+3Gjx8vc+bM0T+eN2+exMXFPXCcLRWjxx57TP+4trZWnJycZPr06fq2wsJCASAHDx7Ut6WkpMjw4cNFROTmzZsCQF+gH4TFiIhMjbWpPiNr04OxNj2ceOodWZT4+HhUVFTg6NGjyMzMRN++fdGzZ0/Exsbi6NGjqKioQHp6Onr37o3AwEAAQHZ2Np566in4+/vDxcUFcXFxAIBLly49sJ+cnBxUVVVh7NixcHZ21v98/PHHyM/PN9g2PDy81dyJiYkoKCjAP//5TwDAxo0b4evrizFjxhjVV4PTp08jOjraoC06Ohpnz55FXV0dTp48CRsbG8TGxraarSW/+tWv8Omnn6Kqqgo1NTVISUnBc889165j3X9hsI2NDTw8PAxOn/D29gYA/akngOGpDY888ghmzpyJcePGYeLEiVi9ejUKCwvblYWIqDOxNtVjbWJt6m5szR2A6H59+vSBr68v0tLSUFJSon+x1Wg0ePTRR3HgwAGkpaVh9OjRAICKigokJCQgISEBn3zyCby8vHDp0iWMGzcO9+7de2A/Op0OAPDVV1+hV69eBr9Tq9UGj52cnFrNHRwcjJiYGCQnJyM+Ph4fffQRZs2aBaVSaVRfDUSkycWuIqL/bwcHh1YztcXEiROhVquxc+dOqNVqVFdX46c//Wm7jqVSqQweKxQKg7aG8TT8e9TU1GDPnj1YvHixfpvk5GS88MIL2LNnD7Zu3YrXXnsNqampiIiIaFcmIqLOwNpUj7WJtam74UKJLE58fDzS09NRUlKChQsX6ttjY2Oxd+9eHDp0CLNmzQIAnDlzBsXFxfjTn/4EPz8/ADC4MxEA/Z1o6urq9G0hISFQq9W4dOlSh9/5apCYmIg5c+bgqaeewpUrV/QZ29NXSEgI9u/fb9CWlZWFvn37wsbGBoMHD4ZOp0NGRgbGjBnT6vHs7OwMxt/A1tYWM2bMQHJyMtRqNZ5++mk4Ojq2KWNHpaWlwd3dHUOHDjVoHzZsGIYNG4bFixcjMjISmzdvZjEiIrNjbWJtYm3qfrhQIosTHx+P3/72t6ipqTF48Y6NjcWcOXNQVVWlv1tQ7969YWdnh7Vr1yIpKQnfffcdli9fbnA8f39/KBQKfPnll3jyySfh4OAAFxcXLFiwAC+++CJ0Oh0ee+wxlJaWIisrC87OzpgxY4bRuX/+85/jhRdewOzZs/HEE08gICAAANrV10svvYQRI0Zg+fLlmDp1Kg4ePIi//OUvWLduHQAgICAAM2bMwHPPPYc1a9YgNDQUBQUFuH79OqZMmdLkeAEBASgvL8c//vEPhIaGwtHRUV90nn/+eQwYMAAAcODAAaPH3V67du3Sn9oAABcuXMD69esxadIk+Pj4IDc3F3l5efjlL39pskxERA/C2sTaxNrUDZn3Eimipi5cuCAApH///gbtly9fFgASFBRk0L5582YJCAgQtVotkZGRsmvXLgEg2dnZ+m2WLVsmGo1GFAqFzJgxQ0REdDqdrF69Wvr16ycqlUq8vLxk3LhxkpGRISIPvji0Jb/+9a8FgGzevNmgvT19bdu2TUJCQkSlUknv3r1l5cqVBsesrKyUF198UbRardjZ2UmfPn1k48aNDzxeUlKSeHh4CIAmd0GKiYnRX4zbkpYumG18Eau/v7/8+c9/NmgDIDt37hQRET8/P4MLfouKimTy5Mn68fj7+8vrr78udXV1rfZFRNTVWJvqsTaxNnUnCpH7Ti4lom5HRNC/f3/Mnj0b8+fPb3Hbhu8IKSkp6dCX+p04cQKjR4/GjRs3mpw/3pq4uDgMHToU77zzTrv7JyIiy8baRJaAd70j6sauX7+OVatW4erVq/rz1tvC19cXzzzzTLv7ra2txdq1a40
qRCkpKXB2dm72ixWJiOjhwdpEloKfKBF1YwqFAp6enli9ejWmTZvW6vaVlZW4evUqAMDZ2RkajaarI+qVlZXh2rVrAAB3d3d4enqarG8iIjId1iayFFwoERERERERNcJT74iIiIiIiBrhQomIiIiIiKgRLpSIiIiIiIga4UKJiIiIiIioES6UiIiIiIiIGuFCiYiIiIiIqBEulIiIiIiIiBrhQomIiIiIiKiR/wdzgV7aCsjPcAAAAABJRU5ErkJggg==", - "text/plain": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], - "source": [ - "def plot_velocity_profiles(avg_profile, rms_profile, std_profile, ax):\n", - " alt = avg_profile.index\n", - " mean = avg_profile.values.T\n", - " rms = rms_profile.values.T\n", - " std = std_profile.values.T\n", - "\n", - " ax.plot(mean[0], alt, '-x', label=avg_profile.columns[0])\n", - " ax.plot(mean[1], alt, '-x', label=avg_profile.columns[1])\n", - " ax.plot(mean[2], alt, '-x', label=avg_profile.columns[2])\n", - "\n", - " ax.fill_betweenx(alt, mean[0]-std[0], mean[0]+std[0], facecolor='lightblue')\n", - " ax.fill_betweenx(alt, mean[1]-std[1], mean[1]+std[1], facecolor='moccasin')\n", - " ax.fill_betweenx(alt, mean[2]-std[2], mean[2]+std[2], facecolor='palegreen')\n", - "\n", - " ax.plot(rms[0], alt, '+', color='C0')\n", - " ax.plot(rms[1], alt, '+', color='C1')\n", - " ax.plot(rms[2], alt, '+', color='C2')\n", - " ax.set(xlabel='Water Velocity [m/s]', ylabel='Altitude [m]', ylim=(0,10))\n", - " ax.legend()\n", - "\n", - "fig, ax = plt.subplots(1, 2, figsize=(10, 7))\n", - "plot_velocity_profiles(avg_profile_ebb, rms_profile_ebb, std_profile_ebb, ax[0])\n", - "ax[0].set_title('Ebb Tide')\n", - "plot_velocity_profiles(avg_profile_flood, rms_profile_flood, std_profile_flood, ax[1])\n", - "ax[1].set_title('Flood Tide')" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "### Current Energy Converter Efficiency\n", - "\n", - "The CEC efficiency, or device power coefficient, can be found using the `device_efficiency` method." 
- ] - }, - { - "cell_type": "code", - "execution_count": 13, - "metadata": {}, - "outputs": [], - "source": [ - "efficiency_ebb = performance.device_efficiency(\n", - " power=power_ebb,\n", - " velocity=ebb,\n", - " water_density=ds['water_density'],\n", - " capture_area=np.pi*1.5**2,\n", - " hub_height=4.2,\n", - " sampling_frequency=1,\n", - " window_avg_time=600)\n", - "efficiency_flood = performance.device_efficiency(\n", - " power=power_flood,\n", - " velocity=flood,\n", - " water_density=ds['water_density'],\n", - " capture_area=np.pi*1.5**2,\n", - " hub_height=4.2,\n", - " sampling_frequency=1,\n", - " window_avg_time=600)" - ] - }, - { - "attachments": {}, - "cell_type": "markdown", - "metadata": {}, - "source": [ - "And these efficiency curves can be plotted as profiles:" - ] - }, - { - "cell_type": "code", - "execution_count": 14, - "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "Text(0.5, 1.0, 'Flood Tide')" - ] - }, - "execution_count": 14, - "metadata": {}, - "output_type": "execute_result" - }, - { - "data": { - "image/png": "", - "text/plain": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], - "source": [ - "def plot_efficiency(efficiency, ax):\n", - " means = efficiency.U_avg.values.T\n", - " eta = efficiency.Efficiency.values.T\n", - " ax.plot(means, eta, '-o')\n", - " ax.set(xlabel=\"Hub Height Flow Velocity [m/s]\", ylabel='Efficiency [%]')\n", - "\n", - "fig, ax = plt.subplots(1, 2, figsize=(7, 6))\n", - "plot_efficiency(efficiency_ebb, ax[0])\n", - "ax[0].set_title('Ebb Tide')\n", - "plot_efficiency(efficiency_flood, ax[1])\n", - "ax[1].set_title('Flood Tide')" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [] - } - ], - "metadata": { - "kernelspec": { - "display_name": "base", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.9.15" - }, - "vscode": { - "interpreter": { - "hash": "357206ab7e4935423e95e994af80e27e7e6c0672abcebb9d86ab743298213348" - } - } + "cells": [ + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Tidal Power Performance Analysis\n", + "\n", + "The following example demonstrates a simple workflow for conducting the power performance analysis of a turbine, given turbine specifications, power data, and Acoustic Doppler Current Profiler (ADCP) water measurements.\n", + "\n", + "In this case, the turbine specifications can be broken down into\n", + " 1. Shape of the rotor's swept area\n", + " 2. Turbine rotor diameter/height and width\n", + " 3. Turbine hub height (center of swept area)\n", + "\n", + "Additional data needed:\n", + " - Power data from the current energy converter (CEC)\n", + " - 2-dimensional water velocity data\n", + "\n", + "In this jupyter notebook, we'll be covering the following three topics:\n", + " 1. 
CEC power-curve\n", + " 2. Velocity profiles\n", + " 3. CEC efficiency profile (or power coefficient profile)\n", + "\n", + "Start by importing the necessary tools:" + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "metadata": { + "scrolled": true + }, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "c:\\Users\\mcve343\\Anaconda3\\lib\\site-packages\\xarray\\backends\\cfgrib_.py:29: UserWarning: Failed to load cfgrib - most likely there is a problem accessing the ecCodes library. Try `import cfgrib` to get the full error message\n", + " warnings.warn(\n" + ] + } + ], + "source": [ + "import numpy as np\n", + "import matplotlib.pyplot as plt\n", + "\n", + "from mhkit.tidal import performance\n", + "from mhkit.dolfyn import load" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "In this case, we'll use ADCP data from the ADCP example notebook. I am importing a dataset from the ADCP example notebook. This data retains the original timestamps (1 Hz sampling frequency) and was rotated into the principal coordinate frame (streamwise-cross_stream-up)." + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": { + "scrolled": true + }, + "outputs": [], + "source": [ + "# Open processed ADCP dataset\n", + "ds = load(\"data/tidal/adcp.principal.a1.20200815.nc\")" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Next, since we don't have power data, we'll invent a mock timeseries based off the cube of water velocity, just to have something to work with." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": {}, + "outputs": [], + "source": [ + "# Streamwise and hub-height water velocity\n", + "streamwise_vel = ds[\"vel\"].sel(dir=\"streamwise\")\n", + "hub_height_vel = abs(streamwise_vel.isel(range=10))\n", + "\n", + "# Emulate power data\n", + "power = hub_height_vel**3 * 1e5\n", + "# Emulate cut-in speed by setting power at flow speeds below 0.5 m/s to 0 W\n", + "power = power.where(abs(streamwise_vel.mean(\"range\")) > 0.5, 0)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "The first step for any of the following calculations is to first split velocity into ebb and flood tide. You'll need some background information on the site to know which direction is positive and which is negative in the data." + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "metadata": {}, + "outputs": [], + "source": [ + "ebb = streamwise_vel.where(streamwise_vel > 0)\n", + "flood = streamwise_vel.where(streamwise_vel < 0)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "With the ebb and flood velocities, we can also divide the power data into that for ebb and flood tides." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": {}, + "outputs": [], + "source": [ + "# Make sure ebb and flood are on same timestamps\n", + "power = power.interp(time=streamwise_vel[\"time\"])\n", + "\n", + "power_ebb = power.where(~ebb.mean(\"range\").isnull(), 0)\n", + "power_flood = power.where(~flood.mean(\"range\").isnull(), 0)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Power-curve\n", + "\n", + "Now with power and velocity divided into ebb and flood tides, we can calculate the power curve for the CEC in both conditions\n" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": {}, + "outputs": [], + "source": [ + "power_curve_ebb = performance.power_curve(\n", + " power_ebb,\n", + " velocity=ebb,\n", + " hub_height=4.2,\n", + " doppler_cell_size=0.5,\n", + " sampling_frequency=1,\n", + " window_avg_time=600,\n", + " turbine_profile=\"circular\",\n", + " diameter=3,\n", + " height=None,\n", + " width=None,\n", + ")\n", + "power_curve_flood = performance.power_curve(\n", + " power_flood,\n", + " velocity=flood,\n", + " hub_height=4.2,\n", + " doppler_cell_size=0.5,\n", + " sampling_frequency=1,\n", + " window_avg_time=600,\n", + " turbine_profile=\"circular\",\n", + " diameter=3,\n", + " height=None,\n", + " width=None,\n", + ")" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
U_avgU_avg_power_weightedP_avgP_stdP_maxP_min
U_bins
(0.0, 0.1]0.0674590.0000000.0000000.0000000.0000000.000000
(0.1, 0.2]0.1156140.0000000.0000000.0000000.0000000.000000
(0.2, 0.3]0.2496760.2256390.0000000.0000000.0000000.000000
(0.3, 0.4]0.3396000.3155610.0000000.0000000.0000000.000000
(0.4, 0.5]0.4593930.4372492890.7249862660.8100225551.535008229.914964
(0.5, 0.6]0.5485070.53297419677.3435184645.89093624323.23445415031.452582
(0.6, 0.7]0.6714490.65536240369.4355173679.26013545506.30667737083.470337
(0.7, 0.8]0.7261890.70484552413.9720242856.73714257360.86147350670.102583
(0.8, 0.9]0.8439580.82591679944.0008559798.56967496206.92802566531.815452
(0.9, 1.0]0.9387010.920960103970.0421755828.263891112163.97743499100.055332
(1.0, 1.1]1.0466071.026293148511.10000818809.350864171583.550611124179.073981
(1.1, 1.2]1.1473481.127691200340.8205816299.518554209073.741656187772.752668
\n", + "
" + ], + "text/plain": [ + " U_avg U_avg_power_weighted P_avg P_std \\\n", + "U_bins \n", + "(0.0, 0.1] 0.067459 0.000000 0.000000 0.000000 \n", + "(0.1, 0.2] 0.115614 0.000000 0.000000 0.000000 \n", + "(0.2, 0.3] 0.249676 0.225639 0.000000 0.000000 \n", + "(0.3, 0.4] 0.339600 0.315561 0.000000 0.000000 \n", + "(0.4, 0.5] 0.459393 0.437249 2890.724986 2660.810022 \n", + "(0.5, 0.6] 0.548507 0.532974 19677.343518 4645.890936 \n", + "(0.6, 0.7] 0.671449 0.655362 40369.435517 3679.260135 \n", + "(0.7, 0.8] 0.726189 0.704845 52413.972024 2856.737142 \n", + "(0.8, 0.9] 0.843958 0.825916 79944.000855 9798.569674 \n", + "(0.9, 1.0] 0.938701 0.920960 103970.042175 5828.263891 \n", + "(1.0, 1.1] 1.046607 1.026293 148511.100008 18809.350864 \n", + "(1.1, 1.2] 1.147348 1.127691 200340.820581 6299.518554 \n", + "\n", + " P_max P_min \n", + "U_bins \n", + "(0.0, 0.1] 0.000000 0.000000 \n", + "(0.1, 0.2] 0.000000 0.000000 \n", + "(0.2, 0.3] 0.000000 0.000000 \n", + "(0.3, 0.4] 0.000000 0.000000 \n", + "(0.4, 0.5] 5551.535008 229.914964 \n", + "(0.5, 0.6] 24323.234454 15031.452582 \n", + "(0.6, 0.7] 45506.306677 37083.470337 \n", + "(0.7, 0.8] 57360.861473 50670.102583 \n", + "(0.8, 0.9] 96206.928025 66531.815452 \n", + "(0.9, 1.0] 112163.977434 99100.055332 \n", + "(1.0, 1.1] 171583.550611 124179.073981 \n", + "(1.1, 1.2] 209073.741656 187772.752668 " + ] + }, + "execution_count": 7, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "power_curve_flood" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Next we can plot the two power curves. A velocity bin is missing in the ebb tide power curve in this example because the data is so short, there are no samples for that bin." + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "def plot_power_curve(P_curve, ax):\n", + " ax.plot(P_curve[\"U_avg\"], P_curve[\"P_avg\"], \"-o\", color=\"C0\", label=\"Avg Power\")\n", + " ax.plot(\n", + " P_curve[\"U_avg\"],\n", + " (P_curve[\"P_avg\"] - P_curve[\"P_std\"]),\n", + " \"--+\",\n", + " color=\"C1\",\n", + " label=\"Power - 1 Std Dev\",\n", + " )\n", + " ax.plot(\n", + " P_curve[\"U_avg\"],\n", + " (P_curve[\"P_avg\"] + P_curve[\"P_std\"]),\n", + " \"-+\",\n", + " color=\"C1\",\n", + " label=\"Power + 1 Std Dev\",\n", + " )\n", + " ax.plot(P_curve[\"U_avg\"], P_curve[\"P_min\"], \"--x\", color=\"C2\", label=\"Min Power\")\n", + " ax.plot(P_curve[\"U_avg\"], P_curve[\"P_max\"], \"-x\", color=\"C2\", label=\"Max Power\")\n", + " ax.set(xlabel=\"Flow Speed at Hub Height [m/s]\", ylabel=\"Power [W]\")\n", + " ax.legend()\n", + "\n", + "\n", + "fig, ax = plt.subplots(1, 2, figsize=(10, 7))\n", + "plot_power_curve(power_curve_ebb, ax[0])\n", + "plot_power_curve(power_curve_flood, ax[1])" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Velocity Profiles\n", + "Various velocity profiles can be created next from the water velocity data, and we can do this again with ebb and flood tide. These functions follow three steps:\n", + " 1. Reshape the data into bins by time (ensembles)\n", + " 2. Apply a function to the ensembles to get ensemble statistics (mean, root-mean-square (RMS), or standard deviation)\n", + " 3. Regroup and bin the ensemble statistics by flow speed\n", + "\n", + "These profiles are created using the `velocity_profiles` method, and a profile is specified using the \"function\" argument. 
For the average velocity profiles, we'll set the function = 'mean'.\n" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "metadata": {}, + "outputs": [], + "source": [ + "avg_profile_ebb = performance.velocity_profiles(\n", + " velocity=ebb,\n", + " hub_height=4.2,\n", + " water_depth=10,\n", + " sampling_frequency=1,\n", + " window_avg_time=600,\n", + " function=\"mean\",\n", + ")\n", + "avg_profile_flood = performance.velocity_profiles(\n", + " velocity=flood,\n", + " hub_height=4.2,\n", + " water_depth=10,\n", + " sampling_frequency=1,\n", + " window_avg_time=600,\n", + " function=\"mean\",\n", + ")" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### RMS Tidal Velocity\n", + "\n", + "For RMS velocity profiles, we'll set the function = 'rms'." + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "metadata": {}, + "outputs": [], + "source": [ + "rms_profile_ebb = performance.velocity_profiles(\n", + " velocity=ebb,\n", + " hub_height=4.2,\n", + " water_depth=10,\n", + " sampling_frequency=1,\n", + " window_avg_time=600,\n", + " function=\"rms\",\n", + ")\n", + "rms_profile_flood = performance.velocity_profiles(\n", + " velocity=flood,\n", + " hub_height=4.2,\n", + " water_depth=10,\n", + " sampling_frequency=1,\n", + " window_avg_time=600,\n", + " function=\"rms\",\n", + ")" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Std Dev Tidal Velocity\n", + "\n", + "And to get the standard deviation, we'll set function = 'std'." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 11, + "metadata": {}, + "outputs": [], + "source": [ + "std_profile_ebb = performance.velocity_profiles(\n", + " velocity=ebb,\n", + " hub_height=4.2,\n", + " water_depth=10,\n", + " sampling_frequency=1,\n", + " window_avg_time=600,\n", + " function=\"std\",\n", + ")\n", + "std_profile_flood = performance.velocity_profiles(\n", + " velocity=flood,\n", + " hub_height=4.2,\n", + " water_depth=10,\n", + " sampling_frequency=1,\n", + " window_avg_time=600,\n", + " function=\"std\",\n", + ")" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Finally, we can plot these variables together based on ebb and flood tides. The following code plots the mean and RMS profiles as line plots with \"x\" and \"+\" markers, respectively, and shades the area between +/- 1 standard deviation from the mean." + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "Text(0.5, 1.0, 'Flood Tide')" + ] + }, + "execution_count": 12, + "metadata": {}, + "output_type": "execute_result" }, - "nbformat": 4, - "nbformat_minor": 4 + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "def plot_velocity_profiles(avg_profile, rms_profile, std_profile, ax):\n", + " alt = avg_profile.index\n", + " mean = avg_profile.values.T\n", + " rms = rms_profile.values.T\n", + " std = std_profile.values.T\n", + "\n", + " ax.plot(mean[0], alt, \"-x\", label=avg_profile.columns[0])\n", + " ax.plot(mean[1], alt, \"-x\", label=avg_profile.columns[1])\n", + " ax.plot(mean[2], alt, \"-x\", label=avg_profile.columns[2])\n", + "\n", + " ax.fill_betweenx(alt, mean[0] - std[0], mean[0] + std[0], facecolor=\"lightblue\")\n", + " ax.fill_betweenx(alt, mean[1] - std[1], mean[1] + std[1], facecolor=\"moccasin\")\n", + " ax.fill_betweenx(alt, mean[2] - std[2], mean[2] + std[2], facecolor=\"palegreen\")\n", + "\n", + " ax.plot(rms[0], alt, \"+\", color=\"C0\")\n", + " ax.plot(rms[1], alt, \"+\", color=\"C1\")\n", + " ax.plot(rms[2], alt, \"+\", color=\"C2\")\n", + " ax.set(xlabel=\"Water Velocity [m/s]\", ylabel=\"Altitude [m]\", ylim=(0, 10))\n", + " ax.legend()\n", + "\n", + "\n", + "fig, ax = plt.subplots(1, 2, figsize=(10, 7))\n", + "plot_velocity_profiles(avg_profile_ebb, rms_profile_ebb, std_profile_ebb, ax[0])\n", + "ax[0].set_title(\"Ebb Tide\")\n", + "plot_velocity_profiles(avg_profile_flood, rms_profile_flood, std_profile_flood, ax[1])\n", + "ax[1].set_title(\"Flood Tide\")" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Current Energy Converter Efficiency\n", + "\n", + "The CEC efficiency, or device power coefficient, can be found using the `device_efficiency` method." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 13, + "metadata": {}, + "outputs": [], + "source": [ + "efficiency_ebb = performance.device_efficiency(\n", + " power=power_ebb,\n", + " velocity=ebb,\n", + " water_density=ds[\"water_density\"],\n", + " capture_area=np.pi * 1.5**2,\n", + " hub_height=4.2,\n", + " sampling_frequency=1,\n", + " window_avg_time=600,\n", + ")\n", + "efficiency_flood = performance.device_efficiency(\n", + " power=power_flood,\n", + " velocity=flood,\n", + " water_density=ds[\"water_density\"],\n", + " capture_area=np.pi * 1.5**2,\n", + " hub_height=4.2,\n", + " sampling_frequency=1,\n", + " window_avg_time=600,\n", + ")" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "And these efficiency curves can be plotted as profiles:" + ] + }, + { + "cell_type": "code", + "execution_count": 14, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "Text(0.5, 1.0, 'Flood Tide')" + ] + }, + "execution_count": 14, + "metadata": {}, + "output_type": "execute_result" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "def plot_efficiency(efficiency, ax):\n", + " means = efficiency.U_avg.values.T\n", + " eta = efficiency.Efficiency.values.T\n", + " ax.plot(means, eta, \"-o\")\n", + " ax.set(xlabel=\"Hub Height Flow Velocity [m/s]\", ylabel=\"Efficiency [%]\")\n", + "\n", + "\n", + "fig, ax = plt.subplots(1, 2, figsize=(7, 6))\n", + "plot_efficiency(efficiency_ebb, ax[0])\n", + "ax[0].set_title(\"Ebb Tide\")\n", + "plot_efficiency(efficiency_flood, ax[1])\n", + "ax[1].set_title(\"Flood Tide\")" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [] + } + ], + "metadata": { + "kernelspec": { + "display_name": "base", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.9.15" + }, + "vscode": { + "interpreter": { + "hash": "357206ab7e4935423e95e994af80e27e7e6c0672abcebb9d86ab743298213348" + } + } + }, + "nbformat": 4, + "nbformat_minor": 4 } diff --git a/examples/upcrossing_example.ipynb b/examples/upcrossing_example.ipynb new file mode 100644 index 000000000..cbb67838a --- /dev/null +++ b/examples/upcrossing_example.ipynb @@ -0,0 +1,182 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# MHKit Upcrossing Analysis Example\n", + "\n", + "The following shows an example of using the upcrossing functionality in the [MHKiT Utils module](https://mhkit-software.github.io/MHKiT/mhkit-python/api.utils.html).\n", + "\n", + "This example performs an upcrossing analysis on a surface elevation trace to plot some quantities of interest. Such an upcrossing analysis could be applied to any time domain signal, such as a device response." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 1, + "metadata": {}, + "outputs": [], + "source": [ + "from mhkit.wave.resource import jonswap_spectrum, surface_elevation\n", + "from mhkit.utils import upcrossing, peaks, troughs, heights, periods\n", + "import numpy as np\n", + "import matplotlib.pyplot as plt" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Compute the surface elevation" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": {}, + "outputs": [], + "source": [ + "# Peak period and significant wave height\n", + "Tp = 10 # s\n", + "Hs = 2.5 # m\n", + "gamma = 3.3\n", + "\n", + "# Create frequency vector using a return period of 1hr\n", + "Tr = 3600 # s\n", + "df = 1.0 / Tr # Hz\n", + "f = np.arange(0, 1, df)\n", + "\n", + "# Calculate spectrum\n", + "spec = jonswap_spectrum(f, Tp, Hs, gamma)\n", + "\n", + "# Calculate surface elevation\n", + "fs = 10.0 # Hz\n", + "t = np.arange(0, Tr, 1 / fs)\n", + "\n", + "eta = surface_elevation(spec, t)" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "plt.figure()\n", + "plt.plot(t, eta)\n", + "plt.xlabel(\"t [s]\")\n", + "plt.ylabel(r\"$\\eta$ [m]\")\n", + "plt.title(f\"Surface elevation for Tp={Tp}s, Hs={Hs}m\")\n", + "plt.grid()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Plot the individual wave heights and periods" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "wave_heights = heights(t, eta.values.squeeze())\n", + "wave_periods = periods(t, eta.values.squeeze())\n", + "\n", + "plt.figure()\n", + "plt.plot(wave_periods, wave_heights, \"o\")\n", + "plt.xlabel(\"Zero crossing period [s]\")\n", + "plt.ylabel(\"Wave height [m]\")\n", + "plt.grid()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Plot the crest probability of exceedance distribution" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "crests = peaks(t, eta.values.squeeze())\n", + "crests_sorted = np.sort(crests)\n", + "\n", + "N = crests_sorted.size\n", + "\n", + "# Exceedance probability. Crests are in ascending order\n", + "# meaning the first element has P(exceedance) = 1, and\n", + "# the final element has P(exceedance) = 1 / N\n", + "Q = np.arange(N, 0, -1) / N\n", + "\n", + "plt.figure()\n", + "plt.semilogy(crests_sorted, Q, \"o\")\n", + "plt.xlabel(\"Crest height [m]\")\n", + "plt.ylabel(\"P(exceedance)\")\n", + "plt.grid()\n", + "plt.show()" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.9.17" + } + }, + "nbformat": 4, + "nbformat_minor": 2 +} diff --git a/examples/wave_example.ipynb b/examples/wave_example.ipynb index 728a0b526..02680f530 100644 --- a/examples/wave_example.ipynb +++ b/examples/wave_example.ipynb @@ -236,12 +236,12 @@ } ], "source": [ - "ndbc_data_file = 'data/wave/data.txt'\n", + "ndbc_data_file = \"data/wave/data.txt\"\n", "\n", "# ndbc.read_file outputs the NDBC file data into two variables.\n", - " # raw_ndbc_data is a pandas DataFrame containing the file data. \n", - " # meta contains the meta data, if available. 
\n", - "[raw_ndbc_data, meta] = wave.io.ndbc.read_file(ndbc_data_file) \n", + "# raw_ndbc_data is a pandas DataFrame containing the file data.\n", + "# meta contains the meta data, if available.\n", + "[raw_ndbc_data, meta] = wave.io.ndbc.read_file(ndbc_data_file)\n", "raw_ndbc_data.head()" ] }, @@ -487,7 +487,7 @@ ], "source": [ "# Transpose raw NDBC data\n", - "ndbc_data = raw_ndbc_data.T \n", + "ndbc_data = raw_ndbc_data.T\n", "ndbc_data.head()" ] }, @@ -568,8 +568,8 @@ } ], "source": [ - "# Compute the enegy periods from the NDBC spectra data \n", - "Te = wave.resource.energy_period(ndbc_data) \n", + "# Compute the enegy periods from the NDBC spectra data\n", + "Te = wave.resource.energy_period(ndbc_data)\n", "Te.head()" ] }, @@ -642,8 +642,8 @@ } ], "source": [ - "# Compute the significant wave height from the NDBC spectra data \n", - "Hm0 = wave.resource.significant_wave_height(ndbc_data) \n", + "# Compute the significant wave height from the NDBC spectra data\n", + "Hm0 = wave.resource.significant_wave_height(ndbc_data)\n", "Hm0.head()" ] }, @@ -717,11 +717,11 @@ ], "source": [ "# Set water depth to 60 m\n", - "h = 60 \n", + "h = 60\n", "\n", "# Compute the energy flux from the NDBC spectra data and water depth\n", - "J = wave.resource.energy_flux(ndbc_data,h) \n", - "J.head() " + "J = wave.resource.energy_flux(ndbc_data, h)\n", + "J.head()" ] }, { @@ -756,8 +756,8 @@ } ], "source": [ - "# Convert the energy period DataFrame to a Series. 
\n", - "Te = Te.squeeze() \n", + "# Convert the energy period DataFrame to a Series.\n", + "Te = Te.squeeze()\n", "Te.head()" ] }, @@ -799,10 +799,10 @@ ], "source": [ "# Alternatively, convert to Series by calling a specific column in the DataFrame\n", - "Hm0= Hm0['Hm0']\n", + "Hm0 = Hm0[\"Hm0\"]\n", "print(Hm0)\n", "\n", - "J = J['J'] \n", + "J = J[\"J\"]\n", "print(J)" ] }, @@ -822,9 +822,9 @@ "outputs": [], "source": [ "# Set the random seed, to reproduce results\n", - "np.random.seed(1) \n", + "np.random.seed(1)\n", "# Generate random power values\n", - "P = pd.Series(np.random.normal(200, 40, 743),index = J.index) " + "P = pd.Series(np.random.normal(200, 40, 743), index=J.index)" ] }, { @@ -1407,18 +1407,20 @@ ], "source": [ "# Calculate capture length\n", - "L = wave.performance.capture_length(P, J) \n", + "L = wave.performance.capture_length(P, J)\n", "\n", "# Generate bins for Hm0 and Te, input format (start, stop, step_size)\n", - "Hm0_bins = np.arange(0, Hm0.values.max() + .5, .5) \n", + "Hm0_bins = np.arange(0, Hm0.values.max() + 0.5, 0.5)\n", "Te_bins = np.arange(0, Te.values.max() + 1, 1)\n", "\n", "# Create capture length matrices using mean, standard deviation, count, min and max statistics\n", - "LM_mean = wave.performance.capture_length_matrix(Hm0, Te, L, 'mean', Hm0_bins, Te_bins)\n", - "LM_std = wave.performance.capture_length_matrix(Hm0, Te, L, 'std', Hm0_bins, Te_bins)\n", - "LM_count = wave.performance.capture_length_matrix(Hm0, Te, L, 'count', Hm0_bins, Te_bins)\n", - "LM_min = wave.performance.capture_length_matrix(Hm0, Te, L, 'min', Hm0_bins, Te_bins)\n", - "LM_max = wave.performance.capture_length_matrix(Hm0, Te, L, 'max', Hm0_bins, Te_bins)\n", + "LM_mean = wave.performance.capture_length_matrix(Hm0, Te, L, \"mean\", Hm0_bins, Te_bins)\n", + "LM_std = wave.performance.capture_length_matrix(Hm0, Te, L, \"std\", Hm0_bins, Te_bins)\n", + "LM_count = wave.performance.capture_length_matrix(\n", + " Hm0, Te, L, \"count\", Hm0_bins, Te_bins\n", 
+ ")\n", + "LM_min = wave.performance.capture_length_matrix(Hm0, Te, L, \"min\", Hm0_bins, Te_bins)\n", + "LM_max = wave.performance.capture_length_matrix(Hm0, Te, L, \"max\", Hm0_bins, Te_bins)\n", "\n", "# Show mean capture length matrix\n", "LM_mean" @@ -2002,7 +2004,9 @@ ], "source": [ "# Create capture length matrices using frequency\n", - "LM_freq = wave.performance.capture_length_matrix(Hm0, Te, L,'frequency', Hm0_bins, Te_bins)\n", + "LM_freq = wave.performance.capture_length_matrix(\n", + " Hm0, Te, L, \"frequency\", Hm0_bins, Te_bins\n", + ")\n", "\n", "# Show capture length matrix using frequency\n", "LM_freq" @@ -2022,7 +2026,9 @@ "outputs": [], "source": [ "# Demonstration of arbitrary matrix generator\n", - "PM_mean_not_standard = wave.performance.capture_length_matrix(Hm0, Te, P, 'mean', Hm0_bins, Te_bins)" + "PM_mean_not_standard = wave.performance.capture_length_matrix(\n", + " Hm0, Te, P, \"mean\", Hm0_bins, Te_bins\n", + ")" ] }, { @@ -2041,7 +2047,9 @@ "outputs": [], "source": [ "# Demonstration of passing a callable function to the matrix generator\n", - "LM_variance = wave.performance.capture_length_matrix(Hm0, Te, L, np.var, Hm0_bins, Te_bins)" + "LM_variance = wave.performance.capture_length_matrix(\n", + " Hm0, Te, L, np.var, Hm0_bins, Te_bins\n", + ")" ] }, { @@ -2599,7 +2607,7 @@ ], "source": [ "# Create wave energy flux matrix using mean\n", - "JM = wave.performance.wave_energy_flux_matrix(Hm0, Te, J, 'mean', Hm0_bins, Te_bins)\n", + "JM = wave.performance.wave_energy_flux_matrix(Hm0, Te, J, \"mean\", Hm0_bins, Te_bins)\n", "\n", "# Create power matrix using mean\n", "PM_mean = wave.performance.power_matrix(LM_mean, JM)\n", @@ -2639,7 +2647,9 @@ "print(\"MAEP from timeseries = \", maep_timeseries)\n", "\n", "# Calcaulte maep from matrix\n", - "maep_matrix = wave.performance.mean_annual_energy_production_matrix(LM_mean, JM, LM_freq)\n", + "maep_matrix = wave.performance.mean_annual_energy_production_matrix(\n", + " LM_mean, JM, 
LM_freq\n", + ")\n", "print(\"MAEP from matrices = \", maep_matrix)" ] }, @@ -2671,7 +2681,7 @@ ], "source": [ "# Plot the capture length mean matrix\n", - "ax = wave.graphics.plot_matrix(LM_mean) " + "ax = wave.graphics.plot_matrix(LM_mean)" ] }, { @@ -2715,10 +2725,17 @@ "source": [ "# Customize the matrix plot\n", "import matplotlib.pylab as plt\n", - "plt.figure(figsize=(6,6))\n", + "\n", + "plt.figure(figsize=(6, 6))\n", "ax = plt.gca()\n", - "wave.graphics.plot_matrix(PM_mean, xlabel='Te (s)', ylabel='Hm0 (m)', \\\n", - " zlabel='Mean Power (kW)', show_values=False, ax=ax)" + "wave.graphics.plot_matrix(\n", + " PM_mean,\n", + " xlabel=\"Te (s)\",\n", + " ylabel=\"Hm0 (m)\",\n", + " zlabel=\"Mean Power (kW)\",\n", + " show_values=False,\n", + " ax=ax,\n", + ")" ] } ], diff --git a/examples/wecsim_example.ipynb b/examples/wecsim_example.ipynb index 4106fb52f..3dceda943 100644 --- a/examples/wecsim_example.ipynb +++ b/examples/wecsim_example.ipynb @@ -26,7 +26,7 @@ "metadata": {}, "outputs": [], "source": [ - "from mhkit import wave\n", + "from mhkit import wave\n", "import scipy.io as sio\n", "import matplotlib.pyplot as plt" ] @@ -59,7 +59,7 @@ ], "source": [ "# Relative location and filename of simulated WEC-Sim data (run with mooring)\n", - "filename = './data/wave/RM3MooringMatrix_matlabWorkspace_structure.mat' \n", + "filename = \"./data/wave/RM3MooringMatrix_matlabWorkspace_structure.mat\"\n", "\n", "# Load data using the `wecsim.read_output` function which returns a dictionary of dataFrames\n", "wecsim_data = wave.io.wecsim.read_output(filename)" @@ -226,13 +226,13 @@ ], "source": [ "# Store WEC-Sim output from the Wave Class to a new dataFrame, called `wave_data`\n", - "wave_data = wecsim_data['wave']\n", + "wave_data = wecsim_data[\"wave\"]\n", "\n", "# Display the wave type from the WEC-Sim Wave Class\n", "wave_type = wave_data.name\n", "print(\"WEC-Sim wave type:\", wave_type)\n", "\n", - "# View the WEC-Sim output dataFrame for the Wave Class \n", + 
"# View the WEC-Sim output dataFrame for the Wave Class\n", "wave_data" ] }, @@ -313,8 +313,8 @@ } ], "source": [ - "# Store WEC-Sim output from the Body Class to a new dictionary of dataFrames, i.e. 'bodies'. \n", - "bodies = wecsim_data['bodies']\n", + "# Store WEC-Sim output from the Body Class to a new dictionary of dataFrames, i.e. 'bodies'.\n", + "bodies = wecsim_data[\"bodies\"]\n", "\n", "# Data fron each body is stored as its own dataFrame, i.e. 'body1' and 'body2'.\n", "bodies.keys()" @@ -343,8 +343,8 @@ } ], "source": [ - "# Store Body Class dataFrame for Body 1 as `body1`. \n", - "body1 = bodies['body1']\n", + "# Store Body Class dataFrame for Body 1 as `body1`.\n", + "body1 = bodies[\"body1\"]\n", "\n", "# Display the name of Body 1 from the WEC-Sim Body Class\n", "print(\"Name of Body 1:\", body1.name)" @@ -384,7 +384,7 @@ ], "source": [ "# Print a list of Body 1 columns that end with 'dof1'\n", - "[col for col in body1 if col.endswith('dof1')]" + "[col for col in body1 if col.endswith(\"dof1\")]" ] }, { @@ -427,11 +427,11 @@ "body1.position_dof3.plot()\n", "plt.xlabel(\"Time [s]\")\n", "plt.ylabel(\"Heave Position [m]\")\n", - "plt.title('Body 1')\n", + "plt.title(\"Body 1\")\n", "\n", - "# Use Pandas to calculate the maximum and minimum heave position of Body 1 \n", - "print(\"Body 1 max heave position =\", body1.position_dof3.max(),\"[m]\")\n", - "print(\"Body 1 min heave position =\", body1.position_dof3.min(),\"[m]\")" + "# Use Pandas to calculate the maximum and minimum heave position of Body 1\n", + "print(\"Body 1 max heave position =\", body1.position_dof3.max(), \"[m]\")\n", + "print(\"Body 1 min heave position =\", body1.position_dof3.min(), \"[m]\")" ] }, { @@ -472,14 +472,14 @@ ], "source": [ "# Create a list of Body 1 data columns that start with 'position'\n", - "filter_col = [col for col in body1 if col.startswith('position')]\n", + "filter_col = [col for col in body1 if col.startswith(\"position\")]\n", "\n", "# Plot filtered 
'position' data for Body 1\n", "body1[filter_col].plot()\n", - "plt.xlabel('Time [s]')\n", - "plt.ylabel('Position [m or rad]')\n", - "plt.title('Body 1')\n", - "plt.legend(loc='center left', bbox_to_anchor=(1, 0.5))" + "plt.xlabel(\"Time [s]\")\n", + "plt.ylabel(\"Position [m or rad]\")\n", + "plt.title(\"Body 1\")\n", + "plt.legend(loc=\"center left\", bbox_to_anchor=(1, 0.5))" ] }, { @@ -763,8 +763,8 @@ } ], "source": [ - "# Store Body Class dataFrame for Body 2 as `body2` \n", - "body2 = bodies['body2']\n", + "# Store Body Class dataFrame for Body 2 as `body2`\n", + "body2 = bodies[\"body2\"]\n", "\n", "# Display the name of Body 2 from the WEC-Sim Body Class\n", "print(\"Name of Body 2:\", body2.name)\n", @@ -814,13 +814,13 @@ ], "source": [ "# Store WEC-Sim output from the PTO Class to a DataFrame, called `ptos`\n", - "ptos = wecsim_data['ptos']\n", + "ptos = wecsim_data[\"ptos\"]\n", "\n", "# Display the name of the PTO from the WEC-Sim PTO Class\n", "print(\"Name of PTO:\", ptos.name)\n", "\n", "# Print a list of available columns that end with 'dof1'\n", - "[col for col in ptos if col.endswith('dof1')]" + "[col for col in ptos if col.endswith(\"dof1\")]" ] }, { @@ -854,10 +854,10 @@ "source": [ "# Use Pandas to plot pto internal power in heave (DOF 3)\n", "# NOTE: WEC-Sim requires a negative sign to convert internal power to generated power\n", - "(-1*ptos.powerInternalMechanics_dof3/1000).plot()\n", + "(-1 * ptos.powerInternalMechanics_dof3 / 1000).plot()\n", "plt.xlabel(\"Time [s]\")\n", "plt.ylabel(\"Power Generated [kW]\")\n", - "plt.title('PTO')" + "plt.title(\"PTO\")" ] }, { @@ -1133,7 +1133,7 @@ ], "source": [ "# Store WEC-Sim output from the Constraint Class to a new dataFrame, called `constraints`\n", - "constraints = wecsim_data['constraints']\n", + "constraints = wecsim_data[\"constraints\"]\n", "\n", "# Display the name of the Constraint from the WEC-Sim Constraint Class\n", "print(\"Name of Constraint:\", constraints.name)\n", @@ -1376,7 
+1376,7 @@ ], "source": [ "# Store WEC-Sim output from the Mooring Class to a new dataFrame, called `mooring`\n", - "mooring = wecsim_data['mooring']\n", + "mooring = wecsim_data[\"mooring\"]\n", "\n", "# View the PTO Class dataFrame\n", "mooring.head()" @@ -1411,8 +1411,8 @@ ], "source": [ "# Use the MHKiT Wave Module to calculate the wave spectrum from the WEC-Sim Wave Class Data\n", - "sample_rate=60\n", - "nnft=1000 # Number of bins in the Fast Fourier Transform\n", + "sample_rate = 60\n", + "nnft = 1000 # Number of bins in the Fast Fourier Transform\n", "ws_spectrum = wave.resource.elevation_spectrum(wave_data, sample_rate, nnft)\n", "\n", "# Plot calculated wave spectrum\n", @@ -1514,7 +1514,7 @@ "Hm0 = wave.resource.significant_wave_height(ws_spectrum)\n", "\n", "# Display calculated Peak Wave Period (Tp) and Significant Wave Height (Hm0)\n", - "display(Tp,Hm0)" + "display(Tp, Hm0)" ] } ], diff --git a/figures/logo.png b/logo.png similarity index 100% rename from figures/logo.png rename to logo.png diff --git a/mhkit/__init__.py b/mhkit/__init__.py index 49c1b44b9..05a04dcf1 100644 --- a/mhkit/__init__.py +++ b/mhkit/__init__.py @@ -11,12 +11,13 @@ # Register datetime converter for a matplotlib plotting methods from pandas.plotting import register_matplotlib_converters as _rmc + _rmc() # Ignore future warnings -_warn.simplefilter(action='ignore', category=FutureWarning) +_warn.simplefilter(action="ignore", category=FutureWarning) -__version__ = 'v0.7.0' +__version__ = "v0.7.0" __copyright__ = """ Copyright 2019, Alliance for Sustainable Energy, LLC under the terms of diff --git a/mhkit/dolfyn/__init__.py b/mhkit/dolfyn/__init__.py index 307a6932f..cb459e50f 100644 --- a/mhkit/dolfyn/__init__.py +++ b/mhkit/dolfyn/__init__.py @@ -1,5 +1,10 @@ from mhkit.dolfyn.io.api import read, read_example, save, load, save_mat, load_mat -from mhkit.dolfyn.rotate.api import rotate2, calc_principal_heading, set_declination, set_inst2head_rotmat +from mhkit.dolfyn.rotate.api 
import ( + rotate2, + calc_principal_heading, + set_declination, + set_inst2head_rotmat, +) from .rotate.base import euler2orient, orient2euler, quaternion2orient from .velocity import VelBinner from mhkit.dolfyn import adv diff --git a/mhkit/dolfyn/adp/__init__.py b/mhkit/dolfyn/adp/__init__.py index f1d1e0517..4dc7607ef 100644 --- a/mhkit/dolfyn/adp/__init__.py +++ b/mhkit/dolfyn/adp/__init__.py @@ -1,2 +1 @@ from . import api - diff --git a/mhkit/dolfyn/adp/clean.py b/mhkit/dolfyn/adp/clean.py index f4cc896b0..e89124d11 100644 --- a/mhkit/dolfyn/adp/clean.py +++ b/mhkit/dolfyn/adp/clean.py @@ -1,5 +1,6 @@ """Module containing functions to clean data """ + import numpy as np import xarray as xr from scipy.signal import medfilt @@ -40,15 +41,15 @@ def set_range_offset(ds, h_deploy): the surface and downward-facing ADCP's transducers. """ - r = [s for s in ds.dims if 'range' in s] + r = [s for s in ds.dims if "range" in s] for val in r: ds[val] = ds[val].values + h_deploy - ds[val].attrs['units'] = 'm' + ds[val].attrs["units"] = "m" - if hasattr(ds, 'h_deploy'): - ds.attrs['h_deploy'] += h_deploy + if hasattr(ds, "h_deploy"): + ds.attrs["h_deploy"] += h_deploy else: - ds.attrs['h_deploy'] = h_deploy + ds.attrs["h_deploy"] = h_deploy def find_surface(ds, thresh=10, nfilt=None): @@ -78,9 +79,13 @@ def find_surface(ds, thresh=10, nfilt=None): # This finds the first point that increases (away from the profiler) in # the echo profile edf = np.diff(ds.amp.values.astype(np.int16), axis=1) - inds2 = np.max((edf < 0) * - np.arange(ds.vel.shape[1] - 1, - dtype=np.uint8)[None, :, None], axis=1) + 1 + inds2 = ( + np.max( + (edf < 0) * np.arange(ds.vel.shape[1] - 1, dtype=np.uint8)[None, :, None], + axis=1, + ) + + 1 + ) # Calculate the depth of these quantities d1 = ds.range.values[inds] @@ -101,12 +106,17 @@ def find_surface(ds, thresh=10, nfilt=None): dfilt[dfilt == 0] = np.NaN d = dfilt - ds['depth'] = xr.DataArray(d.astype('float32'), - dims=['time'], - attrs={'units': 
'm', - 'long_name': 'Depth', - 'standard_name': 'depth', - 'positive': 'down'}) + ds["depth"] = xr.DataArray( + d.astype("float32"), + dims=["time"], + attrs={ + "units": "m", + "long_name": "Depth", + "standard_name": "depth", + "positive": "down", + }, + ) + def find_surface_from_P(ds, salinity=35): """ @@ -137,9 +147,9 @@ def find_surface_from_P(ds, salinity=35): .. math:: \\rho - \\rho_0 = -\\alpha (T-T_0) + \\beta (S-S_0) + \\kappa P Where :math:`\\rho` is water density, :math:`T` is water temperature, - :math:`P` is water pressure, :math:`S` is practical salinity, - :math:`\\alpha` is the thermal expansion coefficient, :math:`\\beta` is - the haline contraction coefficient, and :math:`\\kappa` is adiabatic + :math:`P` is water pressure, :math:`S` is practical salinity, + :math:`\\alpha` is the thermal expansion coefficient, :math:`\\beta` is + the haline contraction coefficient, and :math:`\\kappa` is adiabatic compressibility. """ @@ -153,31 +163,37 @@ def find_surface_from_P(ds, salinity=35): a = 0.15 # thermal expansion coefficient, kg/m^3/degC b = 0.78 # haline contraction coefficient, kg/m^3/ppt k = 4.5e-3 # adiabatic compressibility, kg/m^3/dbar - rho = rho0 - a*(T-T0) + b*(S-S0) + k*P + rho = rho0 - a * (T - T0) + b * (S - S0) + k * P # Depth = pressure (conversion from dbar to MPa) / water weight - d = (ds.pressure*10000)/(9.81*rho) + d = (ds.pressure * 10000) / (9.81 * rho) - if hasattr(ds, 'h_deploy'): + if hasattr(ds, "h_deploy"): d += ds.h_deploy description = "Depth to Seafloor" else: description = "Depth to Instrument" - ds['water_density'] = xr.DataArray( - rho.astype('float32'), - dims=['time'], - attrs={'units': 'kg m-3', - 'long_name': 'Water Density', - 'standard_name': 'sea_water_density', - 'description': 'Water density from linear approximation of sea water equation of state'}) - ds['depth'] = xr.DataArray( - d.astype('float32'), - dims=['time'], - attrs={'units': 'm', - 'long_name': description, - 'standard_name': 'depth', - 'positive': 
'down'}) + ds["water_density"] = xr.DataArray( + rho.astype("float32"), + dims=["time"], + attrs={ + "units": "kg m-3", + "long_name": "Water Density", + "standard_name": "sea_water_density", + "description": "Water density from linear approximation of sea water equation of state", + }, + ) + ds["depth"] = xr.DataArray( + d.astype("float32"), + dims=["time"], + attrs={ + "units": "m", + "long_name": description, + "standard_name": "depth", + "positive": "down", + }, + ) def nan_beyond_surface(ds, val=np.nan, beam_angle=None, inplace=False): @@ -204,7 +220,7 @@ def nan_beyond_surface(ds, val=np.nan, beam_angle=None, inplace=False): Notes ----- - Surface interference expected to happen at + Surface interference expected to happen at `distance > range * cos(beam angle) - cell size` """ @@ -212,29 +228,32 @@ def nan_beyond_surface(ds, val=np.nan, beam_angle=None, inplace=False): ds = ds.copy(deep=True) # Get all variables with 'range' coordinate - var = [h for h in ds.keys() if any(s for s in ds[h].dims if 'range' in s)] + var = [h for h in ds.keys() if any(s for s in ds[h].dims if "range" in s)] if beam_angle is None: - if hasattr(ds, 'beam_angle'): - beam_angle = ds.beam_angle * (np.pi/180) + if hasattr(ds, "beam_angle"): + beam_angle = ds.beam_angle * (np.pi / 180) else: - raise Exception("'beam_angle` not found in dataset attributes. "\ - "Please supply the ADCP's beam angle.") + raise Exception( + "'beam_angle` not found in dataset attributes. " + "Please supply the ADCP's beam angle." 
+ ) # Surface interference distance calculated from distance of transducers to surface - if hasattr(ds, 'h_deploy'): - range_limit = ((ds.depth-ds.h_deploy) * np.cos(beam_angle) - - ds.cell_size) + ds.h_deploy + if hasattr(ds, "h_deploy"): + range_limit = ( + (ds.depth - ds.h_deploy) * np.cos(beam_angle) - ds.cell_size + ) + ds.h_deploy else: range_limit = ds.depth * np.cos(beam_angle) - ds.cell_size bds = ds.range > range_limit # Echosounder data needs only be trimmed at water surface - if 'echo' in var: + if "echo" in var: bds_echo = ds.range_echo > ds.depth - ds['echo'].values[..., bds_echo] = val - var.remove('echo') + ds["echo"].values[..., bds_echo] = val + var.remove("echo") # Correct rest of "range" data for surface interference for nm in var: @@ -251,7 +270,7 @@ def nan_beyond_surface(ds, val=np.nan, beam_angle=None, inplace=False): def correlation_filter(ds, thresh=50, inplace=False): """ - Filters out data where correlation is below a threshold in the + Filters out data where correlation is below a threshold in the along-beam correlation data. 
Parameters @@ -268,7 +287,7 @@ def correlation_filter(ds, thresh=50, inplace=False): Returns ------- ds : xarray.Dataset - Elements in velocity, correlation, and amplitude are removed if below the + Elements in velocity, correlation, and amplitude are removed if below the correlation threshold Notes @@ -280,27 +299,30 @@ def correlation_filter(ds, thresh=50, inplace=False): ds = ds.copy(deep=True) # 4 or 5 beam - if hasattr(ds, 'vel_b5'): - tag = ['', '_b5'] + if hasattr(ds, "vel_b5"): + tag = ["", "_b5"] else: - tag = [''] + tag = [""] # copy original ref frame coord_sys_orig = ds.coord_sys # correlation is always in beam coordinates - rotate2(ds, 'beam', inplace=True) + rotate2(ds, "beam", inplace=True) # correlation is always in beam coordinates for tg in tag: - mask = ds['corr'+tg].values <= thresh + mask = ds["corr" + tg].values <= thresh - for var in ['vel', 'corr', 'amp']: + for var in ["vel", "corr", "amp"]: try: - ds[var+tg].values[mask] = np.nan + ds[var + tg].values[mask] = np.nan except: - ds[var+tg].values[mask] = 0 - ds[var+tg].attrs['Comments'] = 'Filtered of data with a correlation value below ' + \ - str(thresh) + ds.corr.units + ds[var + tg].values[mask] = 0 + ds[var + tg].attrs["Comments"] = ( + "Filtered of data with a correlation value below " + + str(thresh) + + ds.corr.units + ) rotate2(ds, coord_sys_orig, inplace=True) @@ -332,22 +354,22 @@ def medfilt_orient(ds, nfilt=7): ds = ds.copy(deep=True) - if getattr(ds, 'has_imu'): + if getattr(ds, "has_imu"): q_filt = np.zeros(ds.quaternions.shape) for i in range(ds.quaternions.q.size): q_filt[i] = medfilt(ds.quaternions[i].values, nfilt) ds.quaternions.values = q_filt - ds['orientmat'] = quaternion2orient(ds.quaternions) + ds["orientmat"] = quaternion2orient(ds.quaternions) return ds else: # non Nortek AHRS-equipped instruments - do_these = ['pitch', 'roll', 'heading'] + do_these = ["pitch", "roll", "heading"] for nm in do_these: ds[nm].values = medfilt(ds[nm].values, nfilt) - return 
ds.drop_vars('orientmat') + return ds.drop_vars("orientmat") def val_exceeds_thresh(var, thresh=5, val=np.nan): @@ -373,15 +395,15 @@ def val_exceeds_thresh(var, thresh=5, val=np.nan): var = var.copy(deep=True) - bd = np.zeros(var.shape, dtype='bool') - bd |= (np.abs(var.values) > thresh) + bd = np.zeros(var.shape, dtype="bool") + bd |= np.abs(var.values) > thresh var.values[bd] = val return var -def fillgaps_time(var, method='cubic', maxgap=None): +def fillgaps_time(var, method="cubic", maxgap=None): """ Fill gaps (nan values) in var across time using the specified method @@ -404,14 +426,14 @@ def fillgaps_time(var, method='cubic', maxgap=None): xarray.DataArray.interpolate_na() """ - time_dim = [t for t in var.dims if 'time' in t][0] + time_dim = [t for t in var.dims if "time" in t][0] - return var.interpolate_na(dim=time_dim, method=method, - use_coordinate=True, - limit=maxgap) + return var.interpolate_na( + dim=time_dim, method=method, use_coordinate=True, limit=maxgap + ) -def fillgaps_depth(var, method='cubic', maxgap=None): +def fillgaps_depth(var, method="cubic", maxgap=None): """ Fill gaps (nan values) in var along the depth profile using the specified method @@ -434,8 +456,8 @@ def fillgaps_depth(var, method='cubic', maxgap=None): xarray.DataArray.interpolate_na() """ - range_dim = [t for t in var.dims if 'range' in t][0] + range_dim = [t for t in var.dims if "range" in t][0] - return var.interpolate_na(dim=range_dim, method=method, - use_coordinate=False, - limit=maxgap) + return var.interpolate_na( + dim=range_dim, method=method, use_coordinate=False, limit=maxgap + ) diff --git a/mhkit/dolfyn/adp/turbulence.py b/mhkit/dolfyn/adp/turbulence.py index 72c4704ae..d85f365ab 100644 --- a/mhkit/dolfyn/adp/turbulence.py +++ b/mhkit/dolfyn/adp/turbulence.py @@ -16,7 +16,7 @@ def _diffz_first(dat, z): 1 dimensional vector to be differentiated z : array-like Vertical dimension to differentiate across - + Returns ------- out : array-like @@ -36,7 +36,7 @@ def 
_diffz_centered(dat, z): 1 dimensional vector to be differentiated z : array-like Vertical dimension to differentiate across - + Returns ------- out : array-like @@ -48,7 +48,7 @@ def _diffz_centered(dat, z): Can use 2*np.diff b/c depth bin size never changes """ - return (dat[2:]-dat[:-2]) / (2*np.diff(z)[1:, None]) + return (dat[2:] - dat[:-2]) / (2 * np.diff(z)[1:, None]) def _diffz_centered_extended(dat, z): @@ -61,7 +61,7 @@ def _diffz_centered_extended(dat, z): 1 dimensional vector to be differentiated z : array-like Vertical dimension to differentiate across - + Returns ------- out : array-like @@ -70,19 +70,31 @@ def _diffz_centered_extended(dat, z): Notes ----- Top - bottom centered difference with endpoints determined - with a first difference. Ensures the output array is the + with a first difference. Ensures the output array is the same size as the input array. """ - out = np.concatenate((_diffz_first(dat[:2], z[:2]), - _diffz_centered(dat, z), - _diffz_first(dat[-2:], z[-2:]))) + out = np.concatenate( + ( + _diffz_first(dat[:2], z[:2]), + _diffz_centered(dat, z), + _diffz_first(dat[-2:], z[-2:]), + ) + ) return out class ADPBinner(VelBinner): - def __init__(self, n_bin, fs, n_fft=None, n_fft_coh=None, - noise=None, orientation='up', diff_style='centered_extended'): + def __init__( + self, + n_bin, + fs, + n_fft=None, + n_fft_coh=None, + noise=None, + orientation="up", + diff_style="centered_extended", + ): """ A class for calculating turbulence statistics from ADCP data @@ -99,12 +111,14 @@ def __init__(self, n_bin, fs, n_fft=None, n_fft_coh=None, n_fft_coh : int Number of data points to use for coherence and cross-spectra ffts Default: `n_fft_coh`=`n_fft` - noise : float, list or numpy.ndarray - Instrument's doppler noise in same units as velocity + noise : float or array-like + Instrument noise level in same units as velocity. Typically + found from `adp.turbulence.doppler_noise_level`. + Default: None. 
orientation : str, default='up' Instrument's orientation, either 'up' or 'down' diff_style : str, default='centered_extended' - Style of numerical differentiation using Newton's Method. + Style of numerical differentiation using Newton's Method. Either 'first' (first difference), 'centered' (centered difference), or 'centered_extended' (centered difference with first and last points extended using a first difference). @@ -115,11 +129,11 @@ def __init__(self, n_bin, fs, n_fft=None, n_fft_coh=None, self.orientation = orientation def _diff_func(self, vel, u): - """ Applies the chosen style of numerical differentiation to velocity data. + """Applies the chosen style of numerical differentiation to velocity data. - This method calculates the derivative of the velocity data 'vel' with respect to the 'range' - using the differentiation style specified in 'self.diff_style'. The styles can be 'first' - for first difference, 'centered' for centered difference, and 'centered_extended' for + This method calculates the derivative of the velocity data 'vel' with respect to the 'range' + using the differentiation style specified in 'self.diff_style'. The styles can be 'first' + for first difference, 'centered' for centered difference, and 'centered_extended' for centered difference with first and last points extended using a first difference. Parameters @@ -135,14 +149,14 @@ def _diff_func(self, vel, u): The calculated derivative of the velocity data. 
""" - if self.diff_style == 'first': - out = _diffz_first(vel[u].values, vel['range'].values) + if self.diff_style == "first": + out = _diffz_first(vel[u].values, vel["range"].values) return out, vel.range[1:] - elif self.diff_style == 'centered': - out = _diffz_centered(vel[u].values, vel['range'].values) + elif self.diff_style == "centered": + out = _diffz_centered(vel[u].values, vel["range"].values) return out, vel.range[1:-1] - elif self.diff_style == 'centered_extended': - out = _diffz_centered_extended(vel[u].values, vel['range'].values) + elif self.diff_style == "centered_extended": + out = _diffz_centered_extended(vel[u].values, vel["range"].values) return out, vel.range def dudz(self, vel, orientation=None): @@ -171,16 +185,16 @@ def dudz(self, vel, orientation=None): if not orientation: orientation = self.orientation sign = 1 - if orientation == 'down': + if orientation == "down": sign *= -1 - dudz, rng = sign*self._diff_func(vel, 0) - return xr.DataArray(dudz, - coords=[rng, vel.time], - dims=['range', 'time'], - attrs={'units': 's-1', - 'long_name': 'Shear in X-direction'} - ) + dudz, rng = sign * self._diff_func(vel, 0) + return xr.DataArray( + dudz, + coords=[rng, vel.time], + dims=["range", "time"], + attrs={"units": "s-1", "long_name": "Shear in X-direction"}, + ) def dvdz(self, vel): """ @@ -204,12 +218,12 @@ def dvdz(self, vel): """ dvdz, rng = self._diff_func(vel, 1) - return xr.DataArray(dvdz, - coords=[rng, vel.time], - dims=['range', 'time'], - attrs={'units': 's-1', - 'long_name': 'Shear in Y-direction'} - ) + return xr.DataArray( + dvdz, + coords=[rng, vel.time], + dims=["range", "time"], + attrs={"units": "s-1", "long_name": "Shear in Y-direction"}, + ) def dwdz(self, vel): """ @@ -233,12 +247,12 @@ def dwdz(self, vel): """ dwdz, rng = self._diff_func(vel, 2) - return xr.DataArray(dwdz, - coords=[rng, vel.time], - dims=['range', 'time'], - attrs={'units': 's-1', - 'long_name': 'Shear in Z-direction'} - ) + return xr.DataArray( + dwdz, + 
coords=[rng, vel.time], + dims=["range", "time"], + attrs={"units": "s-1", "long_name": "Shear in Z-direction"}, + ) def shear_squared(self, vel): """ @@ -266,8 +280,8 @@ def shear_squared(self, vel): """ shear2 = self.dudz(vel) ** 2 + self.dvdz(vel) ** 2 - shear2.attrs['units'] = 's-2' - shear2.attrs['long_name'] = 'Horizontal Shear Squared' + shear2.attrs["units"] = "s-2" + shear2.attrs["long_name"] = "Horizontal Shear Squared" return shear2 @@ -286,7 +300,7 @@ def doppler_noise_level(self, psd, pct_fN=0.8): Returns ------- - doppler_noise (xarray.DataArray): + doppler_noise (xarray.DataArray): Doppler noise level in units of m/s Notes @@ -299,19 +313,19 @@ def doppler_noise_level(self, psd, pct_fN=0.8): `N` is the constant variance or spectral density, and `f_{c}` is the characteristic frequency. - The characteristic frequency is then found as + The characteristic frequency is then found as .. :math: f_{c} = pct_fN * (f_{s}/2) where `f_{s}/2` is the Nyquist frequency. - Richard, Jean-Baptiste, et al. "Method for identification of Doppler noise - levels in turbulent flow measurements dedicated to tidal energy." International + Richard, Jean-Baptiste, et al. "Method for identification of Doppler noise + levels in turbulent flow measurements dedicated to tidal energy." International Journal of Marine Energy 3 (2013): 52-64. - Thiébaut, Maxime, et al. "Investigating the flow dynamics and turbulence at a - tidal-stream energy site in a highly energetic estuary." Renewable Energy 195 + Thiébaut, Maxime, et al. "Investigating the flow dynamics and turbulence at a + tidal-stream energy site in a highly energetic estuary." Renewable Energy 195 (2022): 252-262. 
""" @@ -320,38 +334,41 @@ def doppler_noise_level(self, psd, pct_fN=0.8): if not isinstance(pct_fN, float) or not 0 <= pct_fN <= 1: raise ValueError("`pct_fN` must be a float within the range [0, 1].") if len(psd.shape) != 2: - raise Exception('PSD should be 2-dimensional (time, frequency)') + raise Exception("PSD should be 2-dimensional (time, frequency)") # Characteristic frequency set to 80% of Nyquist frequency - fN = self.fs/2 + fN = self.fs / 2 fc = pct_fN * fN # Get units right if psd.freq.units == "Hz": f_range = slice(fc, fN) else: - f_range = slice(2*np.pi*fc, 2*np.pi*fN) + f_range = slice(2 * np.pi * fc, 2 * np.pi * fN) # Noise floor N2 = psd.sel(freq=f_range) * psd.freq.sel(freq=f_range) - noise_level = np.sqrt(N2.mean(dim='freq')) + noise_level = np.sqrt(N2.mean(dim="freq")) + time_coord = psd.dims[0] # no reason this shouldn't be time or time_b5 return xr.DataArray( - noise_level.values.astype('float32'), - dims=['time'], - attrs={'units': 'm s-1', - 'long_name': 'Doppler Noise Level', - 'description': 'Doppler noise level calculated ' - 'from PSD white noise'}) + noise_level.values.astype("float32"), + coords={time_coord: psd.coords[time_coord]}, + attrs={ + "units": "m s-1", + "long_name": "Doppler Noise Level", + "description": "Doppler noise level calculated " "from PSD white noise", + }, + ) def _stress_func_warnings(self, ds, beam_angle, noise, tilt_thresh): """ Performs a series of checks and raises warnings for ADCP stress calculations. - This method checks several conditions relevant for ADCP stress calculations and raises - warnings if these conditions are not met. It checks if the beam angle is defined, - if the instrument's coordinate system is aligned with the principal flow directions, - if the tilt is above a threshold, if the noise level is specified, and if the data + This method checks several conditions relevant for ADCP stress calculations and raises + warnings if these conditions are not met. 
It checks if the beam angle is defined, + if the instrument's coordinate system is aligned with the principal flow directions, + if the tilt is above a threshold, if the noise level is specified, and if the data set is in the 'beam' coordinate system. Parameters @@ -374,41 +391,50 @@ def _stress_func_warnings(self, ds, beam_angle, noise, tilt_thresh): """ # Error 1. Beam Angle - b_angle = getattr(ds, 'beam_angle', beam_angle) + b_angle = getattr(ds, "beam_angle", beam_angle) if b_angle is None: raise Exception( - " Beam angle not found in dataset and no beam angle supplied.") + " Beam angle not found in dataset and no beam angle supplied." + ) # Warning 1. Memo - warnings.warn(" The beam-variance algorithms assume the instrument's " - "(XYZ) coordinate system is aligned with the principal " - "flow directions.") + warnings.warn( + " The beam-variance algorithms assume the instrument's " + "(XYZ) coordinate system is aligned with the principal " + "flow directions." + ) # Warning 2. Check tilt - tilt_mask = calc_tilt(ds['pitch'], ds['roll']) > tilt_thresh + tilt_mask = calc_tilt(ds["pitch"], ds["roll"]) > tilt_thresh if sum(tilt_mask): pct_above_thresh = round(sum(tilt_mask) / len(tilt_mask) * 100, 2) - warnings.warn(f" {pct_above_thresh} % of measurements have a tilt " - f"greater than {tilt_thresh} degrees.") + warnings.warn( + f" {pct_above_thresh} % of measurements have a tilt " + f"greater than {tilt_thresh} degrees." + ) # Warning 3. Noise level of instrument is important considering 50 % of variance # in ADCP data can be noise if noise is None: - warnings.warn(' No "noise" input supplied. Consider calculating "noise" ' - 'using `calc_doppler_noise`') + warnings.warn( + ' No "noise" input supplied. Consider calculating "noise" ' + "using `calc_doppler_noise`" + ) noise = 0 # Warning 4. Likely not in beam coordinates after running a typical analysis workflow - if 'beam' not in ds.coord_sys: - warnings.warn(" Raw dataset must be in the 'beam' coordinate system. 
" - "Rotating raw dataset...") - ds.velds.rotate2('beam') + if "beam" not in ds.coord_sys: + warnings.warn( + " Raw dataset must be in the 'beam' coordinate system. " + "Rotating raw dataset..." + ) + ds.velds.rotate2("beam") return b_angle, noise - + def _check_orientation(self, ds, orientation, beam5=False): """ - Determines the beam order for the beam-stress rotation algorithm based on + Determines the beam order for the beam-stress rotation algorithm based on the instrument orientation. Note: Stacey defines the beams for down-looking Workhorse ADCPs. @@ -424,11 +450,11 @@ def _check_orientation(self, ds, orientation, beam5=False): ds : xarray.Dataset Raw dataset in beam coordinates orientation : str - The orientation of the instrument, either 'up' or 'down'. - If None, the orientation will be retrieved from the dataset or the + The orientation of the instrument, either 'up' or 'down'. + If None, the orientation will be retrieved from the dataset or the instance's default orientation. beam5 : bool, default=False - A flag indicating whether a fifth beam is present. + A flag indicating whether a fifth beam is present. If True, the number 4 will be appended to the beam order. Returns @@ -438,36 +464,38 @@ def _check_orientation(self, ds, orientation, beam5=False): phi2 : float, optional The mean of the roll values in radians. Only returned if 'beam5' is True. phi3 : float, optional - The mean of the pitch values in radians, negated for Nortek instruments. + The mean of the pitch values in radians, negated for Nortek instruments. Only returned if 'beam5' is True. 
""" if orientation is None: - orientation = getattr(ds, 'orientation', self.orientation) + orientation = getattr(ds, "orientation", self.orientation) - if 'TRDI' in ds.inst_make: - phi2 = np.deg2rad(self.mean(ds['pitch'].values)) - phi3 = np.deg2rad(self.mean(ds['roll'].values)) - if 'down' in orientation.lower(): + if "TRDI" in ds.inst_make: + phi2 = np.deg2rad(self.mean(ds["pitch"].values)) + phi3 = np.deg2rad(self.mean(ds["roll"].values)) + if "down" in orientation.lower(): # this order is correct given the note above beams = [0, 1, 2, 3] # for down-facing RDIs - elif 'up' in orientation.lower(): + elif "up" in orientation.lower(): beams = [0, 1, 3, 2] # for up-facing RDIs else: raise Exception( - "Please provide instrument orientation ['up' or 'down']") + "Please provide instrument orientation ['up' or 'down']" + ) # For Nortek Signatures - elif ('Signature' in ds.inst_model) or ('AD2CP' in ds.inst_model): - phi2 = np.deg2rad(self.mean(ds['roll'].values)) - phi3 = -np.deg2rad(self.mean(ds['pitch'].values)) - if 'down' in orientation.lower(): + elif ("Signature" in ds.inst_model) or ("AD2CP" in ds.inst_model): + phi2 = np.deg2rad(self.mean(ds["roll"].values)) + phi3 = -np.deg2rad(self.mean(ds["pitch"].values)) + if "down" in orientation.lower(): beams = [2, 0, 3, 1] # for down-facing Norteks - elif 'up' in orientation.lower(): + elif "up" in orientation.lower(): beams = [0, 2, 3, 1] # for up-facing Norteks else: raise Exception( - "Please provide instrument orientation ['up' or 'down']") + "Please provide instrument orientation ['up' or 'down']" + ) if beam5: beams.append(4) @@ -477,7 +505,7 @@ def _check_orientation(self, ds, orientation, beam5=False): def _beam_variance(self, ds, time, noise, beam_order, n_beams): """ - Calculates the variance of the along-beam velocities and then subtracts + Calculates the variance of the along-beam velocities and then subtracts noise from the result. 
Parameters @@ -496,19 +524,20 @@ def _beam_variance(self, ds, time, noise, beam_order, n_beams): Returns ------- bp2_ : xarray.DataArray - Enxemble-averaged along-beam velocity variance, + Enxemble-averaged along-beam velocity variance, written "beam-velocity prime squared bar" in units of m^2/s^2 """ # Concatenate 5th beam velocity if need be if n_beams == 4: - beam_vel = ds['vel'].values + beam_vel = ds["vel"].values elif n_beams == 5: - beam_vel = np.concatenate((ds['vel'].values, - ds['vel_b5'].values[None, ...])) + beam_vel = np.concatenate( + (ds["vel"].values, ds["vel_b5"].values[None, ...]) + ) # Calculate along-beam velocity prime squared bar - bp2_ = np.empty((n_beams, len(ds.range), len(time)))*np.nan + bp2_ = np.empty((n_beams, len(ds.range), len(time))) * np.nan for i, beam in enumerate(beam_order): bp2_[i] = np.nanvar(self.reshape(beam_vel[beam]), axis=-1) @@ -521,7 +550,7 @@ def _beam_variance(self, ds, time, noise, beam_order, n_beams): def reynolds_stress_4beam(self, ds, noise=None, orientation=None, beam_angle=None): """ - Calculate the stresses from the covariance of along-beam + Calculate the stresses from the covariance of along-beam velocity measurements Parameters @@ -547,20 +576,21 @@ def reynolds_stress_4beam(self, ds, noise=None, orientation=None, beam_angle=Non Assumes ADCP instrument coordinate system is aligned with principal flow directions. - Stacey, Mark T., Stephen G. Monismith, and Jon R. Burau. "Measurements - of Reynolds stress profiles in unstratified tidal flow." Journal of + Stacey, Mark T., Stephen G. Monismith, and Jon R. Burau. "Measurements + of Reynolds stress profiles in unstratified tidal flow." Journal of Geophysical Research: Oceans 104.C5 (1999): 10933-10949. 
""" # Run through warnings b_angle, noise = self._stress_func_warnings( - ds, beam_angle, noise, tilt_thresh=5) + ds, beam_angle, noise, tilt_thresh=5 + ) # Fetch beam order beam_order = self._check_orientation(ds, orientation, beam5=False) # Calculate beam variance and subtract noise - time = self.mean(ds['time'].values) + time = self.mean(ds["time"].values) bp2_ = self._beam_variance(ds, time, noise, beam_order, n_beams=4) # Run stress calculations @@ -569,16 +599,20 @@ def reynolds_stress_4beam(self, ds, noise=None, orientation=None, beam_angle=Non vpwp_ = (bp2_[2] - bp2_[3]) / denm return xr.DataArray( - np.stack([upwp_*np.nan, upwp_, vpwp_]).astype('float32'), - coords={'tau': ["upvp_", "upwp_", "vpwp_"], - 'range': ds.range, - 'time': time}, - attrs={'units': 'm2 s-2', - 'long_name': 'Specific Reynolds Stress Vector'}) - - def stress_tensor_5beam(self, ds, noise=None, orientation=None, beam_angle=None, tke_only=False): + np.stack([upwp_ * np.nan, upwp_, vpwp_]).astype("float32"), + coords={ + "tau": ["upvp_", "upwp_", "vpwp_"], + "range": ds.range, + "time": time, + }, + attrs={"units": "m2 s-2", "long_name": "Specific Reynolds Stress Vector"}, + ) + + def stress_tensor_5beam( + self, ds, noise=None, orientation=None, beam_angle=None, tke_only=False + ): """ - Calculate the stresses from the covariance of along-beam + Calculate the stresses from the covariance of along-beam velocity measurements Parameters @@ -605,7 +639,7 @@ def stress_tensor_5beam(self, ds, noise=None, orientation=None, beam_angle=None, Assumes small-angle approximation is applicable. Assumes ADCP instrument coordinate system is aligned with principal flow - directions, i.e. u', v' and w' are aligned to the instrument's (XYZ) + directions, i.e. u', v' and w' are aligned to the instrument's (XYZ) frame of reference. 
The stress equations here utilize u'v'_ to account for small variations @@ -618,91 +652,122 @@ def stress_tensor_5beam(self, ds, noise=None, orientation=None, beam_angle=None, energy estimates from various ADCP beam configurations: Theory." J. of Phys. Ocean (2007): 1-35. - Guerra, Maricarmen, and Jim Thomson. "Turbulence measurements from - five-beam acoustic Doppler current profilers." Journal of Atmospheric + Guerra, Maricarmen, and Jim Thomson. "Turbulence measurements from + five-beam acoustic Doppler current profilers." Journal of Atmospheric and Oceanic Technology 34.6 (2017): 1267-1284. """ # Check that beam 5 velocity exists - if 'vel_b5' not in ds.data_vars: + if "vel_b5" not in ds.data_vars: raise Exception("Must have 5th beam data to use this function.") # Run through warnings b_angle, noise = self._stress_func_warnings( - ds, beam_angle, noise, tilt_thresh=10) + ds, beam_angle, noise, tilt_thresh=10 + ) # Fetch beam order - beam_order, phi2, phi3 = self._check_orientation( - ds, orientation, beam5=True) + beam_order, phi2, phi3 = self._check_orientation(ds, orientation, beam5=True) # Calculate beam variance and subtract noise - time = self.mean(ds['time'].values) + time = self.mean(ds["time"].values) bp2_ = self._beam_variance(ds, time, noise, beam_order, n_beams=5) # Run tke and stress calculations th = np.deg2rad(b_angle) sin = np.sin cos = np.cos - denm = -4 * sin(th)**6 * cos(th)**2 - - upup_ = (-2*sin(th)**4*cos(th)**2*(bp2_[1]+bp2_[0]-2*cos(th)**2*bp2_[4]) + - 2*sin(th)**5*cos(th)*phi3*(bp2_[1]-bp2_[0])) / denm - - vpvp_ = (-2*sin(th)**4*cos(th)**2*(bp2_[3]+bp2_[0]-2*cos(th)**2*bp2_[4]) - - 2*sin(th)**4*cos(th)**2*phi3*(bp2_[1]-bp2_[0]) + - 2*sin(th)**3*cos(th)**3*phi3*(bp2_[1]-bp2_[0]) - - 2*sin(th)**5*cos(th)*phi2*(bp2_[3]-bp2_[2])) / denm - - wpwp_ = (-2*sin(th)**5*cos(th) * - (bp2_[1]-bp2_[0] + 2*sin(th)**5*cos(th)*phi2*(bp2_[3]-bp2_[2]) - - 4*sin(th)**6*cos(th)**2*bp2_[4])) / denm + denm = -4 * sin(th) ** 6 * cos(th) ** 2 + + upup_ = ( + -2 
+ * sin(th) ** 4 + * cos(th) ** 2 + * (bp2_[1] + bp2_[0] - 2 * cos(th) ** 2 * bp2_[4]) + + 2 * sin(th) ** 5 * cos(th) * phi3 * (bp2_[1] - bp2_[0]) + ) / denm + + vpvp_ = ( + -2 + * sin(th) ** 4 + * cos(th) ** 2 + * (bp2_[3] + bp2_[0] - 2 * cos(th) ** 2 * bp2_[4]) + - 2 * sin(th) ** 4 * cos(th) ** 2 * phi3 * (bp2_[1] - bp2_[0]) + + 2 * sin(th) ** 3 * cos(th) ** 3 * phi3 * (bp2_[1] - bp2_[0]) + - 2 * sin(th) ** 5 * cos(th) * phi2 * (bp2_[3] - bp2_[2]) + ) / denm + + wpwp_ = ( + -2 + * sin(th) ** 5 + * cos(th) + * ( + bp2_[1] + - bp2_[0] + + 2 * sin(th) ** 5 * cos(th) * phi2 * (bp2_[3] - bp2_[2]) + - 4 * sin(th) ** 6 * cos(th) ** 2 * bp2_[4] + ) + ) / denm tke_vec = xr.DataArray( - np.stack([upup_, vpvp_, wpwp_]).astype('float32'), - coords={'tke': ["upup_", "vpvp_", "wpwp_"], - 'range': ds.range, - 'time': time}, - attrs={'units': 'm2 s-2', - 'long_name': 'TKE Vector', - 'standard_name': 'specific_turbulent_kinetic_energy_of_sea_water'}) + np.stack([upup_, vpvp_, wpwp_]).astype("float32"), + coords={ + "tke": ["upup_", "vpvp_", "wpwp_"], + "range": ds.range, + "time": time, + }, + attrs={ + "units": "m2 s-2", + "long_name": "TKE Vector", + "standard_name": "specific_turbulent_kinetic_energy_of_sea_water", + }, + ) if tke_only: return tke_vec else: # Guerra Thomson calculate u'v' bar from from the covariance of u' and v' - ds.velds.rotate2('inst') + ds.velds.rotate2("inst") vel = self.detrend(ds.vel.values) - upvp_ = np.nanmean(vel[0] * vel[1], axis=-1, - dtype=np.float64).astype(np.float32) - - upwp_ = (sin(th)**5*cos(th)*(bp2_[1]-bp2_[0]) + - 2*sin(th)**4*cos(th)*2*phi3*(bp2_[1]+bp2_[0]) - - 4*sin(th)**4*cos(th)*2*phi3*bp2_[4] - - 4*sin(th)**6*cos(th)*2*phi2*upvp_) / denm - - vpwp_ = (sin(th)**5*cos(th)*(bp2_[3]-bp2_[2]) - - 2*sin(th)**4*cos(th)*2*phi2*(bp2_[3]+bp2_[2]) + - 4*sin(th)**4*cos(th)*2*phi2*bp2_[4] + - 4*sin(th)**6*cos(th)*2*phi3*upvp_) / denm + upvp_ = np.nanmean(vel[0] * vel[1], axis=-1, dtype=np.float64).astype( + np.float32 + ) + + upwp_ = ( + sin(th) 
** 5 * cos(th) * (bp2_[1] - bp2_[0]) + + 2 * sin(th) ** 4 * cos(th) * 2 * phi3 * (bp2_[1] + bp2_[0]) + - 4 * sin(th) ** 4 * cos(th) * 2 * phi3 * bp2_[4] + - 4 * sin(th) ** 6 * cos(th) * 2 * phi2 * upvp_ + ) / denm + + vpwp_ = ( + sin(th) ** 5 * cos(th) * (bp2_[3] - bp2_[2]) + - 2 * sin(th) ** 4 * cos(th) * 2 * phi2 * (bp2_[3] + bp2_[2]) + + 4 * sin(th) ** 4 * cos(th) * 2 * phi2 * bp2_[4] + + 4 * sin(th) ** 6 * cos(th) * 2 * phi3 * upvp_ + ) / denm stress_vec = xr.DataArray( - np.stack([upvp_, upwp_, vpwp_]).astype('float32'), - coords={'tau': ["upvp_", "upwp_", "vpwp_"], - 'range': ds.range, - 'time': time}, - attrs={'units': 'm2 s-2', - 'long_name': 'Specific Reynolds Stress Vector'}) + np.stack([upvp_, upwp_, vpwp_]).astype("float32"), + coords={ + "tau": ["upvp_", "upwp_", "vpwp_"], + "range": ds.range, + "time": time, + }, + attrs={ + "units": "m2 s-2", + "long_name": "Specific Reynolds Stress Vector", + }, + ) return tke_vec, stress_vec - def total_turbulent_kinetic_energy(self, - ds, - noise=None, - orientation=None, - beam_angle=None): + def total_turbulent_kinetic_energy( + self, ds, noise=None, orientation=None, beam_angle=None + ): """ - Calculate magnitude of turbulent kinetic energy from 5-beam ADCP. + Calculate magnitude of turbulent kinetic energy from 5-beam ADCP. Parameters ---------- @@ -726,25 +791,26 @@ def total_turbulent_kinetic_energy(self, combines the TKE components. Warning: the integral length scale of turbulence captured by the - ADCP measurements (i.e. the size of turbulent structures) increases + ADCP measurements (i.e. the size of turbulent structures) increases with increasing range from the instrument. 
""" tke_vec = self.stress_tensor_5beam( - ds, noise, orientation, beam_angle, tke_only=True) + ds, noise, orientation, beam_angle, tke_only=True + ) - tke = tke_vec.sum('tke') / 2 - tke.attrs['units'] = 'm2 s-2' - tke.attrs['long_name'] = 'TKE Magnitude', - tke.attrs['standard_name'] = 'specific_turbulent_kinetic_energy_of_sea_water' + tke = tke_vec.sum("tke") / 2 + tke.attrs["units"] = "m2 s-2" + tke.attrs["long_name"] = ("TKE Magnitude",) + tke.attrs["standard_name"] = "specific_turbulent_kinetic_energy_of_sea_water" - return tke.astype('float32') + return tke.astype("float32") def check_turbulence_cascade_slope(self, psd, freq_range=[0.2, 0.4]): """ - This function calculates the slope of the PSD, the power spectra + This function calculates the slope of the PSD, the power spectra of velocity, within the given frequency range. The purpose of this - function is to check that the region of the PSD containing the + function is to check that the region of the PSD containing the isotropic turbulence cascade decreases at a rate of :math:`f^{-5/3}`. Parameters @@ -752,13 +818,13 @@ def check_turbulence_cascade_slope(self, psd, freq_range=[0.2, 0.4]): psd : xarray.DataArray ([[range,] time,] freq) The power spectral density (1D, 2D or 3D) freq_range : iterable(2) (default: [6.28, 12.57]) - The range over which the isotropic turbulence cascade occurs, in + The range over which the isotropic turbulence cascade occurs, in units of the psd frequency vector (Hz or rad/s) Returns ------- (m, b): tuple (slope, y-intercept) - A tuple containing the coefficients of the log-adjusted linear + A tuple containing the coefficients of the log-adjusted linear regression between PSD and frequency Notes @@ -767,9 +833,9 @@ def check_turbulence_cascade_slope(self, psd, freq_range=[0.2, 0.4]): .. 
math:: S(k) = \\alpha \\epsilon^{2/3} k^{-5/3} + N - The slope of the isotropic turbulence cascade, which should be - equal to :math:`k^{-5/3}` or :math:`f^{-5/3}`, where k and f are - the wavenumber and frequency vectors, is estimated using linear + The slope of the isotropic turbulence cascade, which should be + equal to :math:`k^{-5/3}` or :math:`f^{-5/3}`, where k and f are + the wavenumber and frequency vectors, is estimated using linear regression with a log transformation: .. math:: log10(y) = m*log10(x) + b @@ -778,35 +844,35 @@ def check_turbulence_cascade_slope(self, psd, freq_range=[0.2, 0.4]): .. math:: y = 10^{b} x^{m} - Where :math:`y` is S(k) or S(f), :math:`x` is k or f, :math:`m` - is the slope (ideally -5/3), and :math:`10^{b}` is the intercept of + Where :math:`y` is S(k) or S(f), :math:`x` is k or f, :math:`m` + is the slope (ideally -5/3), and :math:`10^{b}` is the intercept of y at x^m=1. """ if not isinstance(psd, xr.DataArray): raise TypeError("`psd` must be an instance of `xarray.DataArray`.") - if not hasattr(freq_range, '__iter__') or len(freq_range) != 2: + if not hasattr(freq_range, "__iter__") or len(freq_range) != 2: raise ValueError("`freq_range` must be an iterable of length 2.") - + idx = np.where((freq_range[0] < psd.freq) & (psd.freq < freq_range[1])) idx = idx[0] - x = np.log10(psd['freq'].isel(freq=idx)) + x = np.log10(psd["freq"].isel(freq=idx)) y = np.log10(psd.isel(freq=idx)) - y_bar = y.mean('freq') - x_bar = x.mean('freq') + y_bar = y.mean("freq") + x_bar = x.mean("freq") # using the formula to calculate the slope and intercept n = np.sum((x - x_bar) * (y - y_bar), axis=0) - d = np.sum((x - x_bar)**2, axis=0) + d = np.sum((x - x_bar) ** 2, axis=0) - m = n/d - b = y_bar - m*x_bar + m = n / d + b = y_bar - m * x_bar return m, b - def dissipation_rate_LT83(self, psd, U_mag, freq_range=[0.2, 0.4]): + def dissipation_rate_LT83(self, psd, U_mag, freq_range=[0.2, 0.4], noise=None): """ Calculate the TKE dissipation rate from the 
velocity spectra. @@ -817,8 +883,12 @@ def dissipation_rate_LT83(self, psd, U_mag, freq_range=[0.2, 0.4]): U_mag : xarray.DataArray (time) The bin-averaged horizontal velocity (a.k.a. speed) from a single depth bin (range) f_range : iterable(2) - The range over which to integrate/average the spectrum, in units + The range over which to integrate/average the spectrum, in units of the psd frequency vector (Hz or rad/s) + noise : float or array-like + Instrument noise level in same units as velocity. Typically + found from `adp.turbulence.doppler_noise_level`. + Default: None. Returns ------- @@ -850,33 +920,47 @@ def dissipation_rate_LT83(self, psd, U_mag, freq_range=[0.2, 0.4]): """ if len(psd.shape) != 2: - raise Exception('PSD should be 2-dimensional (time, frequency)') + raise Exception("PSD should be 2-dimensional (time, frequency)") if len(U_mag.shape) != 1: - raise Exception('U_mag should be 1-dimensional (time)') - if not hasattr(freq_range, '__iter__') or len(freq_range) != 2: + raise Exception("U_mag should be 1-dimensional (time)") + if not hasattr(freq_range, "__iter__") or len(freq_range) != 2: raise ValueError("`freq_range` must be an iterable of length 2.") - + if noise is not None: + if np.shape(noise)[0] != np.shape(psd)[0]: + raise Exception("Noise should have same first dimension as PSD") + else: + noise = np.array(0) + + # Noise subtraction from binner.TimeBinner._psd_base + psd = psd.copy() + if noise is not None: + psd -= noise**2 / (self.fs / 2) + psd = psd.where(psd > 0, np.min(np.abs(psd)) / 100) + freq = psd.freq idx = np.where((freq_range[0] < freq) & (freq < freq_range[1])) idx = idx[0] - if freq.units == 'Hz': - U = U_mag/(2*np.pi) + if freq.units == "Hz": + U = U_mag / (2 * np.pi) else: U = U_mag a = 0.5 - out = (psd[:, idx] * freq[idx]**(5/3) / - a).mean(axis=-1)**(3/2) / U.values + out = (psd[:, idx] * freq[idx] ** (5 / 3) / a).mean(axis=-1) ** ( + 3 / 2 + ) / U.values return xr.DataArray( - out.astype('float32'), - attrs={'units': 'm2 
s-3', - 'long_name': 'TKE Dissipation Rate', - 'standard_name': 'specific_turbulent_kinetic_energy_dissipation_in_sea_water', - 'description': 'TKE dissipation rate calculated using ' - 'the method from Lumley and Terray, 1983', - }) + out.astype("float32"), + attrs={ + "units": "m2 s-3", + "long_name": "TKE Dissipation Rate", + "standard_name": "specific_turbulent_kinetic_energy_dissipation_in_sea_water", + "description": "TKE dissipation rate calculated using " + "the method from Lumley and Terray, 1983", + }, + ) def dissipation_rate_SF(self, vel_raw, r_range=[1, 5]): """ @@ -904,18 +988,18 @@ def dissipation_rate_SF(self, vel_raw, r_range=[1, 5]): Notes ----- - Dissipation rate outputted by this function is only valid if the isotropic - turbulence cascade can be seen in the TKE spectra. + Dissipation rate outputted by this function is only valid if the isotropic + turbulence cascade can be seen in the TKE spectra. - Velocity data must be in beam coordinates and should be cleaned of surface + Velocity data must be in beam coordinates and should be cleaned of surface interference. This method calculates the 2nd order structure function: .. math:: D(z,r) = [(u'(z) - u`(z+r))^2] - where `u'` is the velocity fluctuation `z` is the depth bin, - `r` is the separation between depth bins, and [] denotes a time average + where `u'` is the velocity fluctuation `z` is the depth bin, + `r` is the separation between depth bins, and [] denotes a time average (size 'ADPBinner.n_bin'). 
The stucture function can then be used to estimate the dissipation rate: @@ -934,14 +1018,15 @@ def dissipation_rate_SF(self, vel_raw, r_range=[1, 5]): if not isinstance(vel_raw, xr.DataArray): raise TypeError("`vel_raw` must be an instance of `xarray.DataArray`.") - if not hasattr(r_range, '__iter__') or len(r_range) != 2: + if not hasattr(r_range, "__iter__") or len(r_range) != 2: raise ValueError("`r_range` must be an iterable of length 2.") if len(vel_raw.shape) != 2: raise Exception( - "Function input must be single beam and in 'beam' coordinate system") + "Function input must be single beam and in 'beam' coordinate system" + ) - if 'range_b5' in vel_raw.dims: + if "range_b5" in vel_raw.dims: rng = vel_raw.range_b5 time = self.mean(vel_raw.time_b5.values) else: @@ -951,28 +1036,27 @@ def dissipation_rate_SF(self, vel_raw, r_range=[1, 5]): # bm shape is [range, ensemble time, 'data within ensemble'] bm = self.demean(vel_raw.values) # take out the ensemble mean - e = np.empty(bm.shape[:2], dtype='float32')*np.nan - n = np.empty(bm.shape[:2], dtype='float32')*np.nan + e = np.empty(bm.shape[:2], dtype="float32") * np.nan + n = np.empty(bm.shape[:2], dtype="float32") * np.nan bin_size = round(np.diff(rng)[0], 3) - R = int(r_range[0]/bin_size) - r = np.arange(bin_size, r_range[1]+bin_size, bin_size) + R = int(r_range[0] / bin_size) + r = np.arange(bin_size, r_range[1] + bin_size, bin_size) # D(z,r,time) D = np.zeros((bm.shape[0], r.size, bm.shape[1])) for r_value in r: # the i in d is the index based on r and bin size # bin size index, > 1 - i = int(r_value/bin_size) + i = int(r_value / bin_size) for idx in range(bm.shape[1]): # for each ensemble # subtract the variance of adjacent depth cells - d = np.nanmean( - (bm[:-i, idx, :] - bm[i:, idx, :]) ** 2, axis=-1) + d = np.nanmean((bm[:-i, idx, :] - bm[i:, idx, :]) ** 2, axis=-1) # have to insert 0/nan in first bin to match length spaces = np.empty((i,)) spaces[:] = np.NaN - D[:, i-1, idx] = np.concatenate((spaces, 
d)) + D[:, i - 1, idx] = np.concatenate((spaces, d)) # find best fit line y = mx + b (aka D(z,r) = A*r^2/3 + N) to solve # epsilon for each depth and ensemble @@ -981,50 +1065,52 @@ def dissipation_rate_SF(self, vel_raw, r_range=[1, 5]): for i in range(D.shape[1], D.shape[0]): # average ensembles together if not all(np.isnan(D[i, R:, idx])): # if no nan's - e[i, idx], n[i, idx] = np.polyfit(r[R:] ** 2/3, - D[i, R:, idx], - deg=1) + e[i, idx], n[i, idx] = np.polyfit( + r[R:] ** 2 / 3, D[i, R:, idx], deg=1 + ) else: e[i, idx], n[i, idx] = np.nan, np.nan # A taken as 2.1, n = y-intercept - epsilon = (e/2.1)**(3/2) - noise = np.sqrt(n/2) + epsilon = (e / 2.1) ** (3 / 2) + noise = np.sqrt(n / 2) epsilon = xr.DataArray( - epsilon.astype('float32'), - coords={vel_raw.dims[0]: rng, - vel_raw.dims[1]: time}, + epsilon.astype("float32"), + coords={vel_raw.dims[0]: rng, vel_raw.dims[1]: time}, dims=vel_raw.dims, - attrs={'units': 'm2 s-3', - 'long_name': 'TKE Dissipation Rate', - 'standard_name': 'specific_turbulent_kinetic_energy_dissipation_in_sea_water', - 'description': 'TKE dissipation rate calculated from the ' - '"structure function" method from Wiles et al, 2006.' 
- }) + attrs={ + "units": "m2 s-3", + "long_name": "TKE Dissipation Rate", + "standard_name": "specific_turbulent_kinetic_energy_dissipation_in_sea_water", + "description": "TKE dissipation rate calculated from the " + '"structure function" method from Wiles et al, 2006.', + }, + ) noise = xr.DataArray( - noise.astype('float32'), - coords={vel_raw.dims[0]: rng, - vel_raw.dims[1]: time}, - attrs={'units': 'm s-1', - 'long_name': 'Structure Function Noise Offset', - }) + noise.astype("float32"), + coords={vel_raw.dims[0]: rng, vel_raw.dims[1]: time}, + attrs={ + "units": "m s-1", + "long_name": "Structure Function Noise Offset", + }, + ) SF = xr.DataArray( - D.astype('float32'), - coords={vel_raw.dims[0]: rng, - 'range_SF': r, - vel_raw.dims[1]: time}, - attrs={'units': 'm2 s-2', - 'long_name': 'Structure Function D(z,r)', - 'description': '"Structure function" from Wiles et al, 2006.' - }) + D.astype("float32"), + coords={vel_raw.dims[0]: rng, "range_SF": r, vel_raw.dims[1]: time}, + attrs={ + "units": "m2 s-2", + "long_name": "Structure Function D(z,r)", + "description": '"Structure function" from Wiles et al, 2006.', + }, + ) return epsilon, noise, SF def friction_velocity(self, ds_avg, upwp_, z_inds=slice(1, 5), H=None): """ - Approximate friction velocity from shear stress using a + Approximate friction velocity from shear stress using a logarithmic profile. 
Parameters @@ -1051,18 +1137,20 @@ def friction_velocity(self, ds_avg, upwp_, z_inds=slice(1, 5), H=None): raise TypeError("`upwp_` must be an instance of `xarray.DataArray`.") if not isinstance(z_inds, slice): raise TypeError("`z_inds` must be an instance of `slice(int,int)`.") - + if not H: H = ds_avg.depth.values - z = ds_avg['range'].values + z = ds_avg["range"].values upwp_ = upwp_.values sign = np.nanmean(np.sign(upwp_[z_inds, :]), axis=0) - u_star = np.nanmean(sign * upwp_[z_inds, :] / - (1 - z[z_inds, None] / H), axis=0) ** 0.5 + u_star = ( + np.nanmean(sign * upwp_[z_inds, :] / (1 - z[z_inds, None] / H), axis=0) + ** 0.5 + ) return xr.DataArray( - u_star.astype('float32'), - coords={'time': ds_avg.time}, - attrs={'units': 'm s-1', - 'long_name': 'Friction Velocity'}) + u_star.astype("float32"), + coords={"time": ds_avg.time}, + attrs={"units": "m s-1", "long_name": "Friction Velocity"}, + ) diff --git a/mhkit/dolfyn/adv/__init__.py b/mhkit/dolfyn/adv/__init__.py index 9468875d3..4dc7607ef 100644 --- a/mhkit/dolfyn/adv/__init__.py +++ b/mhkit/dolfyn/adv/__init__.py @@ -1 +1 @@ -from . import api \ No newline at end of file +from . 
import api diff --git a/mhkit/dolfyn/adv/clean.py b/mhkit/dolfyn/adv/clean.py index e33c95043..7bf95d46a 100644 --- a/mhkit/dolfyn/adv/clean.py +++ b/mhkit/dolfyn/adv/clean.py @@ -1,16 +1,18 @@ """Module containing functions to clean data """ + import numpy as np import warnings from ..velocity import VelBinner from ..tools.misc import group, slice1d_along_axis -warnings.filterwarnings('ignore', category=np.RankWarning) + +warnings.filterwarnings("ignore", category=np.RankWarning) sin = np.sin cos = np.cos -def clean_fill(u, mask, npt=12, method='cubic', maxgap=6): +def clean_fill(u, mask, npt=12, method="cubic", maxgap=6): """ Interpolate over mask values in timeseries data using the specified method @@ -22,7 +24,7 @@ def clean_fill(u, mask, npt=12, method='cubic', maxgap=6): Logical tensor of elements to "nan" out (from `spikeThresh`, `rangeLimit`, or `GN2002`) and replace npt : int - The number of points on either side of the bad values that + The number of points on either side of the bad values that interpolation occurs over method : string Interpolation method to use (linear, cubic, pchip, etc). 
Default is 'cubic' @@ -43,7 +45,7 @@ def clean_fill(u, mask, npt=12, method='cubic', maxgap=6): u.values[..., mask] = np.nan # Remove bad data for 2D+ and 1D timeseries variables - if 'dir' in u.dims: + if "dir" in u.dims: for i in range(u.shape[0]): u[i] = _interp_nan(u[i], npt, method, maxgap) else: @@ -101,13 +103,12 @@ def _interp_nan(da, npt, method, maxgap): ntail += 1 pos += 1 - if (ntail == npt or pos == len(da)): + if ntail == npt or pos == len(da): # This is the block we are interpolating over i_int = i[start:pos] - da[i_int] = da[i_int].interpolate_na(dim=da.dims[-1], - method=method, - use_coordinate=True, - limit=maxgap) + da[i_int] = da[i_int].interpolate_na( + dim=da.dims[-1], method=method, use_coordinate=True, limit=maxgap + ) # Reset searching = True ntail = 0 @@ -141,7 +142,7 @@ def fill_nan_ensemble_mean(u, mask, fs, window): """ u = u.where(~mask) - bnr = VelBinner(n_bin=window*fs, fs=fs) + bnr = VelBinner(n_bin=window * fs, fs=fs) if len(u.shape) == 1: var = u.values[None, :] @@ -158,12 +159,11 @@ def fill_nan_ensemble_mean(u, mask, fs, window): # diff = number of extra points extra_nans = vel_reshaped.shape[-1] - diff if diff: - vel = np.empty((var.shape[0], var.shape[-1]+extra_nans)) + vel = np.empty((var.shape[0], var.shape[-1] + extra_nans)) extra = var[:, -diff:] - empty = np.empty((vel.shape[0], extra_nans))*np.nan + empty = np.empty((vel.shape[0], extra_nans)) * np.nan extra = np.concatenate((extra, empty), axis=-1) - vel_reshaped = np.concatenate( - (vel_reshaped, extra[:, None, :]), axis=1) + vel_reshaped = np.concatenate((vel_reshaped, extra[:, None, :]), axis=1) extra_mean = np.nanmean(extra, axis=-1) vel_mean = np.concatenate((vel_mean, extra_mean[:, None]), axis=-1) @@ -172,11 +172,12 @@ def fill_nan_ensemble_mean(u, mask, fs, window): vel_mean_matrix = np.tile(vel_mean[..., None], (1, 1, bnr.n_bin)) vel_missing = np.isnan(vel_reshaped) vel_mask = np.ma.masked_array(vel_mean_matrix, ~vel_missing).filled(np.nan) - vel_filled = 
np.where(np.isnan(vel_reshaped), vel_mask, - vel_reshaped + np.nan_to_num(vel_mask)) + vel_filled = np.where( + np.isnan(vel_reshaped), vel_mask, vel_reshaped + np.nan_to_num(vel_mask) + ) # "Unshape" the data for i in range(var.shape[0]): - vel[i] = np.ravel(vel_filled[i], 'C') + vel[i] = np.ravel(vel_filled[i], "C") if diff: # Trim off the extra means u.values = np.squeeze(vel[:, :-extra_nans]) @@ -212,7 +213,7 @@ def spike_thresh(u, thresh=10): def range_limit(u, range=[-5, 5]): """ - Returns a logical vector that is True where the values of `u` are + Returns a logical vector that is True where the values of `u` are outside of `range`. Parameters @@ -232,12 +233,13 @@ def range_limit(u, range=[-5, 5]): def _calcab(al, Lu_std_u, Lu_std_d2u): - """Solve equations 10 and 11 of Goring+Nikora2002 - """ - return tuple(np.linalg.solve( - np.array([[cos(al) ** 2, sin(al) ** 2], - [sin(al) ** 2, cos(al) ** 2]]), - np.array([(Lu_std_u) ** 2, (Lu_std_d2u) ** 2]))) + """Solve equations 10 and 11 of Goring+Nikora2002""" + return tuple( + np.linalg.solve( + np.array([[cos(al) ** 2, sin(al) ** 2], [sin(al) ** 2, cos(al) ** 2]]), + np.array([(Lu_std_u) ** 2, (Lu_std_d2u) ** 2]), + ) + ) def _phaseSpaceThresh(u): @@ -252,27 +254,28 @@ def _phaseSpaceThresh(u): du[1:-1] = (u[2:] - u[:-2]) / 2 # And again. 
d2u[2:-2] = (du[1:-1][2:] - du[1:-1][:-2]) / 2 - p = (u ** 2 + du ** 2 + d2u ** 2) + p = u**2 + du**2 + d2u**2 std_u = np.std(u, axis=0) std_du = np.std(du, axis=0) std_d2u = np.std(d2u, axis=0) - alpha = np.arctan2(np.sum(u * d2u, axis=0), np.sum(u ** 2, axis=0)) + alpha = np.arctan2(np.sum(u * d2u, axis=0), np.sum(u**2, axis=0)) a = np.empty_like(alpha) b = np.empty_like(alpha) with warnings.catch_warnings() as w: warnings.filterwarnings( - 'ignore', category=RuntimeWarning, message='invalid value encountered in ') + "ignore", category=RuntimeWarning, message="invalid value encountered in " + ) for idx, al in enumerate(alpha): a[idx], b[idx] = _calcab(al, Lu * std_u[idx], Lu * std_d2u[idx]) theta = np.arctan2(du, u) - phi = np.arctan2((du ** 2 + u ** 2) ** 0.5, d2u) - pe = (((sin(phi) * cos(theta) * cos(alpha) + - cos(phi) * sin(alpha)) ** 2) / a + - ((sin(phi) * cos(theta) * sin(alpha) - - cos(phi) * cos(alpha)) ** 2) / b + - ((sin(phi) * sin(theta)) ** 2) / (Lu * std_du) ** 2) ** -1 + phi = np.arctan2((du**2 + u**2) ** 0.5, d2u) + pe = ( + ((sin(phi) * cos(theta) * cos(alpha) + cos(phi) * sin(alpha)) ** 2) / a + + ((sin(phi) * cos(theta) * sin(alpha) - cos(phi) * cos(alpha)) ** 2) / b + + ((sin(phi) * sin(theta)) ** 2) / (Lu * std_du) ** 2 + ) ** -1 pe[:, np.isnan(pe[0, :])] = 0 - return (p > pe).flatten('F') + return (p > pe).flatten("F") def GN2002(u, npt=5000): @@ -297,16 +300,16 @@ def GN2002(u, npt=5000): return GN2002(u.values, npt=npt) if u.ndim > 1: - mask = np.zeros(u.shape, dtype='bool') + mask = np.zeros(u.shape, dtype="bool") for slc in slice1d_along_axis(u.shape, -1): mask[slc] = GN2002(u[slc], npt=npt) return mask - mask = np.zeros(len(u), dtype='bool') + mask = np.zeros(len(u), dtype="bool") # Find large bad segments (>npt/10): # group returns a vector of slice objects. 
- bad_segs = group(np.isnan(u), min_length=int(npt//10)) + bad_segs = group(np.isnan(u), min_length=int(npt // 10)) if bad_segs.size > 2: # Break them up into separate regions: sp = 0 @@ -323,7 +326,7 @@ def GN2002(u, npt=5000): for ind in range(len(bad_segs)): bs = bad_segs[ind] # bs is a slice object. # Clean the good region: - mask[sp:bs.start] = GN2002(u[sp:bs.start], npt=npt) + mask[sp : bs.start] = GN2002(u[sp : bs.start], npt=npt) sp = bs.stop # Clean the last good region. mask[sp:ep] = GN2002(u[sp:ep], npt=npt) @@ -335,12 +338,13 @@ def GN2002(u, npt=5000): mask_last = np.zeros_like(mask) + np.inf mask[0] = True # make sure we start. while mask.any(): - mask[:nbins * npt] = _phaseSpaceThresh( - np.array(np.reshape(u[:(nbins * npt)], (npt, nbins), order='F'))) + mask[: nbins * npt] = _phaseSpaceThresh( + np.array(np.reshape(u[: (nbins * npt)], (npt, nbins), order="F")) + ) mask[-npt:] = _phaseSpaceThresh(u[-npt:]) c += 1 if c >= 100: - raise Exception('GN2002 loop-limit exceeded.') + raise Exception("GN2002 loop-limit exceeded.") if mask.sum() >= mask_last.sum(): break mask_last = mask.copy() diff --git a/mhkit/dolfyn/adv/motion.py b/mhkit/dolfyn/adv/motion.py index 43ac8c3d4..7db6f2797 100644 --- a/mhkit/dolfyn/adv/motion.py +++ b/mhkit/dolfyn/adv/motion.py @@ -11,21 +11,24 @@ class MissingDataError(ValueError): pass + class DataAlreadyProcessedError(Exception): pass + class MissingRequiredDataError(Exception): pass + def _get_body2imu(make_model): - if make_model == 'nortek vector': + if make_model == "nortek vector": # In inches it is: (0.25, 0.25, 5.9) return np.array([0.00635, 0.00635, 0.14986]) else: raise Exception("The imu->body vector is unknown for this instrument.") -class CalcMotion(): +class CalcMotion: """ A 'calculator' for computing the velocity of points that are rigidly connected to an ADV-body with an IMU. 
@@ -44,22 +47,17 @@ class CalcMotion(): _default_accel_filtfreq = 0.03 - def __init__(self, ds, - accel_filtfreq=None, - vel_filtfreq=None, - to_earth=True): - + def __init__(self, ds, accel_filtfreq=None, vel_filtfreq=None, to_earth=True): self.ds = ds - self._check_filtfreqs(accel_filtfreq, - vel_filtfreq) + self._check_filtfreqs(accel_filtfreq, vel_filtfreq) self.to_earth = to_earth self._set_accel() self._set_acclow() - self.angrt = ds['angrt'].values # No copy because not modified. + self.angrt = ds["angrt"].values # No copy because not modified. def _check_filtfreqs(self, accel_filtfreq, vel_filtfreq): - datval = self.ds.attrs.get('motion accel_filtfreq Hz', None) + datval = self.ds.attrs.get("motion accel_filtfreq Hz", None) if datval is None: if accel_filtfreq is None: accel_filtfreq = self._default_accel_filtfreq @@ -72,48 +70,58 @@ def _check_filtfreqs(self, accel_filtfreq, vel_filtfreq): warnings.warn( f"The default accel_filtfreq is {datval} Hz. " "Overriding this with the user-specified " - "value: {accel_filtfreq} Hz.") + "value: {accel_filtfreq} Hz." + ) if vel_filtfreq is None: - vel_filtfreq = self.ds.attrs.get('motion vel_filtfreq Hz', None) + vel_filtfreq = self.ds.attrs.get("motion vel_filtfreq Hz", None) if vel_filtfreq is None: vel_filtfreq = accel_filtfreq / 3.0 self.accel_filtfreq = accel_filtfreq self.accelvel_filtfreq = vel_filtfreq - def _set_accel(self, ): + def _set_accel( + self, + ): ds = self.ds - if ds.coord_sys == 'inst': - self.accel = np.einsum('ij...,i...->j...', - ds['orientmat'].values, - ds['accel'].values) - elif self.ds.coord_sys == 'earth': - self.accel = ds['accel'].values.copy() + if ds.coord_sys == "inst": + self.accel = np.einsum( + "ij...,i...->j...", ds["orientmat"].values, ds["accel"].values + ) + elif self.ds.coord_sys == "earth": + self.accel = ds["accel"].values.copy() else: - raise Exception(("Invalid coordinate system '%s'. 
The coordinate " - "system must either be 'earth' or 'inst' to " - "perform motion correction.") - % (self.ds.coord_sys)) - - def _check_duty_cycle(self, ): + raise Exception( + ( + "Invalid coordinate system '%s'. The coordinate " + "system must either be 'earth' or 'inst' to " + "perform motion correction." + ) + % (self.ds.coord_sys) + ) + + def _check_duty_cycle( + self, + ): """ Function to check if duty cycle exists and if it is followed consistently in the datafile """ - n_burst = self.ds.attrs.get('duty_cycle_n_burst') + n_burst = self.ds.attrs.get("duty_cycle_n_burst") if not n_burst: return # duty cycle interval in seconds - interval = self.ds.attrs.get('duty_cycle_interval') + interval = self.ds.attrs.get("duty_cycle_interval") actual_interval = ( - self.ds.time[n_burst:].values - self.ds.time[:-n_burst].values)/1e9 + self.ds.time[n_burst:].values - self.ds.time[:-n_burst].values + ) / 1e9 rng = actual_interval.max() - actual_interval.min() mean = actual_interval.mean() # Range will vary depending on how datetime64 rounds the timestamp # But isn't an issue if it does - if rng > 2 or (mean > interval+1 and mean < interval-1): + if rng > 2 or (mean > interval + 1 and mean < interval - 1): raise Exception("Bad duty cycle detected") # If this passes, it means we're safe to blindly skip n_burst for every integral @@ -121,17 +129,21 @@ def _check_duty_cycle(self, ): def reshape(self, dat, n_bin): # Assumes shape is (3, time) - length = dat.shape[-1]//n_bin - return np.reshape(dat[..., :length*n_bin], (dat.shape[0], length, n_bin)) + length = dat.shape[-1] // n_bin + return np.reshape(dat[..., : length * n_bin], (dat.shape[0], length, n_bin)) - def _set_acclow(self, ): + def _set_acclow( + self, + ): # Check if file is duty cycled n = self._check_duty_cycle() if n: - warnings.warn(" Duty Cycle detected. " - "Motion corrected data may contain edge effects " - "at the beginning and end of each duty cycle.") + warnings.warn( + " Duty Cycle detected. 
" + "Motion corrected data may contain edge effects " + "at the beginning and end of each duty cycle." + ) self.accel = self.reshape(self.accel, n_bin=n) self.acclow = acc = self.accel.copy() @@ -146,10 +158,13 @@ def _set_acclow(self, ): if np.isnan(acc).any(): warnings.warn( "Error filtering acceleration data. " - "Please decrease `accel_filtfreq`.") + "Please decrease `accel_filtfreq`." + ) acc = np.nan_to_num(acc) - def calc_velacc(self, ): + def calc_velacc( + self, + ): """ Calculates the translational velocity from the high-pass filtered acceleration signal. @@ -170,8 +185,13 @@ def calc_velacc(self, ): hp = self.accel - self.acclow # Integrate in time to get velocities - dat = np.concatenate((np.zeros(list(hp.shape[:-1]) + [1]), - cumtrapz(hp, dx=1 / samp_freq, axis=-1)), axis=-1) + dat = np.concatenate( + ( + np.zeros(list(hp.shape[:-1]) + [1]), + cumtrapz(hp, dx=1 / samp_freq, axis=-1), + ), + axis=-1, + ) if self.accelvel_filtfreq > 0: filt_freq = self.accelvel_filtfreq @@ -179,14 +199,15 @@ def calc_velacc(self, ): # Applied twice by 'filtfilt' = 4th order butterworth filt = ss.butter(2, float(filt_freq) / (samp_freq / 2)) for idx in range(hp.shape[0]): - dat[idx] = dat[idx] - \ - ss.filtfilt(filt[0], filt[1], dat[idx], axis=-1) + dat[idx] = dat[idx] - ss.filtfilt(filt[0], filt[1], dat[idx], axis=-1) # Fill nan with zeros - happens for some filter frequencies if np.isnan(dat).any(): - warnings.warn("Error filtering acceleration data. " - "Please decrease `vel_filtfreq`. " - "(default is 1/3 `accel_filtfreq`)") + warnings.warn( + "Error filtering acceleration data. " + "Please decrease `vel_filtfreq`. 
" + "(default is 1/3 `accel_filtfreq`)" + ) dat = np.nan_to_num(dat) if n: @@ -195,9 +216,9 @@ def calc_velacc(self, ): acclow_shaped = np.empty(self.angrt.shape) accel_shaped = np.empty(self.angrt.shape) for idx in range(hp.shape[0]): - velacc_shaped[idx] = np.ravel(dat[idx], 'C') - acclow_shaped[idx] = np.ravel(self.acclow[idx], 'C') - accel_shaped[idx] = np.ravel(self.accel[idx], 'C') + velacc_shaped[idx] = np.ravel(dat[idx], "C") + acclow_shaped[idx] = np.ravel(self.acclow[idx], "C") + accel_shaped[idx] = np.ravel(self.accel[idx], "C") # return acclow and velacc self.acclow = acclow_shaped @@ -209,7 +230,7 @@ def calc_velacc(self, ): def calc_velrot(self, vec, to_earth=None): """ - Calculate the induced velocity due to rotations of the + Calculate the induced velocity due to rotations of the instrument about the IMU center. Parameters @@ -245,17 +266,16 @@ def calc_velrot(self, vec, to_earth=None): # cross-product of omega (rotation vector) and the vector. # u=dz*omegaY-dy*omegaZ,v=dx*omegaZ-dz*omegaX,w=dy*omegaX-dx*omegaY # where vec=[dx,dy,dz], and angrt=[omegaX,omegaY,omegaZ] - velrot = np.array([(vec[2][:, None] * self.angrt[1] - - vec[1][:, None] * self.angrt[2]), - (vec[0][:, None] * self.angrt[2] - - vec[2][:, None] * self.angrt[0]), - (vec[1][:, None] * self.angrt[0] - - vec[0][:, None] * self.angrt[1]), - ]) + velrot = np.array( + [ + (vec[2][:, None] * self.angrt[1] - vec[1][:, None] * self.angrt[2]), + (vec[0][:, None] * self.angrt[2] - vec[2][:, None] * self.angrt[0]), + (vec[1][:, None] * self.angrt[0] - vec[0][:, None] * self.angrt[1]), + ] + ) if to_earth: - velrot = np.einsum('ji...,j...->i...', - self.ds['orientmat'].values, velrot) + velrot = np.einsum("ji...,j...->i...", self.ds["orientmat"].values, velrot) if dimflag: return velrot[:, 0, :] @@ -271,16 +291,16 @@ def _calc_probe_pos(ds, separate_probes=False): ----------- ds : xarray.Dataset ADV dataset - separate_probes : bool - If a Nortek Vector ADV, this function returns the - 
transformation matrix of positions of the probe's + separate_probes : bool + If a Nortek Vector ADV, this function returns the + transformation matrix of positions of the probe's acoustic recievers to the ADV's instrument frame of reference. Optional, default = False Returns ------- vec : 3x3 numpy.ndarray - Transformation matrix to convert from ADV probe to + Transformation matrix to convert from ADV probe to instrument frame of reference """ @@ -294,26 +314,28 @@ def _calc_probe_pos(ds, separate_probes=False): # In the coordinate system of the center of the probe (origin at # the acoustic transmitter) then, the positions of the centers of # the receivers is: - if separate_probes and _make_model(ds) == 'nortek vector': + if separate_probes and _make_model(ds) == "nortek vector": r = 0.076 # The angle between the x-y plane and the probes phi = np.deg2rad(-30) # The angles of the probes from the x-axis: - theta = np.deg2rad(np.array([0., 120., 240.])) - return (np.dot(ds['inst2head_rotmat'].values.T, - np.array([r * np.cos(theta), - r * np.sin(theta), - r * np.tan(phi) * np.ones(3)])) + - vec[:, None]) + theta = np.deg2rad(np.array([0.0, 120.0, 240.0])) + return ( + np.dot( + ds["inst2head_rotmat"].values.T, + np.array( + [r * np.cos(theta), r * np.sin(theta), r * np.tan(phi) * np.ones(3)] + ), + ) + + vec[:, None] + ) else: return vec -def correct_motion(ds, - accel_filtfreq=None, - vel_filtfreq=None, - to_earth=True, - separate_probes=False): +def correct_motion( + ds, accel_filtfreq=None, vel_filtfreq=None, to_earth=True, separate_probes=False +): """ This function performs motion correction on an IMU-ADV data object. The IMU and ADV data should be tightly synchronized and @@ -332,7 +354,7 @@ def correct_motion(ds, a second frequency to high-pass filter the integrated acceleration. 
Optional, default = 1/3 of `accel_filtfreq` - to_earth : bool + to_earth : bool All variables in the ds.props['rotate_vars'] list will be rotated into either the earth frame (to_earth=True) or the instrument frame (to_earth=False). Optional, default = True @@ -357,7 +379,7 @@ def correct_motion(ds, ``velacc`` is the translational component of the head motion (from accel, the high-pass filtered accel sigal) - ``acclow`` is the low-pass filtered accel sigal (i.e., + ``acclow`` is the low-pass filtered accel sigal (i.e., The primary velocity vector attribute, ``vel``, is motion corrected such that: @@ -408,44 +430,44 @@ def correct_motion(ds, ds = ds.copy(deep=True) # Check that no nan's exist - if ds['accel'].isnull().sum(): + if ds["accel"].isnull().sum(): raise MissingDataError("There should be no missing data in `accel` variable") - if ds['angrt'].isnull().sum(): + if ds["angrt"].isnull().sum(): raise MissingDataError("There should be no missing data in `angrt` variable") - if hasattr(ds, 'velrot') or ds.attrs.get('motion corrected', False): - raise DataAlreadyProcessedError('The data appears to already have been ' - 'motion corrected.') + if hasattr(ds, "velrot") or ds.attrs.get("motion corrected", False): + raise DataAlreadyProcessedError( + "The data appears to already have been " "motion corrected." + ) - if not hasattr(ds, 'has_imu') or ('accel' not in ds): - raise MissingRequiredDataError('The instrument does not appear to have an IMU.') + if not hasattr(ds, "has_imu") or ("accel" not in ds): + raise MissingRequiredDataError("The instrument does not appear to have an IMU.") - if ds.coord_sys != 'inst': - rotate2(ds, 'inst', inplace=True) + if ds.coord_sys != "inst": + rotate2(ds, "inst", inplace=True) # Returns True/False if head2inst_rotmat has been set/not-set. 
# Bad configs raises errors (this is to check for those) rot._check_inst2head_rotmat(ds) # Create the motion 'calculator': - calcobj = CalcMotion(ds, - accel_filtfreq=accel_filtfreq, - vel_filtfreq=vel_filtfreq, - to_earth=to_earth) + calcobj = CalcMotion( + ds, accel_filtfreq=accel_filtfreq, vel_filtfreq=vel_filtfreq, to_earth=to_earth + ) ########## # Calculate the translational velocity (from the accel): - ds['velacc'] = xr.DataArray(calcobj.calc_velacc(), - dims=['dirIMU', 'time'], - attrs={'units': 'm s-1', - 'long_name': 'Velocity from IMU Accelerometer'} - ).astype('float32') + ds["velacc"] = xr.DataArray( + calcobj.calc_velacc(), + dims=["dirIMU", "time"], + attrs={"units": "m s-1", "long_name": "Velocity from IMU Accelerometer"}, + ).astype("float32") # Copy acclow to the adv-object. - ds['acclow'] = xr.DataArray(calcobj.acclow, - dims=['dirIMU', 'time'], - attrs={'units': 'm s-2', - 'long_name': 'Low-Frequency Acceleration from IMU'} - ).astype('float32') + ds["acclow"] = xr.DataArray( + calcobj.acclow, + dims=["dirIMU", "time"], + attrs={"units": "m s-2", "long_name": "Low-Frequency Acceleration from IMU"}, + ).astype("float32") ########## # Calculate rotational velocity (from angrt): @@ -454,60 +476,65 @@ def correct_motion(ds, velrot = calcobj.calc_velrot(pos, to_earth=False) if separate_probes: # The head->beam transformation matrix - transMat = ds.get('beam2inst_orientmat', None) + transMat = ds.get("beam2inst_orientmat", None) # The inst->head transformation matrix - rmat = ds['inst2head_rotmat'] + rmat = ds["inst2head_rotmat"] # 1) Rotate body-coordinate velocities to head-coord. 
velrot = np.dot(rmat, velrot) # 2) Rotate body-coord to beam-coord (einsum), # 3) Take along beam-component (diagonal), # 4) Rotate back to head-coord (einsum), - velrot = np.einsum('ij,kj->ik', - transMat, - np.diagonal(np.einsum('ij,j...->i...', - np.linalg.inv(transMat), - velrot))) + velrot = np.einsum( + "ij,kj->ik", + transMat, + np.diagonal(np.einsum("ij,j...->i...", np.linalg.inv(transMat), velrot)), + ) # 5) Rotate back to body-coord. velrot = np.dot(rmat.T, velrot) - ds['velrot'] = xr.DataArray(velrot, - dims=['dirIMU', 'time'], - attrs={'units': 'm s-1', - 'long_name': 'Velocity from IMU Gyroscope'} - ).astype('float32') + ds["velrot"] = xr.DataArray( + velrot, + dims=["dirIMU", "time"], + attrs={"units": "m s-1", "long_name": "Velocity from IMU Gyroscope"}, + ).astype("float32") ########## # Rotate the data into the correct coordinate system. # inst2earth expects a 'rotate_vars' property. # Add velrot, velacc, acclow, to it. - if 'rotate_vars' not in ds.attrs: - ds.attrs['rotate_vars'] = ['vel', 'velrot', 'velacc', 'accel', - 'acclow', 'angrt', 'mag'] + if "rotate_vars" not in ds.attrs: + ds.attrs["rotate_vars"] = [ + "vel", + "velrot", + "velacc", + "accel", + "acclow", + "angrt", + "mag", + ] else: - ds.attrs['rotate_vars'].extend(['velrot', 'velacc', 'acclow']) + ds.attrs["rotate_vars"].extend(["velrot", "velacc", "acclow"]) # NOTE: accel, acclow, and velacc are in the earth-frame after # calc_velacc() call. inst2earth = rot._inst2earth if to_earth: # accel was converted to earth coordinates - ds['accel'].values = calcobj.accel - to_remove = ['accel', 'acclow', 'velacc'] - ds = inst2earth(ds, rotate_vars=[e for e in - ds.attrs['rotate_vars'] - if e not in to_remove]) + ds["accel"].values = calcobj.accel + to_remove = ["accel", "acclow", "velacc"] + ds = inst2earth( + ds, rotate_vars=[e for e in ds.attrs["rotate_vars"] if e not in to_remove] + ) else: # rotate these variables back to the instrument frame. 
- ds = inst2earth(ds, reverse=True, - rotate_vars=['acclow', 'velacc'], - force=True) + ds = inst2earth(ds, reverse=True, rotate_vars=["acclow", "velacc"], force=True) ########## # Copy vel -> velraw prior to motion correction: - ds['vel_raw'] = ds.vel.copy(deep=True) + ds["vel_raw"] = ds.vel.copy(deep=True) # Add it to rotate_vars: - ds.attrs['rotate_vars'].append('vel_raw') + ds.attrs["rotate_vars"].append("vel_raw") ########## # Remove motion from measured velocity @@ -517,10 +544,10 @@ def correct_motion(ds, # measures a velocity in the opposite direction. # use xarray to keep dimensions consistent - velmot = ds['velrot'] + ds['velacc'] - ds['vel'].values += velmot.values + velmot = ds["velrot"] + ds["velacc"] + ds["vel"].values += velmot.values - ds.attrs['motion corrected'] = 1 - ds.attrs['motion accel_filtfreq Hz'] = calcobj.accel_filtfreq + ds.attrs["motion corrected"] = 1 + ds.attrs["motion accel_filtfreq Hz"] = calcobj.accel_filtfreq return ds diff --git a/mhkit/dolfyn/adv/turbulence.py b/mhkit/dolfyn/adv/turbulence.py index 022012928..83ae80a7a 100644 --- a/mhkit/dolfyn/adv/turbulence.py +++ b/mhkit/dolfyn/adv/turbulence.py @@ -8,7 +8,7 @@ class ADVBinner(VelBinner): """ - A class that builds upon `VelBinner` for calculating turbulence + A class that builds upon `VelBinner` for calculating turbulence statistics and velocity spectra from ADV data Parameters @@ -24,35 +24,36 @@ class ADVBinner(VelBinner): n_fft_coh : int Number of data points to use for coherence and cross-spectra fft's. Optional, default `n_fft_coh` = `n_fft` - noise : float, list or numpy.ndarray - Instrument's doppler noise in same units as velocity + noise : float or array-like + Instrument noise level in same units as velocity. Typically + found from `adv.turbulence.doppler_noise_level`. + Default: None. 
""" - def __call__(self, ds, freq_units='rad/s', window='hann'): + def __call__(self, ds, freq_units="rad/s", window="hann"): out = type(ds)() out = self.bin_average(ds, out) - noise = ds.get('doppler_noise', [0, 0, 0]) - out['tke_vec'] = self.turbulent_kinetic_energy(ds['vel'], noise=noise) - out['stress_vec'] = self.reynolds_stress(ds['vel']) + noise = ds.get("doppler_noise", [0, 0, 0]) + out["tke_vec"] = self.turbulent_kinetic_energy(ds["vel"], noise=noise) + out["stress_vec"] = self.reynolds_stress(ds["vel"]) - out['psd'] = self.power_spectral_density(ds['vel'], - window=window, - freq_units=freq_units, - noise=noise) + out["psd"] = self.power_spectral_density( + ds["vel"], window=window, freq_units=freq_units, noise=noise + ) for key in list(ds.attrs.keys()): - if 'config' in key: + if "config" in key: ds.attrs.pop(key) out.attrs = ds.attrs - out.attrs['n_bin'] = self.n_bin - out.attrs['n_fft'] = self.n_fft - out.attrs['n_fft_coh'] = self.n_fft_coh + out.attrs["n_bin"] = self.n_bin + out.attrs["n_fft"] = self.n_fft + out.attrs["n_fft_coh"] = self.n_fft_coh return out def reynolds_stress(self, veldat, detrend=True): """ - Calculate the specific Reynolds stresses + Calculate the specific Reynolds stresses (cross-covariances of u,v,w in m^2/s^2) Parameters @@ -78,8 +79,7 @@ def reynolds_stress(self, veldat, detrend=True): time = self.mean(veldat.time.values) vel = veldat.values - out = np.empty(self._outshape(vel[:3].shape)[:-1], - dtype=np.float32) + out = np.empty(self._outshape(vel[:3].shape)[:-1], dtype=np.float32) if detrend: vel = self.detrend(vel) @@ -87,25 +87,29 @@ def reynolds_stress(self, veldat, detrend=True): vel = self.demean(vel) for idx, p in enumerate(self._cross_pairs): - out[idx] = np.nanmean(vel[p[0]] * vel[p[1]], - -1, dtype=np.float64 - ).astype(np.float32) - - da = xr.DataArray(out.astype('float32'), - dims=veldat.dims, - attrs={'units': 'm2 s-2', - 'long_name': 'Specific Reynolds Stress Vector'}) - da = da.rename({'dir': 'tau'}) - da = 
da.assign_coords({'tau': self.tau, 'time': time}) - + out[idx] = np.nanmean(vel[p[0]] * vel[p[1]], -1, dtype=np.float64).astype( + np.float32 + ) + + da = xr.DataArray( + out.astype("float32"), + dims=veldat.dims, + attrs={"units": "m2 s-2", "long_name": "Specific Reynolds Stress Vector"}, + ) + da = da.rename({"dir": "tau"}) + da = da.assign_coords({"tau": self.tau, "time": time}) + return da - def cross_spectral_density(self, veldat, - freq_units='rad/s', - fs=None, - window='hann', - n_bin=None, - n_fft_coh=None): + def cross_spectral_density( + self, + veldat, + freq_units="rad/s", + fs=None, + window="hann", + n_bin=None, + n_fft_coh=None, + ): """ Calculate the cross-spectral density of velocity components. @@ -114,7 +118,7 @@ def cross_spectral_density(self, veldat, veldat : xarray.DataArray The raw 3D velocity data. freq_units : string - Frequency units of the returned spectra in either Hz or rad/s + Frequency units of the returned spectra in either Hz or rad/s (`f` or :math:`\\omega`) fs : float (optional) The sample rate. Default = `binner.fs` @@ -135,7 +139,7 @@ def cross_spectral_density(self, veldat, if not isinstance(veldat, xr.DataArray): raise TypeError("`veldat` must be an instance of `xarray.DataArray`.") - if ('rad' not in freq_units) and ('Hz' not in freq_units): + if ("rad" not in freq_units) and ("Hz" not in freq_units): raise ValueError("`freq_units` should be one of 'Hz' or 'rad/s'") fs_in = self._parse_fs(fs) @@ -143,46 +147,57 @@ def cross_spectral_density(self, veldat, time = self.mean(veldat.time.values) veldat = veldat.values if len(np.shape(veldat)) != 2: - raise Exception("This function is only valid for calculating TKE using " - "the 3D velocity vector from an ADV.") + raise Exception( + "This function is only valid for calculating TKE using " + "the 3D velocity vector from an ADV." 
+ ) - out = np.empty(self._outshape_fft(veldat[:3].shape, n_fft=n_fft, n_bin=n_bin), - dtype='complex') + out = np.empty( + self._outshape_fft(veldat[:3].shape, n_fft=n_fft, n_bin=n_bin), + dtype="complex", + ) # Create frequency vector, also checks whether using f or omega - if 'rad' in freq_units: - fs = 2*np.pi*fs_in - freq_units = 'rad s-1' - units = 'm2 s-1 rad-1' + if "rad" in freq_units: + fs = 2 * np.pi * fs_in + freq_units = "rad s-1" + units = "m2 s-1 rad-1" else: fs = fs_in - freq_units = 'Hz' - units = 'm2 s-2 Hz-1' - coh_freq = xr.DataArray(self._fft_freq(fs=fs_in, units=freq_units, n_fft=n_fft, coh=True), - dims=['coh_freq'], - name='coh_freq', - attrs={'units': freq_units, - 'long_name': 'FFT Frequency Vector', - 'coverage_content_type': 'coordinate'} - ).astype('float32') + freq_units = "Hz" + units = "m2 s-2 Hz-1" + coh_freq = xr.DataArray( + self._fft_freq(fs=fs_in, units=freq_units, n_fft=n_fft, coh=True), + dims=["coh_freq"], + name="coh_freq", + attrs={ + "units": freq_units, + "long_name": "FFT Frequency Vector", + "coverage_content_type": "coordinate", + }, + ).astype("float32") for ip, ipair in enumerate(self._cross_pairs): - out[ip] = self._csd_base(veldat[ipair[0]], - veldat[ipair[1]], - fs=fs, - window=window, - n_bin=n_bin, - n_fft=n_fft) - - csd = xr.DataArray(out.astype('complex64'), - coords={'C': self.C, - 'time': time, - 'coh_freq': coh_freq}, - dims=['C', 'time', 'coh_freq'], - attrs={'units': units, - 'n_fft_coh': n_fft, - 'long_name': 'Cross Spectral Density'}) - csd['coh_freq'].attrs['units'] = freq_units + out[ip] = self._csd_base( + veldat[ipair[0]], + veldat[ipair[1]], + fs=fs, + window=window, + n_bin=n_bin, + n_fft=n_fft, + ) + + csd = xr.DataArray( + out.astype("complex64"), + coords={"C": self.C, "time": time, "coh_freq": coh_freq}, + dims=["C", "time", "coh_freq"], + attrs={ + "units": units, + "n_fft_coh": n_fft, + "long_name": "Cross Spectral Density", + }, + ) + csd["coh_freq"].attrs["units"] = freq_units return csd 
@@ -200,7 +215,7 @@ def doppler_noise_level(self, psd, pct_fN=0.8): Returns ------- - doppler_noise (xarray.DataArray): + doppler_noise (xarray.DataArray): Doppler noise level in units of m/s Notes @@ -213,54 +228,56 @@ def doppler_noise_level(self, psd, pct_fN=0.8): `N` is the constant variance or spectral density, and `f_{c}` is the characteristic frequency. - The characteristic frequency is then found as + The characteristic frequency is then found as .. :math: f_{c} = pct_fN * (f_{s}/2) where `f_{s}/2` is the Nyquist frequency. - Richard, Jean-Baptiste, et al. "Method for identification of Doppler noise - levels in turbulent flow measurements dedicated to tidal energy." International + Richard, Jean-Baptiste, et al. "Method for identification of Doppler noise + levels in turbulent flow measurements dedicated to tidal energy." International Journal of Marine Energy 3 (2013): 52-64. - Thiébaut, Maxime, et al. "Investigating the flow dynamics and turbulence at a - tidal-stream energy site in a highly energetic estuary." Renewable Energy 195 + Thiébaut, Maxime, et al. "Investigating the flow dynamics and turbulence at a + tidal-stream energy site in a highly energetic estuary." Renewable Energy 195 (2022): 252-262. 
""" - + if not isinstance(psd, xr.DataArray): raise TypeError("`psd` must be an instance of `xarray.DataArray`.") if not isinstance(pct_fN, float) or not 0 <= pct_fN <= 1: raise ValueError("`pct_fN` must be a float within the range [0, 1].") # Characteristic frequency set to 80% of Nyquist frequency - fN = self.fs/2 + fN = self.fs / 2 fc = pct_fN * fN # Get units right if psd.freq.units == "Hz": f_range = slice(fc, fN) else: - f_range = slice(2*np.pi*fc, 2*np.pi*fN) + f_range = slice(2 * np.pi * fc, 2 * np.pi * fN) # Noise floor N2 = psd.sel(freq=f_range) * psd.freq.sel(freq=f_range) - noise_level = np.sqrt(N2.mean(dim='freq')) + noise_level = np.sqrt(N2.mean(dim="freq")) return xr.DataArray( - noise_level.values.astype('float32'), - dims=['dir', 'time'], - attrs={'units': 'm/s', - 'long_name': 'Doppler Noise Level', - 'description': 'Doppler noise level calculated ' - 'from PSD white noise'}) + noise_level.values.astype("float32"), + coords={"S": psd["S"], "time": psd["time"]}, + attrs={ + "units": "m/s", + "long_name": "Doppler Noise Level", + "description": "Doppler noise level calculated " "from PSD white noise", + }, + ) def check_turbulence_cascade_slope(self, psd, freq_range=[6.28, 12.57]): """ - This function calculates the slope of the PSD, the power spectra + This function calculates the slope of the PSD, the power spectra of velocity, within the given frequency range. The purpose of this - function is to check that the region of the PSD containing the + function is to check that the region of the PSD containing the isotropic turbulence cascade decreases at a rate of :math:`f^{-5/3}`. 
Parameters @@ -268,14 +285,14 @@ def check_turbulence_cascade_slope(self, psd, freq_range=[6.28, 12.57]): psd : xarray.DataArray ([time,] freq) The power spectral density (1D or 2D) freq_range : iterable(2) (default: [6.28, 12.57]) - The range over which the isotropic turbulence cascade occurs, in + The range over which the isotropic turbulence cascade occurs, in units of the psd frequency vector (Hz or rad/s) Returns ------- (m, b): tuple (slope, y-intercept) - A tuple containing the coefficients of the log-adjusted linear - regression between PSD and frequency + A tuple containing the coefficients of the log-adjusted linear + regression between PSD and frequency Notes ----- @@ -283,9 +300,9 @@ def check_turbulence_cascade_slope(self, psd, freq_range=[6.28, 12.57]): .. math:: S(k) = \\alpha \\epsilon^{2/3} k^{-5/3} + N - The slope of the isotropic turbulence cascade, which should be - equal to :math:`k^{-5/3}` or :math:`f^{-5/3}`, where k and f are - the wavenumber and frequency vectors, is estimated using linear + The slope of the isotropic turbulence cascade, which should be + equal to :math:`k^{-5/3}` or :math:`f^{-5/3}`, where k and f are + the wavenumber and frequency vectors, is estimated using linear regression with a log transformation: .. math:: log10(y) = m*log10(x) + b @@ -293,36 +310,36 @@ def check_turbulence_cascade_slope(self, psd, freq_range=[6.28, 12.57]): Which is equivalent to .. math:: y = 10^{b} x^{m} - - Where :math:`y` is S(k) or S(f), :math:`x` is k or f, :math:`m` - is the slope (ideally -5/3), and :math:`10^{b}` is the intercept of + + Where :math:`y` is S(k) or S(f), :math:`x` is k or f, :math:`m` + is the slope (ideally -5/3), and :math:`10^{b}` is the intercept of y at x^m=1. 
""" if not isinstance(psd, xr.DataArray): raise TypeError("`psd` must be an instance of `xarray.DataArray`.") - if not hasattr(freq_range, '__iter__') or len(freq_range) != 2: + if not hasattr(freq_range, "__iter__") or len(freq_range) != 2: raise ValueError("`freq_range` must be an iterable of length 2.") - + idx = np.where((freq_range[0] < psd.freq) & (psd.freq < freq_range[1])) idx = idx[0] - x = np.log10(psd['freq'].isel(freq=idx)) + x = np.log10(psd["freq"].isel(freq=idx)) y = np.log10(psd.isel(freq=idx)) - y_bar = y.mean('freq') - x_bar = x.mean('freq') + y_bar = y.mean("freq") + x_bar = x.mean("freq") # using the formula to calculate the slope and intercept n = np.sum((x - x_bar) * (y - y_bar), axis=0) - d = np.sum((x - x_bar)**2, axis=0) + d = np.sum((x - x_bar) ** 2, axis=0) - m = n/d - b = y_bar - m*x_bar + m = n / d + b = y_bar - m * x_bar return m, b - def dissipation_rate_LT83(self, psd, U_mag, freq_range=[6.28, 12.57]): + def dissipation_rate_LT83(self, psd, U_mag, freq_range=[6.28, 12.57], noise=None): """ Calculate the dissipation rate from the PSD @@ -333,9 +350,13 @@ def dissipation_rate_LT83(self, psd, U_mag, freq_range=[6.28, 12.57]): U_mag : xarray.DataArray (...,time) The bin-averaged horizontal velocity [m/s] (from dataset shortcut) freq_range : iterable(2) - The range over which to integrate/average the spectrum, in units - of the psd frequency vector (Hz or rad/s). + The range over which to integrate/average the spectrum, in units + of the psd frequency vector (Hz or rad/s). Default = [6.28, 12.57] rad/s + noise : float or array-like + Instrument noise level in same units as velocity. Typically + found from `adv.turbulence.calc_doppler_noise`. + Default: None. 
Returns ------- @@ -369,49 +390,64 @@ def dissipation_rate_LT83(self, psd, U_mag, freq_range=[6.28, 12.57]): if not isinstance(psd, xr.DataArray): raise TypeError("`psd` must be an instance of `xarray.DataArray`.") if len(U_mag.shape) != 1: - raise Exception('U_mag should be 1-dimensional (time)') - if len(psd.time)!=len(U_mag.time): + raise Exception("U_mag should be 1-dimensional (time)") + if len(psd.time) != len(U_mag.time): raise Exception("`U_mag` should be from ensembled-averaged dataset") - if not hasattr(freq_range, '__iter__') or len(freq_range) != 2: + if not hasattr(freq_range, "__iter__") or len(freq_range) != 2: raise ValueError("`freq_range` must be an iterable of length 2.") + if noise is not None: + if np.shape(noise)[0] != 3: + raise Exception("Noise should have same first dimension as velocity") + else: + noise = np.array([0, 0, 0])[:, None, None] + + # Noise subtraction from binner.TimeBinner.calc_psd_base + psd = psd.copy() + if noise is not None: + psd -= noise**2 / (self.fs / 2) + psd = psd.where(psd > 0, np.min(np.abs(psd)) / 100) + freq = psd.freq idx = np.where((freq_range[0] < freq) & (freq < freq_range[1])) idx = idx[0] - if freq.units == 'Hz': - U = U_mag/(2*np.pi) + if freq.units == "Hz": + U = U_mag / (2 * np.pi) else: U = U_mag a = 0.5 - out = (psd.isel(freq=idx) * - freq.isel(freq=idx)**(5/3) / a).mean(axis=-1)**(3/2) / U + out = (psd.isel(freq=idx) * freq.isel(freq=idx) ** (5 / 3) / a).mean( + axis=-1 + ) ** (3 / 2) / U return xr.DataArray( - out.astype('float32'), - attrs={'units': 'm2 s-3', - 'long_name': 'TKE Dissipation Rate', - 'standard_name': 'specific_turbulent_kinetic_energy_dissipation_in_sea_water', - 'description': 'TKE dissipation rate calculated using ' - 'the method from Lumley and Terray, 1983', - }) - - def dissipation_rate_SF(self, vel_raw, U_mag, fs=None, freq_range=[2., 4.]): + out.astype("float32"), + attrs={ + "units": "m2 s-3", + "long_name": "TKE Dissipation Rate", + "standard_name": 
"specific_turbulent_kinetic_energy_dissipation_in_sea_water", + "description": "TKE dissipation rate calculated using " + "the method from Lumley and Terray, 1983", + }, + ) + + def dissipation_rate_SF(self, vel_raw, U_mag, fs=None, freq_range=[2.0, 4.0]): """ Calculate dissipation rate using the "structure function" (SF) method Parameters ---------- vel_raw : xarray.DataArray (time) - The raw velocity data upon which to perform the SF technique. + The raw velocity data upon which to perform the SF technique. U_mag : xarray.DataArray The bin-averaged horizontal velocity (from dataset shortcut) fs : float The sample rate of `vel_raw` [Hz] freq_range : iterable(2) The frequency range over which to compute the SF [Hz] - (i.e. the frequency range within which the isotropic + (i.e. the frequency range within which the isotropic turbulence cascade falls). Default = [2., 4.] Hz @@ -423,9 +459,9 @@ def dissipation_rate_SF(self, vel_raw, U_mag, fs=None, freq_range=[2., 4.]): if not isinstance(vel_raw, xr.DataArray): raise TypeError("`vel_raw` must be an instance of `xarray.DataArray`.") - if len(vel_raw.time)==len(U_mag.time): + if len(vel_raw.time) == len(U_mag.time): raise Exception("`U_mag` should be from ensembled-averaged dataset") - if not hasattr(freq_range, '__iter__') or len(freq_range) != 2: + if not hasattr(freq_range, "__iter__") or len(freq_range) != 2: raise ValueError("`freq_range` must be an iterable of length 2.") veldat = vel_raw.values @@ -434,7 +470,7 @@ def dissipation_rate_SF(self, vel_raw, U_mag, fs=None, freq_range=[2., 4.]): fs = self._parse_fs(fs) if freq_range[1] > fs: - warnings.warn('Max freq_range cannot be greater than fs') + warnings.warn("Max freq_range cannot be greater than fs") dt = self.reshape(veldat) out = np.empty(dt.shape[:-1], dtype=dt.dtype) @@ -449,15 +485,17 @@ def dissipation_rate_SF(self, vel_raw, U_mag, fs=None, freq_range=[2., 4.]): out[slc[:-1]] = (cv2m / 2.1) ** (3 / 2) return xr.DataArray( - out.astype('float32'), + 
out.astype("float32"), coords=U_mag.coords, dims=U_mag.dims, - attrs={'units': 'm2 s-3', - 'long_name': 'TKE Dissipation Rate', - 'standard_name': 'specific_turbulent_kinetic_energy_dissipation_in_sea_water', - 'description': 'TKE dissipation rate calculated using the ' - '"structure function" method', - }) + attrs={ + "units": "m2 s-3", + "long_name": "TKE Dissipation Rate", + "standard_name": "specific_turbulent_kinetic_energy_dissipation_in_sea_water", + "description": "TKE dissipation rate calculated using the " + '"structure function" method', + }, + ) def _up_angle(self, U_complex): """ @@ -498,11 +536,11 @@ def _integral_TE01(self, I_tke, theta): out = np.empty_like(I_tke.flatten()) for i, (b, t) in enumerate(zip(I_tke.flatten(), theta.flatten())): out[i] = np.trapz( - cbrt(x**2 - 2/b*np.cos(t)*x + b**(-2)) * - np.exp(-0.5 * x ** 2), x) + cbrt(x**2 - 2 / b * np.cos(t) * x + b ** (-2)) * np.exp(-0.5 * x**2), + x, + ) - return out.reshape(I_tke.shape) * \ - (2 * np.pi) ** (-0.5) * I_tke ** (2 / 3) + return out.reshape(I_tke.shape) * (2 * np.pi) ** (-0.5) * I_tke ** (2 / 3) def dissipation_rate_TE01(self, dat_raw, dat_avg, freq_range=[6.28, 12.57]): """ @@ -514,10 +552,10 @@ def dissipation_rate_TE01(self, dat_raw, dat_avg, freq_range=[6.28, 12.57]): The raw (off the instrument) adv dataset dat_avg : xarray.Dataset The bin-averaged adv dataset (calc'd from 'calc_turbulence' or - 'do_avg'). The spectra (psd) and basic turbulence statistics + 'do_avg'). The spectra (psd) and basic turbulence statistics ('tke_vec' and 'stress_vec') must already be computed. freq_range : iterable(2) - The range over which to integrate/average the spectrum, in units + The range over which to integrate/average the spectrum, in units of the psd frequency vector (Hz or rad/s). 
Default = [6.28, 12.57] rad/s @@ -531,15 +569,16 @@ def dissipation_rate_TE01(self, dat_raw, dat_avg, freq_range=[6.28, 12.57]): raise TypeError("`dat_raw` must be an instance of `xarray.Dataset`.") if not isinstance(dat_avg, xr.Dataset): raise TypeError("`dat_avg` must be an instance of `xarray.Dataset`.") - if not hasattr(freq_range, '__iter__') or len(freq_range) != 2: + if not hasattr(freq_range, "__iter__") or len(freq_range) != 2: raise ValueError("`freq_range` must be an iterable of length 2.") # Assign local names U_mag = dat_avg.velds.U_mag.values I_tke = dat_avg.velds.I_tke.values - theta = np.angle(dat_avg.velds.U.values) - \ - self._up_angle(dat_raw.velds.U.values) - freq = dat_avg['psd'].freq.values + theta = np.angle(dat_avg.velds.U.values) - self._up_angle( + dat_raw.velds.U.values + ) + freq = dat_avg["psd"].freq.values # Calculate constants alpha = 1.5 @@ -552,26 +591,31 @@ def dissipation_rate_TE01(self, dat_raw, dat_avg, freq_range=[6.28, 12.57]): # Estimate values # u & v components (equation 6) - out = (np.nanmean((psd[0] + psd[1]) * freq**(5/3), -1) / - (21/55 * alpha * intgrl))**(3/2) / U_mag + out = ( + np.nanmean((psd[0] + psd[1]) * freq ** (5 / 3), -1) + / (21 / 55 * alpha * intgrl) + ) ** (3 / 2) / U_mag # Add w component - out += (np.nanmean(psd[2] * freq**(5/3), -1) / - (12/55 * alpha * intgrl))**(3/2) / U_mag + out += ( + np.nanmean(psd[2] * freq ** (5 / 3), -1) / (12 / 55 * alpha * intgrl) + ) ** (3 / 2) / U_mag # Average the two estimates out *= 0.5 return xr.DataArray( - out.astype('float32'), - coords={'time': dat_avg.psd.time}, - dims='time', - attrs={'units': 'm2 s-3', - 'long_name': 'TKE Dissipation Rate', - 'standard_name': 'specific_turbulent_kinetic_energy_dissipation_in_sea_water', - 'description': 'TKE dissipation rate calculated using the ' - 'method from Trowbridge and Elgar, 2001' - }) + out.astype("float32"), + coords={"time": dat_avg.psd.time}, + dims="time", + attrs={ + "units": "m2 s-3", + "long_name": "TKE 
Dissipation Rate", + "standard_name": "specific_turbulent_kinetic_energy_dissipation_in_sea_water", + "description": "TKE dissipation rate calculated using the " + "method from Trowbridge and Elgar, 2001", + }, + ) def integral_length_scales(self, a_cov, U_mag, fs=None): """ @@ -601,26 +645,31 @@ def integral_length_scales(self, a_cov, U_mag, fs=None): if not isinstance(a_cov, xr.DataArray): raise TypeError("`a_cov` must be an instance of `xarray.DataArray`.") - if len(a_cov.time)!=len(U_mag.time): + if len(a_cov.time) != len(U_mag.time): raise Exception("`U_mag` should be from ensembled-averaged dataset") acov = a_cov.values fs = self._parse_fs(fs) - scale = np.argmin((acov/acov[..., :1]) > (1/np.e), axis=-1) + scale = np.argmin((acov / acov[..., :1]) > (1 / np.e), axis=-1) L_int = U_mag.values / fs * scale return xr.DataArray( - L_int.astype('float32'), - coords={'dir': a_cov.dir, 'time': a_cov.time}, - attrs={'units': 'm', - 'long_name': 'Integral Length Scale', - 'standard_name': 'turbulent_mixing_length_of_sea_water'}) - - -def turbulence_statistics(ds_raw, n_bin, fs, n_fft=None, freq_units='rad/s', window='hann'): + L_int.astype("float32"), + coords={"dir": a_cov.dir, "time": a_cov.time}, + attrs={ + "units": "m", + "long_name": "Integral Length Scale", + "standard_name": "turbulent_mixing_length_of_sea_water", + }, + ) + + +def turbulence_statistics( + ds_raw, n_bin, fs, n_fft=None, freq_units="rad/s", window="hann" +): """ - Functional version of `ADVBinner` that computes a suite of turbulence + Functional version of `ADVBinner` that computes a suite of turbulence statistics for the input dataset, and returns a `binned` data object. Parameters @@ -629,7 +678,7 @@ def turbulence_statistics(ds_raw, n_bin, fs, n_fft=None, freq_units='rad/s', win The raw adv datset to `bin`, average and compute turbulence statistics of. 
freq_units : string - Frequency units of the returned spectra in either Hz or rad/s + Frequency units of the returned spectra in either Hz or rad/s (`f` or :math:`\\omega`). Default is 'rad/s' window : string or array The window to use for calculating spectra. diff --git a/mhkit/dolfyn/binned.py b/mhkit/dolfyn/binned.py index 1db825dc2..0bdb00f73 100644 --- a/mhkit/dolfyn/binned.py +++ b/mhkit/dolfyn/binned.py @@ -3,19 +3,19 @@ from .tools.fft import fft_frequency, psd_1D, cpsd_1D, cpsd_quasisync_1D from .tools.misc import slice1d_along_axis, detrend_array from .time import epoch2dt64, dt642epoch -warnings.simplefilter('ignore', RuntimeWarning) + +warnings.simplefilter("ignore", RuntimeWarning) class TimeBinner: - def __init__(self, n_bin, fs, n_fft=None, n_fft_coh=None, - noise=[0, 0, 0]): + def __init__(self, n_bin, fs, n_fft=None, n_fft_coh=None, noise=[0, 0, 0]): """ Initialize an averaging object Parameters ---------- n_bin : int - Number of data points to include in a 'bin' (ensemble), not the + Number of data points to include in a 'bin' (ensemble), not the number of bins fs : int Instrument sampling frequency in Hz @@ -38,14 +38,15 @@ def __init__(self, n_bin, fs, n_fft=None, n_fft_coh=None, self.n_fft = n_bin elif n_fft > n_bin: self.n_fft = n_bin - warnings.warn( - "n_fft must be smaller than n_bin, setting n_fft = n_bin") + warnings.warn("n_fft must be smaller than n_bin, setting n_fft = n_bin") if n_fft_coh is None: self.n_fft_coh = int(self.n_fft) elif n_fft_coh > n_bin: self.n_fft_coh = int(n_bin) - warnings.warn("n_fft_coh must be smaller than or equal to n_bin, " - "setting n_fft_coh = n_bin") + warnings.warn( + "n_fft_coh must be smaller than or equal to n_bin, " + "setting n_fft_coh = n_bin" + ) def _outshape(self, inshape, n_pad=0, n_bin=None): """ @@ -77,8 +78,7 @@ def _parse_nfft(self, n_fft=None): return self.n_fft if n_fft > self.n_bin: n_fft = self.n_bin - warnings.warn( - "n_fft must be smaller than n_bin, setting n_fft = n_bin") + 
warnings.warn("n_fft must be smaller than n_bin, setting n_fft = n_bin") return n_fft def _parse_nfft_coh(self, n_fft_coh=None): @@ -86,8 +86,10 @@ def _parse_nfft_coh(self, n_fft_coh=None): return self.n_fft_coh if n_fft_coh > self.n_bin: n_fft_coh = int(self.n_bin) - warnings.warn("n_fft_coh must be smaller than or equal to n_bin, " - "setting n_fft_coh = n_bin") + warnings.warn( + "n_fft_coh must be smaller than or equal to n_bin, " + "setting n_fft_coh = n_bin" + ) return n_fft_coh def _check_ds(self, raw_ds, out_ds): @@ -109,17 +111,22 @@ def _check_ds(self, raw_ds, out_ds): for v in raw_ds.data_vars: if np.any(np.array(raw_ds[v].shape) == 0): - raise RuntimeError(f"{v} cannot be averaged " - "because it is empty.") - if 'DutyCycle_NBurst' in raw_ds.attrs and \ - raw_ds.attrs['DutyCycle_NBurst'] < self.n_bin: - warnings.warn(f"The averaging interval (n_bin = {self.n_bin})" - "is larger than the burst interval " - "(NBurst = {dat.attrs['DutyCycle_NBurst']})") + raise RuntimeError(f"{v} cannot be averaged " "because it is empty.") + if ( + "DutyCycle_NBurst" in raw_ds.attrs + and raw_ds.attrs["DutyCycle_NBurst"] < self.n_bin + ): + warnings.warn( + f"The averaging interval (n_bin = {self.n_bin})" + "is larger than the burst interval " + "(NBurst = {dat.attrs['DutyCycle_NBurst']})" + ) if raw_ds.fs != self.fs: - raise Exception(f"The input data sample rate ({raw_ds.fs}) does not " - "match the sample rate of this binning-object " - "({self.fs})") + raise Exception( + f"The input data sample rate ({raw_ds.fs}) does not " + "match the sample rate of this binning-object " + "({self.fs})" + ) if out_ds is None: out_ds = type(raw_ds)() @@ -127,11 +134,12 @@ def _check_ds(self, raw_ds, out_ds): o_attrs = out_ds.attrs props = {} - props['fs'] = self.fs - props['n_bin'] = self.n_bin - props['n_fft'] = self.n_fft - props['description'] = 'Binned averages calculated from ' \ - 'ensembles of size "n_bin"' + props["fs"] = self.fs + props["n_bin"] = self.n_bin + 
props["n_fft"] = self.n_fft + props["description"] = ( + "Binned averages calculated from " 'ensembles of size "n_bin"' + ) props.update(raw_ds.attrs) for ky in props: @@ -140,24 +148,25 @@ def _check_ds(self, raw_ds, out_ds): # plus those defined above) raise AttributeError( "The attribute '{}' of `out_ds` is inconsistent " - "with this `VelBinner` or the input data (`raw_ds`)".format(ky)) + "with this `VelBinner` or the input data (`raw_ds`)".format(ky) + ) else: o_attrs[ky] = props[ky] return out_ds def _new_coords(self, array): """ - Function for setting up a new xarray.DataArray regardless of how + Function for setting up a new xarray.DataArray regardless of how many dimensions the input data-array has """ dims = array.dims dims_list = [] coords_dict = {} - if len(array.shape) == 1 & ('dir' in array.coords): - array = array.drop_vars('dir') + if len(array.shape) == 1 & ("dir" in array.coords): + array = array.drop_vars("dir") for ky in dims: dims_list.append(ky) - if 'time' in ky: + if "time" in ky: coords_dict[ky] = self.mean(array.time.values) else: coords_dict[ky] = array.coords[ky].values @@ -198,34 +207,33 @@ def reshape(self, arr, n_pad=0, n_bin=None): n_bin = self._parse_nbin(n_bin) if arr.shape[-1] < n_bin: - raise Exception('n_bin is larger than length of input array') + raise Exception("n_bin is larger than length of input array") npd0 = int(n_pad // 2) npd1 = int((n_pad + 1) // 2) shp = self._outshape(arr.shape, n_pad=0, n_bin=n_bin) out = np.zeros( - self._outshape(arr.shape, n_pad=n_pad, n_bin=n_bin), - dtype=arr.dtype) + self._outshape(arr.shape, n_pad=n_pad, n_bin=n_bin), dtype=arr.dtype + ) if np.mod(n_bin, 1) == 0: # n_bin needs to be int n_bin = int(n_bin) # If n_bin is an integer, we can do this simply. 
- out[..., npd0: n_bin + npd0] = ( - arr[..., :(shp[-2] * shp[-1])]).reshape(shp, order='C') + out[..., npd0 : n_bin + npd0] = (arr[..., : (shp[-2] * shp[-1])]).reshape( + shp, order="C" + ) else: - inds = (np.arange(np.prod(shp[-2:])) * n_bin // int(n_bin) - ).astype(int) + inds = (np.arange(np.prod(shp[-2:])) * n_bin // int(n_bin)).astype(int) # If there are too many indices, drop one bin if inds[-1] >= arr.shape[-1]: - inds = inds[:-int(n_bin)] + inds = inds[: -int(n_bin)] shp[-2] -= 1 out = out[..., 1:, :] n_bin = int(n_bin) - out[..., npd0:n_bin + npd0] = (arr[..., inds] - ).reshape(shp, order='C') + out[..., npd0 : n_bin + npd0] = (arr[..., inds]).reshape(shp, order="C") n_bin = int(n_bin) if n_pad != 0: - out[..., 1:, :npd0] = out[..., :-1, n_bin:n_bin + npd0] - out[..., :-1, -npd1:] = out[..., 1:, npd0:npd0 + npd1] + out[..., 1:, :npd0] = out[..., :-1, n_bin : n_bin + npd0] + out[..., :-1, -npd1:] = out[..., 1:, npd0 : npd0 + npd1] return out @@ -336,7 +344,7 @@ def variance(self, arr, axis=-1, n_bin=None): def standard_deviation(self, arr, axis=-1, n_bin=None): """ Reshape the array `arr` to shape (...,n,n_bin+n_pad) - and take the standard deviation of each bin along the + and take the standard deviation of each bin along the specified `axis`. Parameters @@ -354,8 +362,17 @@ def standard_deviation(self, arr, axis=-1, n_bin=None): return np.nanstd(self.reshape(arr, n_bin=n_bin), axis=axis, dtype=np.float32) - def _psd_base(self, dat, fs=None, window='hann', noise=0, - n_bin=None, n_fft=None, n_pad=None, step=None): + def _psd_base( + self, + dat, + fs=None, + window="hann", + noise=0, + n_bin=None, + n_fft=None, + n_pad=None, + step=None, + ): """ Calculate power spectral density of `dat` @@ -371,10 +388,10 @@ def _psd_base(self, dat, fs=None, window='hann', noise=0, The white-noise level of the measurement (in the same units as `dat`). 
n_bin : int - n_bin of veldat2, number of elements per bin if 'None' is taken + n_bin of veldat2, number of elements per bin if 'None' is taken from VelBinner n_fft : int - n_fft of veldat2, number of elements per bin if 'None' is taken + n_fft of veldat2, number of elements per bin if 'None' is taken from VelBinner n_pad : int (optional) The number of values to pad with zero. Default = 0 @@ -403,36 +420,34 @@ def _psd_base(self, dat, fs=None, window='hann', noise=0, dat = self.reshape(dat, n_pad=n_pad) for slc in slice1d_along_axis(dat.shape, -1): - out[slc] = psd_1D(dat[slc], n_fft, fs, - window=window, step=step) - if noise != 0: - out -= noise**2 / (fs/2) + out[slc] = psd_1D(dat[slc], n_fft, fs, window=window, step=step) + if np.any(noise): + out -= noise**2 / (fs / 2) # Make sure all values of the PSD are >0 (but still small): out[out < 0] = np.min(np.abs(out)) / 100 return out - def _csd_base(self, dat1, dat2, fs=None, window='hann', - n_fft=None, n_bin=None): + def _csd_base(self, dat1, dat2, fs=None, window="hann", n_fft=None, n_bin=None): """ Calculate the cross power spectral density of `dat`. Parameters ---------- dat1 : numpy.ndarray - The first (shorter, if applicable) raw dataArray of which to + The first (shorter, if applicable) raw dataArray of which to calculate the cpsd. dat2 : numpy.ndarray - The second (the shorter, if applicable) raw dataArray of which to + The second (the shorter, if applicable) raw dataArray of which to calculate the cpsd. fs : float (optional) The sample rate (Hz). window : str String indicating the window function to use. 
Default is 'hanning' n_fft : int - n_fft of veldat2, number of elements per bin if 'None' is taken + n_fft of veldat2, number of elements per bin if 'None' is taken from VelBinner n_bin : int - n_bin of veldat2, number of elements per bin if 'None' is taken + n_bin of veldat2, number of elements per bin if 'None' is taken from VelBinner Returns @@ -444,7 +459,7 @@ def _csd_base(self, dat1, dat2, fs=None, window='hann', ----- PSD's are calculated based on sample rate units - The two velocity inputs do not have to be perfectly synchronized, but + The two velocity inputs do not have to be perfectly synchronized, but they should have the same start and end timestamps """ @@ -453,7 +468,7 @@ def _csd_base(self, dat1, dat2, fs=None, window='hann', n_fft = self.n_fft_coh # want each slice to carry the same timespan n_bin2 = self._parse_nbin(n_bin) # bins for shorter array - n_bin1 = int(dat1.shape[-1]/(dat2.shape[-1]/n_bin2)) + n_bin1 = int(dat1.shape[-1] / (dat2.shape[-1] / n_bin2)) oshp = self._outshape_fft(dat1.shape, n_fft=n_fft, n_bin=n_bin1) oshp[-2] = np.min([oshp[-2], int(dat2.shape[-1] // n_bin2)]) @@ -461,17 +476,16 @@ def _csd_base(self, dat1, dat2, fs=None, window='hann', # The data is detrended in psd, so we don't need to do it here: dat1 = self.reshape(dat1, n_pad=n_fft) dat2 = self.reshape(dat2, n_pad=n_fft) - out = np.empty(oshp, dtype='c{}'.format(dat1.dtype.itemsize * 2)) + out = np.empty(oshp, dtype="c{}".format(dat1.dtype.itemsize * 2)) if dat1.shape == dat2.shape: cross = cpsd_1D else: cross = cpsd_quasisync_1D for slc in slice1d_along_axis(out.shape, -1): - out[slc] = cross(dat1[slc], dat2[slc], n_fft, - fs, window=window) + out[slc] = cross(dat1[slc], dat2[slc], n_fft, fs, window=window) return out - def _fft_freq(self, fs=None, units='Hz', n_fft=None, coh=False): + def _fft_freq(self, fs=None, units="Hz", n_fft=None, coh=False): """ Wrapper to calculate the ordinary or radial frequency vector @@ -486,7 +500,7 @@ def _fft_freq(self, fs=None, 
units='Hz', n_fft=None, coh=False): (default: False) i.e. use self.n_fft_coh instead of self.n_fft. n_fft : int - n_fft of veldat2, number of elements per bin if 'None' is taken + n_fft of veldat2, number of elements per bin if 'None' is taken from VelBinner Returns @@ -502,11 +516,13 @@ def _fft_freq(self, fs=None, units='Hz', n_fft=None, coh=False): fs = self._parse_fs(fs) - if ('Hz' not in units) and ('rad' not in units): - raise Exception('Valid fft frequency vector units are Hz \ - or rad/s') + if ("Hz" not in units) and ("rad" not in units): + raise Exception( + "Valid fft frequency vector units are Hz \ + or rad/s" + ) - if 'rad' in units: - return fft_frequency(n_fft, 2*np.pi*fs) + if "rad" in units: + return fft_frequency(n_fft, 2 * np.pi * fs) else: return fft_frequency(n_fft, fs) diff --git a/mhkit/dolfyn/io/api.py b/mhkit/dolfyn/io/api.py index e540d53d0..1364a46dc 100644 --- a/mhkit/dolfyn/io/api.py +++ b/mhkit/dolfyn/io/api.py @@ -7,20 +7,27 @@ from .rdi import read_rdi from .base import _create_dataset, _get_filetype from ..rotate.base import _set_coords -from ..time import date2matlab, matlab2date, date2dt64, dt642date, date2epoch, epoch2date +from ..time import ( + date2matlab, + matlab2date, + date2dt64, + dt642date, + date2epoch, + epoch2date, +) def _check_file_ext(path, ext): filename = path.replace("\\", "/").rsplit("/")[-1] # windows/linux # for a filename like mcrl.water_velocity-1s.b1.20200813.150000.nc file_ext = filename.rsplit(".")[-1] - if '.' in filename: + if "." in filename: if file_ext != ext: raise IOError("File extension must be of the type {}".format(ext)) if file_ext == ext: return path - return path + '.' + ext + return path + "." + ext def _decode_cf(dataset: xr.Dataset) -> xr.Dataset: @@ -76,7 +83,7 @@ def read(fname, userdata=True, nens=None, **kwargs): userdata : True, False, or string of userdata.json filename (default ``True``) Whether to read the '.userdata.json' file. 
nens : None, int or 2-element tuple (start, stop) - Number of pings or ensembles to read from the file. + Number of pings or ensembles to read from the file. Default is None, read entire file **kwargs : dict Passed to instrument-specific parser. @@ -88,19 +95,21 @@ def read(fname, userdata=True, nens=None, **kwargs): """ file_type = _get_filetype(fname) - if file_type == '': - raise IOError("File '{}' looks like a git-lfs pointer. You may need to " - "install and initialize git-lfs. See https://git-lfs.github.com" - " for details.".format(fname)) + if file_type == "": + raise IOError( + "File '{}' looks like a git-lfs pointer. You may need to " + "install and initialize git-lfs. See https://git-lfs.github.com" + " for details.".format(fname) + ) elif file_type is None: - raise IOError("File '{}' is not recognized as a file-type that is readable by " - "DOLfYN. If you think it should be readable, try using the " - "appropriate read function (`read_rdi`, `read_nortek`, or " - "`read_signature`) found in dolfyn.io.api.".format(fname)) + raise IOError( + "File '{}' is not recognized as a file-type that is readable by " + "DOLfYN. 
If you think it should be readable, try using the " + "appropriate read function (`read_rdi`, `read_nortek`, or " + "`read_signature`) found in dolfyn.io.api.".format(fname) + ) else: - func_map = dict(RDI=read_rdi, - nortek=read_nortek, - signature=read_signature) + func_map = dict(RDI=read_rdi, nortek=read_nortek, signature=read_signature) func = func_map[file_type] return func(fname, userdata=userdata, nens=nens, **kwargs) @@ -130,16 +139,13 @@ def read_example(name, **kwargs): """ testdir = dirname(abspath(__file__)) - exdir = normpath(join(testdir, relpath('../../../examples/data/dolfyn/'))) - filename = exdir + '/' + name + exdir = normpath(join(testdir, relpath("../../../examples/data/dolfyn/"))) + filename = exdir + "/" + name return read(filename, **kwargs) -def save(ds, filename, - format='NETCDF4', engine='netcdf4', - compression=False, - **kwargs): +def save(ds, filename, format="NETCDF4", engine="netcdf4", compression=False, **kwargs): """ Save xarray dataset as netCDF (.nc). @@ -167,31 +173,41 @@ def save(ds, filename, See the xarray.to_netcdf documentation for more details. 
""" - filename = _check_file_ext(filename, 'nc') + filename = _check_file_ext(filename, "nc") # Handling complex values for netCDF4 - ds.attrs['complex_vars'] = [] + ds.attrs["complex_vars"] = [] for var in ds.data_vars: if np.iscomplexobj(ds[var]): - ds[var+'_real'] = ds[var].real - ds[var+'_imag'] = ds[var].imag + ds[var + "_real"] = ds[var].real + ds[var + "_imag"] = ds[var].imag ds = ds.drop_vars(var) - ds.attrs['complex_vars'].append(var) + ds.attrs["complex_vars"].append(var) # For variables that get rewritten to float64 elif ds[var].dtype == np.float64: - ds[var] = ds[var].astype('float32') - - if compression: - enc = dict() - for ky in ds.variables: - enc[ky] = dict(zlib=True, complevel=1) - if 'encoding' in kwargs: - # Overwrite ('update') values in enc with whatever is in kwargs['encoding'] - enc.update(kwargs['encoding']) - else: - kwargs['encoding'] = enc + ds[var] = ds[var].astype("float32") + + # Write variable encoding + enc = dict() + if "encoding" in kwargs: + enc.update(kwargs["encoding"]) + for ky in ds.variables: + # Save prior encoding + enc[ky] = ds[ky].encoding + # Remove unexpected netCDF4 encoding parameters + # https://github.com/pydata/xarray/discussions/5709 + params = ["szip", "zstd", "bzip2", "blosc", "contiguous", "chunksizes"] + [enc[ky].pop(p) for p in params if p in enc[ky]] + + if compression: + # New netcdf4-c cannot compress variable length strings + if ds[ky].size <= 1 or isinstance(ds[ky].data[0], str): + continue + enc[ky].update(dict(zlib=True, complevel=1)) + + kwargs["encoding"] = enc # Fix encoding on datetime64 variables. ds = _decode_cf(ds) @@ -214,25 +230,26 @@ def load(filename): An xarray dataset from the binary instrument data. 
""" - filename = _check_file_ext(filename, 'nc') + filename = _check_file_ext(filename, "nc") - ds = xr.load_dataset(filename, engine='netcdf4') + ds = xr.load_dataset(filename, engine="netcdf4") # Convert numpy arrays and strings back to lists for nm in ds.attrs: - if type(ds.attrs[nm]) == np.ndarray and ds.attrs[nm].size > 1: + if isinstance(ds.attrs[nm], np.ndarray) and ds.attrs[nm].size > 1: ds.attrs[nm] = list(ds.attrs[nm]) - elif type(ds.attrs[nm]) == str and nm in ['rotate_vars']: + elif isinstance(ds.attrs[nm], str) and nm in ["rotate_vars"]: ds.attrs[nm] = [ds.attrs[nm]] # Rejoin complex numbers - if hasattr(ds, 'complex_vars') and len(ds.complex_vars): - if len(ds.complex_vars[0]) == 1: - ds.attrs['complex_vars'] = [ds.complex_vars] - for var in ds.complex_vars: - ds[var] = ds[var+'_real'] + ds[var+'_imag'] * 1j - ds = ds.drop_vars([var+'_real', var+'_imag']) - ds.attrs.pop('complex_vars') + if hasattr(ds, "complex_vars"): + if len(ds.complex_vars): + if len(ds.complex_vars[0]) == 1: + ds.attrs["complex_vars"] = [ds.complex_vars] + for var in ds.complex_vars: + ds[var] = ds[var + "_real"] + ds[var + "_imag"] * 1j + ds = ds.drop_vars([var + "_real", var + "_imag"]) + ds.attrs.pop("complex_vars") return ds @@ -262,20 +279,18 @@ def save_mat(ds, filename, datenum=True): """ def copy_attrs(matfile, ds, key): - if hasattr(ds[key], 'units'): - matfile['units'][key] = ds[key].units - if hasattr(ds[key], 'long_name'): - matfile['long_name'][key] = ds[key].long_name - if hasattr(ds[key], 'standard_name'): - matfile['standard_name'][key] = ds[key].standard_name + if hasattr(ds[key], "units"): + matfile["units"][key] = ds[key].units + if hasattr(ds[key], "long_name"): + matfile["long_name"][key] = ds[key].long_name + if hasattr(ds[key], "standard_name"): + matfile["standard_name"][key] = ds[key].standard_name - filename = _check_file_ext(filename, 'mat') + filename = _check_file_ext(filename, "mat") # Convert time to datenum - t_coords = [t for t in ds.coords if 
np.issubdtype( - ds[t].dtype, np.datetime64)] - t_data = [t for t in ds.data_vars if np.issubdtype( - ds[t].dtype, np.datetime64)] + t_coords = [t for t in ds.coords if np.issubdtype(ds[t].dtype, np.datetime64)] + t_data = [t for t in ds.data_vars if np.issubdtype(ds[t].dtype, np.datetime64)] if datenum: func = date2matlab @@ -289,19 +304,25 @@ def copy_attrs(matfile, ds, key): dt = func(dt642date(ds[ky])) ds[ky].data = dt - ds.attrs['time_coords'] = t_coords - ds.attrs['time_data_vars'] = t_data + ds.attrs["time_coords"] = t_coords + ds.attrs["time_data_vars"] = t_data # Save xarray structure with more descriptive structure names - matfile = {'vars': {}, 'coords': {}, 'config': {}, - 'units': {}, 'long_name': {}, 'standard_name': {}} + matfile = { + "vars": {}, + "coords": {}, + "config": {}, + "units": {}, + "long_name": {}, + "standard_name": {}, + } for ky in ds.data_vars: - matfile['vars'][ky] = ds[ky].values + matfile["vars"][ky] = ds[ky].values copy_attrs(matfile, ds, ky) for ky in ds.coords: - matfile['coords'][ky] = ds[ky].values + matfile["coords"][ky] = ds[ky].values copy_attrs(matfile, ds, ky) - matfile['config'] = ds.attrs + matfile["config"] = ds.attrs sio.savemat(filename, matfile) @@ -318,7 +339,7 @@ def load_mat(filename, datenum=True): filename : str Filename and/or path with the '.mat' extension datenum : bool - If true, converts time from datenum. If false, converts time from + If true, converts time from datenum. If false, converts time from "epoch time". 
Returns @@ -331,19 +352,25 @@ def load_mat(filename, datenum=True): scipy.io.loadmat() """ - filename = _check_file_ext(filename, 'mat') + filename = _check_file_ext(filename, "mat") data = sio.loadmat(filename, struct_as_record=False, squeeze_me=True) - ds_dict = {'vars': {}, 'coords': {}, 'config': {}, - 'units': {}, 'long_name': {}, 'standard_name': {}} + ds_dict = { + "vars": {}, + "coords": {}, + "config": {}, + "units": {}, + "long_name": {}, + "standard_name": {}, + } for nm in ds_dict: key_list = data[nm]._fieldnames for ky in key_list: ds_dict[nm][ky] = getattr(data[nm], ky) - ds_dict['data_vars'] = ds_dict.pop('vars') - ds_dict['attrs'] = ds_dict.pop('config') + ds_dict["data_vars"] = ds_dict.pop("vars") + ds_dict["attrs"] = ds_dict.pop("config") # Recreate dataset ds = _create_dataset(ds_dict) @@ -351,16 +378,20 @@ def load_mat(filename, datenum=True): # Convert numpy arrays and strings back to lists for nm in ds.attrs: - if type(ds.attrs[nm]) == np.ndarray and ds.attrs[nm].size > 1: + if isinstance(ds.attrs[nm], np.ndarray) and ds.attrs[nm].size > 1: try: - ds.attrs[nm] = [x.strip(' ') for x in list(ds.attrs[nm])] + ds.attrs[nm] = [x.strip(" ") for x in list(ds.attrs[nm])] except: ds.attrs[nm] = list(ds.attrs[nm]) - elif type(ds.attrs[nm]) == str and nm in ['time_coords', 'time_data_vars', 'rotate_vars']: + elif isinstance(ds.attrs[nm], str) and nm in [ + "time_coords", + "time_data_vars", + "rotate_vars", + ]: ds.attrs[nm] = [ds.attrs[nm]] - if hasattr(ds, 'orientation_down'): - ds['orientation_down'] = ds['orientation_down'].astype(bool) + if hasattr(ds, "orientation_down"): + ds["orientation_down"] = ds["orientation_down"].astype(bool) if datenum: func = matlab2date @@ -368,15 +399,15 @@ def load_mat(filename, datenum=True): func = epoch2date # Restore datnum to np.dt64 - if hasattr(ds, 'time_coords'): - for ky in ds.attrs['time_coords']: + if hasattr(ds, "time_coords"): + for ky in ds.attrs["time_coords"]: dt = date2dt64(func(ds[ky].values)) ds = 
ds.assign_coords({ky: dt}) - ds.attrs.pop('time_coords') - if hasattr(ds, 'time_data_vars'): - for ky in ds.attrs['time_data_vars']: + ds.attrs.pop("time_coords") + if hasattr(ds, "time_data_vars"): + for ky in ds.attrs["time_data_vars"]: dt = date2dt64(func(ds[ky].values)) ds[ky].data = dt - ds.attrs.pop('time_data_vars') + ds.attrs.pop("time_data_vars") return ds diff --git a/mhkit/dolfyn/io/base.py b/mhkit/dolfyn/io/base.py index 8f3b4469a..545035cdb 100644 --- a/mhkit/dolfyn/io/base.py +++ b/mhkit/dolfyn/io/base.py @@ -23,18 +23,18 @@ def _get_filetype(fname): ' - if the file looks like a GIT-LFS pointer. """ - with open(fname, 'rb') as rdr: + with open(fname, "rb") as rdr: bytes = rdr.read(40) code = bytes[:2].hex() - if code in ['7f79', '7f7f']: - return 'RDI' - elif code in ['a50a']: - return 'signature' - elif code in ['a505']: + if code in ["7f79", "7f7f"]: + return "RDI" + elif code in ["a50a"]: + return "signature" + elif code in ["a505"]: # AWAC - return 'nortek' - elif bytes == b'version https://git-lfs.github.com/spec/': - return '' + return "nortek" + elif bytes == b"version https://git-lfs.github.com/spec/": + return "" else: return None @@ -42,13 +42,12 @@ def _get_filetype(fname): def _find_userdata(filename, userdata=True): # This function finds the file to read if userdata: - for basefile in [filename.rsplit('.', 1)[0], - filename]: - jsonfile = basefile + '.userdata.json' + for basefile in [filename.rsplit(".", 1)[0], filename]: + jsonfile = basefile + ".userdata.json" if os.path.isfile(jsonfile): return _read_userdata(jsonfile) - elif isinstance(userdata, (str, )) or hasattr(userdata, 'read'): + elif isinstance(userdata, (str,)) or hasattr(userdata, "read"): return _read_userdata(userdata) return {} @@ -60,232 +59,269 @@ def _read_userdata(fname): """ with open(fname) as data_file: data = json.load(data_file) - for nm in ['body2head_rotmat', 'body2head_vec']: + for nm in ["body2head_rotmat", "body2head_vec"]: if nm in data: - new_name = 'inst' 
+ nm[4:] + new_name = "inst" + nm[4:] warnings.warn( - f'{nm} has been deprecated, please change this to {new_name} \ - in {fname}.') + f"{nm} has been deprecated, please change this to {new_name} \ + in {fname}." + ) data[new_name] = data.pop(nm) - if 'inst2head_rotmat' in data: - if data['inst2head_rotmat'] in ['identity', 'eye', 1, 1.]: - data['inst2head_rotmat'] = np.eye(3) + if "inst2head_rotmat" in data: + if data["inst2head_rotmat"] in ["identity", "eye", 1, 1.0]: + data["inst2head_rotmat"] = np.eye(3) else: - data['inst2head_rotmat'] = np.array(data['inst2head_rotmat']) - if 'inst2head_vec' in data and type(data['inst2head_vec']) != list: - data['inst2head_vec'] = list(data['inst2head_vec']) + data["inst2head_rotmat"] = np.array(data["inst2head_rotmat"]) + if "inst2head_vec" in data and type(data["inst2head_vec"]) != list: + data["inst2head_vec"] = list(data["inst2head_vec"]) return data def _handle_nan(data): """ - Finds trailing nan's that cause issues in running the rotation + Finds trailing nan's that cause issues in running the rotation algorithms and deletes them. 
""" - nan = np.zeros(data['coords']['time'].shape, dtype=bool) - l = data['coords']['time'].size + nan = np.zeros(data["coords"]["time"].shape, dtype=bool) + l = data["coords"]["time"].size - if any(np.isnan(data['coords']['time'])): - nan += np.isnan(data['coords']['time']) + if any(np.isnan(data["coords"]["time"])): + nan += np.isnan(data["coords"]["time"]) # Required for motion-correction algorithm - var = ['accel', 'angrt', 'mag'] - for key in data['data_vars']: + var = ["accel", "angrt", "mag"] + for key in data["data_vars"]: if any(val in key for val in var): - shp = data['data_vars'][key].shape + shp = data["data_vars"][key].shape if shp[-1] == l: if len(shp) == 1: - if any(np.isnan(data['data_vars'][key])): - nan += np.isnan(data['data_vars'][key]) + if any(np.isnan(data["data_vars"][key])): + nan += np.isnan(data["data_vars"][key]) elif len(shp) == 2: - if any(np.isnan(data['data_vars'][key][-1])): - nan += np.isnan(data['data_vars'][key][-1]) + if any(np.isnan(data["data_vars"][key][-1])): + nan += np.isnan(data["data_vars"][key][-1]) trailing = np.cumsum(nan)[-1] if trailing > 0: - data['coords']['time'] = data['coords']['time'][:-trailing] - for key in data['data_vars']: - if data['data_vars'][key].shape[-1] == l: - data['data_vars'][key] = data['data_vars'][key][..., :-trailing] + data["coords"]["time"] = data["coords"]["time"][:-trailing] + for key in data["data_vars"]: + if data["data_vars"][key].shape[-1] == l: + data["data_vars"][key] = data["data_vars"][key][..., :-trailing] return data def _create_dataset(data): - """Creates an xarray dataset from dictionary created from binary + """ + Creates an xarray dataset from dictionary created from binary readers. 
Direction 'dir' coordinates are set in `set_coords` """ - ds = xr.Dataset() - tag = ['_avg', '_b5', '_echo', '_bt', '_gps', '_ast', '_sl'] - - FoR = {} - try: - beams = data['attrs']['n_beams'] - except: - beams = data['attrs']['n_beams_avg'] + + tag = ["_avg", "_b5", "_echo", "_bt", "_gps", "_altraw", "_altraw_avg", "_sl"] + + ds_dict = {} + for key in data["coords"]: + ds_dict[key] = {"dims": (key), "data": data["coords"][key]} + + # Set various coordinate frames + if "n_beams_avg" in data["attrs"]: + beams = data["attrs"]["n_beams_avg"] + else: + beams = data["attrs"]["n_beams"] n_beams = max(min(beams, 4), 3) - beams = np.arange(1, n_beams+1, dtype=np.int32) - FoR['beam'] = xr.DataArray(beams, dims=['beam'], name='beam', attrs={ - 'units': '1', 'long_name': 'Beam Reference Frame'}) - FoR['dir'] = xr.DataArray(beams, dims=['dir'], name='dir', attrs={ - 'units': '1', 'long_name': 'Reference Frame'}) + beams = np.arange(1, n_beams + 1, dtype=np.int32) - for key in data['data_vars']: + ds_dict["beam"] = {"dims": ("beam"), "data": beams} + ds_dict["dir"] = {"dims": ("dir"), "data": beams} + data["units"].update({"beam": "1", "dir": "1"}) + data["long_name"].update({"beam": "Beam Reference Frame", "dir": "Reference Frame"}) + + # Iterate through data variables and add them to new dictionary + for key in data["data_vars"]: # orientation matrices - if 'mat' in key: - if 'inst' in key: # beam2inst & inst2head orientation matrices - ds[key] = xr.DataArray(data['data_vars'][key], - coords={'x1': beams, 'x2': beams}, - dims=['x1', 'x2'], - attrs={'units': '1', - 'long_name': 'Rotation Matrix'}) - elif 'orientmat' in key: # earth2inst orientation matrix + if "mat" in key: + if "inst" in key: # beam2inst & inst2head orientation matrices + if "x1" not in ds_dict: + ds_dict["x1"] = {"dims": ("x1"), "data": beams} + ds_dict["x2"] = {"dims": ("x2"), "data": beams} + + ds_dict[key] = {"dims": ("x1", "x2"), "data": data["data_vars"][key]} + data["units"].update({key: "1"}) + 
data["long_name"].update({key: "Rotation Matrix"}) + + elif "orientmat" in key: # earth2inst orientation matrix if any(val in key for val in tag): - tg = '_' + key.rsplit('_')[-1] + tg = "_" + key.rsplit("_")[-1] else: - tg = '' - earth = xr.DataArray(['E', 'N', 'U'], dims=['earth'], name='earth', attrs={ - 'units': '1', 'long_name': 'Earth Reference Frame'}) - inst = xr.DataArray(['X', 'Y', 'Z'], dims=['inst'], name='inst', attrs={ - 'units': '1', 'long_name': 'Instrument Reference Frame'}) - time = data['coords']['time'+tg] - ds[key] = xr.DataArray(data['data_vars'][key], - coords={'earth': earth, - 'inst': inst, 'time'+tg: time}, - dims=['earth', 'inst', 'time'+tg], - attrs={'units': data['units']['orientmat'], - 'long_name': data['long_name']['orientmat']}) + tg = "" + + ds_dict["earth"] = {"dims": ("earth"), "data": ["E", "N", "U"]} + ds_dict["inst"] = {"dims": ("inst"), "data": ["X", "Y", "Z"]} + ds_dict[key] = { + "dims": ("earth", "inst", "time" + tg), + "data": data["data_vars"][key], + } + data["units"].update( + {"earth": "1", "inst": "1", key: data["units"]["orientmat"]} + ) + data["long_name"].update( + { + "earth": "Earth Reference Frame", + "inst": "Instrument Reference Frame", + key: data["long_name"]["orientmat"], + } + ) # quaternion units never change - elif 'quaternions' in key: + elif "quaternions" in key: if any(val in key for val in tag): - tg = '_' + key.rsplit('_')[-1] + tg = "_" + key.rsplit("_")[-1] else: - tg = '' - q = xr.DataArray(['w', 'x', 'y', 'z'], dims=['q'], name='q', attrs={ - 'units': '1', 'long_name': 'Quaternion Vector Components'}) - time = data['coords']['time'+tg] - ds[key] = xr.DataArray(data['data_vars'][key], - coords={'q': q, - 'time'+tg: time}, - dims=['q', 'time'+tg], - attrs={'units': data['units']['quaternions'], - 'long_name': data['long_name']['quaternions']}) + tg = "" + + if "q" not in ds_dict: + ds_dict["q"] = {"dims": ("q"), "data": ["w", "x", "y", "z"]} + data["units"].update({"q": "1"}) + 
data["long_name"].update({"q": "Quaternion Vector Components"}) + + ds_dict[key] = {"dims": ("q", "time" + tg), "data": data["data_vars"][key]} + data["units"].update({key: data["units"]["quaternions"]}) + data["long_name"].update({key: data["long_name"]["quaternions"]}) + else: - # Assign each variable to a dataArray - ds[key] = xr.DataArray(data['data_vars'][key]) - # Assign metadata to each dataArray - for md in ['units', 'long_name', 'standard_name']: - if key in data[md]: - ds[key].attrs[md] = data[md][key] - try: # make sure ones with tags get units - tg = '_' + key.rsplit('_')[-1] - if any(val in key for val in tag): - ds[key].attrs[md] = data[md][key[:-len(tg)]] - except: - pass - - # Fill in dimensions and coordinates for each dataArray - shp = data['data_vars'][key].shape - l = len(shp) - if l == 1: # 1D variables - if any(val in key for val in tag): - tg = '_' + key.rsplit('_')[-1] + shp = data["data_vars"][key].shape + if len(shp) == 1: # 1D variables + if "_altraw_avg" in key: + tg = "_altraw_avg" + elif any(val in key for val in tag): + tg = "_" + key.rsplit("_")[-1] else: - tg = '' - ds[key] = ds[key].rename({'dim_0': 'time'+tg}) - ds[key] = ds[key].assign_coords( - {'time'+tg: data['coords']['time'+tg]}) - - elif l == 2: # 2D variables - if key == 'echo': - ds[key] = ds[key].rename({'dim_0': 'range_echo', - 'dim_1': 'time_echo'}) - ds[key] = ds[key].assign_coords({'range_echo': data['coords']['range_echo'], - 'time_echo': data['coords']['time_echo']}) + tg = "" + ds_dict[key] = {"dims": ("time" + tg), "data": data["data_vars"][key]} + + elif len(shp) == 2: # 2D variables + if key == "echo": + ds_dict[key] = { + "dims": ("range_echo", "time_echo"), + "data": data["data_vars"][key], + } + elif key == "samp_altraw": + ds_dict[key] = { + "dims": ("n_altraw", "time_altraw"), + "data": data["data_vars"][key], + } + elif key == "samp_altraw_avg": + ds_dict[key] = { + "dims": ("n_altraw_avg", "time_altraw_avg"), + "data": data["data_vars"][key], + } + # 
ADV/ADCP instrument vector data, bottom tracking elif shp[0] == n_beams and not any(val in key for val in tag[:3]): - if 'bt' in key and 'time_bt' in data['coords']: - tg = '_bt' + if "bt" in key and "time_bt" in data["coords"]: + tg = "_bt" else: - tg = '' - if any(key.rsplit('_')[0] in s for s in ['amp', 'corr', 'dist', 'prcnt_gd']): - dim0 = 'beam' + tg = "" + if any( + key.rsplit("_")[0] in s + for s in ["amp", "corr", "dist", "prcnt_gd"] + ): + dim0 = "beam" else: - dim0 = 'dir' - ds[key] = ds[key].rename({'dim_0': dim0, - 'dim_1': 'time'+tg}) - ds[key] = ds[key].assign_coords({dim0: FoR[dim0], - 'time'+tg: data['coords']['time'+tg]}) + dim0 = "dir" + ds_dict[key] = { + "dims": (dim0, "time" + tg), + "data": data["data_vars"][key], + } + # ADCP IMU data elif shp[0] == 3: if not any(val in key for val in tag): - tg = '' + tg = "" else: tg = [val for val in tag if val in key] tg = tg[0] - dirIMU = xr.DataArray([1, 2, 3], dims=['dirIMU'], name='dirIMU', attrs={ - 'units': '1', 'long_name': 'Reference Frame'}) - ds[key] = ds[key].rename({'dim_0': 'dirIMU', - 'dim_1': 'time'+tg}) - ds[key] = ds[key].assign_coords({'dirIMU': dirIMU, - 'time'+tg: data['coords']['time'+tg]}) - - ds[key].attrs['coverage_content_type'] = 'physicalMeasurement' - - elif l == 3: # 3D variables - if 'vel' in key: - dim0 = 'dir' + + if "dirIMU" not in ds_dict: + ds_dict["dirIMU"] = {"dims": ("dirIMU"), "data": [1, 2, 3]} + data["units"].update({"dirIMU": "1"}) + data["long_name"].update({"dirIMU": "Reference Frame"}) + + ds_dict[key] = { + "dims": ("dirIMU", "time" + tg), + "data": data["data_vars"][key], + } + + elif "b5" in tg: + ds_dict[key] = { + "dims": ("range_b5", "time_b5"), + "data": data["data_vars"][key], + } + + elif len(shp) == 3: # 3D variables + if "vel" in key: + dim0 = "dir" else: # amp, corr, prcnt_gd, status - dim0 = 'beam' + dim0 = "beam" - if not any(val in key for val in tag) or ('_avg' in key): - if '_avg' in key: - tg = '_avg' + if not any(val in key for val in tag) 
or ("_avg" in key): + if "_avg" in key: + tg = "_avg" else: - tg = '' - ds[key] = ds[key].rename({'dim_0': dim0, - 'dim_1': 'range'+tg, - 'dim_2': 'time'+tg}) - ds[key] = ds[key].assign_coords({dim0: FoR[dim0], - 'range'+tg: data['coords']['range'+tg], - 'time'+tg: data['coords']['time'+tg]}) - elif 'b5' in key: - # xarray can't handle coords of length 1 - ds[key] = ds[key][0] - ds[key] = ds[key].rename({'dim_1': 'range_b5', - 'dim_2': 'time_b5'}) - ds[key] = ds[key].assign_coords({'range_b5': data['coords']['range_b5'], - 'time_b5': data['coords']['time_b5']}) - elif 'sl' in key: - ds[key] = ds[key].rename({'dim_0': dim0, - 'dim_1': 'range_sl', - 'dim_2': 'time'}) - ds[key] = ds[key].assign_coords({'range_sl': data['coords']['range_sl'], - 'time': data['coords']['time']}) + tg = "" + ds_dict[key] = { + "dims": (dim0, "range" + tg, "time" + tg), + "data": data["data_vars"][key], + } + + elif "b5" in key: + # "vel_b5" sometimes stored as (1, range_b5, time_b5) + ds_dict[key] = { + "dims": ("range_b5", "time_b5"), + "data": data["data_vars"][key][0], + } + elif "sl" in key: + ds_dict[key] = { + "dims": (dim0, "range_sl", "time"), + "data": data["data_vars"][key], + } else: - ds = ds.drop_vars(key) - warnings.warn(f'Variable not included in dataset: {key}') - - ds[key].attrs['coverage_content_type'] = 'physicalMeasurement' + warnings.warn(f"Variable not included in dataset: {key}") + + # Create dataset + ds = xr.Dataset.from_dict(ds_dict) + + # Assign data array attributes + for key in ds.variables: + for md in ["units", "long_name", "standard_name"]: + if key in data[md]: + ds[key].attrs[md] = data[md][key] + if len(ds[key].shape) > 1: + ds[key].attrs["coverage_content_type"] = "physicalMeasurement" + try: # make sure ones with tags get units + tg = "_" + key.rsplit("_")[-1] + if any(val in key for val in tag): + ds[key].attrs[md] = data[md][key[: -len(tg)]] + except: + pass - # coordinate attributes + # Assign coordinate attributes for ky in ds.dims: - 
ds[ky].attrs['coverage_content_type'] = 'coordinate' - r_list = [r for r in ds.coords if 'range' in r] + ds[ky].attrs["coverage_content_type"] = "coordinate" + r_list = [r for r in ds.coords if "range" in r] for ky in r_list: - ds[ky].attrs['units'] = 'm' - ds[ky].attrs['long_name'] = 'Profile Range' - ds[ky].attrs['description'] = 'Distance to the center of each depth bin' - time_list = [t for t in ds.coords if 'time' in t] + ds[ky].attrs["units"] = "m" + ds[ky].attrs["long_name"] = "Profile Range" + ds[ky].attrs["description"] = "Distance to the center of each depth bin" + time_list = [t for t in ds.coords if "time" in t] for ky in time_list: - ds[ky].attrs['units'] = 'seconds since 1970-01-01 00:00:00' - ds[ky].attrs['long_name'] = 'Time' - ds[ky].attrs['standard_name'] = 'time' + ds[ky].attrs["units"] = "seconds since 1970-01-01 00:00:00" + ds[ky].attrs["long_name"] = "Time" + ds[ky].attrs["standard_name"] = "time" - # dataset metadata - ds.attrs = data['attrs'] + # Set dataset metadata + ds.attrs = data["attrs"] return ds diff --git a/mhkit/dolfyn/io/nortek.py b/mhkit/dolfyn/io/nortek.py index 4709df7aa..3cfc71e00 100644 --- a/mhkit/dolfyn/io/nortek.py +++ b/mhkit/dolfyn/io/nortek.py @@ -14,8 +14,9 @@ from ..rotate import api as rot -def read_nortek(filename, userdata=True, debug=False, do_checksum=False, - nens=None, **kwargs): +def read_nortek( + filename, userdata=True, debug=False, do_checksum=False, nens=None, **kwargs +): """ Read a classic Nortek (AWAC and Vector) datafile @@ -31,7 +32,7 @@ def read_nortek(filename, userdata=True, debug=False, do_checksum=False, do_checksum : bool Whether to perform the checksum of each data block. Default = False nens : None, int or 2-element tuple (start, stop) - Number of pings or ensembles to read from the file. + Number of pings or ensembles to read from the file. 
Default is None, read entire file Returns @@ -45,17 +46,18 @@ def read_nortek(filename, userdata=True, debug=False, do_checksum=False, for handler in logging.root.handlers[:]: logging.root.removeHandler(handler) filepath = Path(filename) - logfile = filepath.with_suffix('.dolfyn.log') - logging.basicConfig(filename=str(logfile), - filemode='w', - level=logging.NOTSET, - format='%(name)s - %(levelname)s - %(message)s') + logfile = filepath.with_suffix(".dolfyn.log") + logging.basicConfig( + filename=str(logfile), + filemode="w", + level=logging.NOTSET, + format="%(name)s - %(levelname)s - %(message)s", + ) userdata = _find_userdata(filename, userdata) - with _NortekReader(filename, debug=debug, do_checksum=do_checksum, - nens=nens) as rdr: - rdr.readfile() + rdr = _NortekReader(filename, debug=debug, do_checksum=do_checksum, nens=nens) + rdr.readfile() rdr.dat2sci() dat = rdr.data @@ -63,41 +65,44 @@ def read_nortek(filename, userdata=True, debug=False, do_checksum=False, dat = _handle_nan(dat) # Search for missing timestamps and interpolate them - coords = dat['coords'] - t_list = [t for t in coords if 'time' in t] + coords = dat["coords"] + t_list = [t for t in coords if "time" in t] for ky in t_list: tdat = coords[ky] tdat[tdat == 0] = np.NaN if np.isnan(tdat).any(): - tag = ky.lstrip('time') - warnings.warn("Zero/NaN values found in '{}'. Interpolating and " - "extrapolating them. To identify which values were filled later, " - "look for 0 values in 'status{}'".format(ky, tag)) - tdat = time._fill_time_gaps( - tdat, sample_rate_hz=dat['attrs']['fs']) - coords[ky] = time.epoch2dt64(tdat).astype('datetime64[ns]') + tag = ky.lstrip("time") + warnings.warn( + "Zero/NaN values found in '{}'. Interpolating and " + "extrapolating them. 
To identify which values were filled later, " + "look for 0 values in 'status{}'".format(ky, tag) + ) + tdat = time._fill_time_gaps(tdat, sample_rate_hz=dat["attrs"]["fs"]) + coords[ky] = time.epoch2dt64(tdat).astype("datetime64[ns]") # Apply rotation matrix and declination rotmat = None declin = None for nm in userdata: - if 'rotmat' in nm: + if "rotmat" in nm: rotmat = userdata[nm] - elif 'dec' in nm: + elif "dec" in nm: declin = userdata[nm] else: - dat['attrs'][nm] = userdata[nm] + dat["attrs"][nm] = userdata[nm] # Create xarray dataset from upper level dictionary ds = _create_dataset(dat) ds = _set_coords(ds, ref_frame=ds.coord_sys) - if 'orientmat' not in ds: - ds['orientmat'] = _calc_omat(ds['time'], - ds['heading'], - ds['pitch'], - ds['roll'], - ds.get('orientation_down', None)) + if "orientmat" not in ds: + ds["orientmat"] = _calc_omat( + ds["time"], + ds["heading"], + ds["pitch"], + ds["roll"], + ds.get("orientation_down", None), + ) if rotmat is not None: rot.set_inst2head_rotmat(ds, rotmat, inplace=True) @@ -114,11 +119,11 @@ def read_nortek(filename, userdata=True, debug=False, do_checksum=False, def _bcd2char(cBCD): - """Taken from the Nortek System Integrator Manual + """Taken from the Nortek System Integrator Manual "Example Program" Chapter. """ cBCD = min(cBCD, 153) - c = (cBCD & 15) + c = cBCD & 15 c += 10 * (cBCD >> 4) return c @@ -128,13 +133,13 @@ def _bitshift8(val): def _int2binarray(val, n): - out = np.zeros(n, dtype='bool') + out = np.zeros(n, dtype="bool") for idx, n in enumerate(range(n)): - out[idx] = val & (2 ** n) + out[idx] = val & (2**n) return out -class _NortekReader(): +class _NortekReader: """ A class for reading reading nortek binary files. This reader currently only supports AWAC and Vector data formats. @@ -153,27 +158,38 @@ class _NortekReader(): bufsize : int The size of the read buffer to use. Default = 100000 nens : None, int or 2-element tuple (start, stop) - Number of pings or ensembles to read from the file. 
+ Number of pings or ensembles to read from the file. Default is None, read entire file """ _lastread = [None, None, None, None, None] - fun_map = {'0x00': 'read_user_cfg', - '0x04': 'read_head_cfg', - '0x05': 'read_hw_cfg', - '0x07': 'read_vec_checkdata', - '0x10': 'read_vec_data', - '0x11': 'read_vec_sysdata', - '0x12': 'read_vec_hdr', - '0x71': 'read_microstrain', - '0x20': 'read_awac_profile', - } - - def __init__(self, fname, endian=None, debug=False, - do_checksum=True, bufsize=100000, nens=None): + fun_map = { + "0x00": "read_user_cfg", + "0x04": "read_head_cfg", + "0x05": "read_hw_cfg", + "0x07": "read_vec_checkdata", + "0x10": "read_vec_data", + "0x11": "read_vec_sysdata", + "0x12": "read_vec_hdr", + "0x20": "read_awac_profile", + "0x30": "read_awac_waves", + "0x31": "read_awac_waves_hdr", + "0x36": "read_awac_waves", # "SUV" + "0x71": "read_microstrain", + } + + def __init__( + self, + fname, + endian=None, + debug=False, + do_checksum=True, + bufsize=100000, + nens=None, + ): self.fname = fname self._bufsize = bufsize - self.f = open(_abspath(fname), 'rb', 1000) + self.f = open(_abspath(fname), "rb", 1000) self.do_checksum = do_checksum self.filesize # initialize the filesize. self.debug = debug @@ -187,29 +203,32 @@ def __init__(self, fname, endian=None, debug=False, self._npings = nens else: if len(nens) != 2: - raise TypeError('nens must be: None (), int, or len 2') - warnings.warn("A 'start ensemble' is not yet supported " - "for the Nortek reader. This function will read " - "the entire file, then crop the beginning at " - "nens[0].") + raise TypeError("nens must be: None (), int, or len 2") + warnings.warn( + "A 'start ensemble' is not yet supported " + "for the Nortek reader. This function will read " + "the entire file, then crop the beginning at " + "nens[0]." 
+ ) self._npings = nens[1] self._n_start = nens[0] if endian is None: - if unpack('HH', self.read(4)) == (1445, 24): - endian = '>' + if unpack("HH", self.read(4)) == (1445, 24): + endian = ">" else: - raise Exception("I/O error: could not determine the " - "'endianness' of the file. Are you sure this is a Nortek " - "file?") + raise Exception( + "I/O error: could not determine the " + "'endianness' of the file. Are you sure this is a Nortek " + "file?" + ) self.endian = endian self.f.seek(0, 0) # This is the configuration data: self.config = {} - err_msg = ("I/O error: The file does not " - "appear to be a Nortek data file.") + err_msg = "I/O error: The file does not " "appear to be a Nortek data file." # Read the header: if self.read_id() == 5: self.read_hw_cfg() @@ -223,49 +242,54 @@ def __init__(self, fname, endian=None, debug=False, self.read_user_cfg() else: raise Exception(err_msg) - if self.config['hdw']['serial_number'][0:3].upper() == 'WPR': - self.config['config_type'] = 'AWAC' - elif self.config['hdw']['serial_number'][0:3].upper() == 'VEC': - self.config['config_type'] = 'ADV' + if self.config["hdw"]["serial_number"][0:3].upper() == "WPR": + self.config["config_type"] = "AWAC" + elif self.config["hdw"]["serial_number"][0:3].upper() == "VEC": + self.config["config_type"] = "ADV" # Initialize the instrument type: - self._inst = self.config.pop('config_type') + self._inst = self.config.pop("config_type") # This is the position after reading the 'hardware', # 'head', and 'user' configuration. pnow = self.pos # Run the appropriate initialization routine (e.g. init_ADV). - getattr(self, 'init_' + self._inst)() + getattr(self, "init_" + self._inst)() self.f.close() # This has a small buffer, so close it. # This has a large buffer... 
- self.f = open(_abspath(fname), 'rb', bufsize) + self.f = open(_abspath(fname), "rb", bufsize) self.close = self.f.close if self._npings is not None: self.n_samp_guess = self._npings self.f.seek(pnow, 0) # Seek to the previous position. - da = self.data['attrs'] - if self.config['n_burst'] > 0: - fs = round(self.config['fs'], 7) - da['duty_cycle_n_burst'] = self.config['n_burst'] - da['duty_cycle_interval'] = self.config['burst_interval'] + da = self.data["attrs"] + if self.config["n_burst"] > 0: + fs = round(self.config["fs"], 7) + da["duty_cycle_n_burst"] = self.config["n_burst"] + da["duty_cycle_interval"] = self.config["burst_interval"] if fs > 1: - burst_seconds = self.config['n_burst']/fs + burst_seconds = self.config["n_burst"] / fs else: - burst_seconds = round(1/fs, 3) - da['duty_cycle_description'] = "{} second bursts collected at {} Hz, with bursts taken every {} minutes".format( - burst_seconds, fs, self.config['burst_interval']/60) - self.burst_start = np.zeros(self.n_samp_guess, dtype='bool') - da['fs'] = self.config['fs'] - da['coord_sys'] = {'XYZ': 'inst', - 'ENU': 'earth', - 'beam': 'beam'}[self.config['coord_sys_axes']] - da['has_imu'] = 0 # Initiate attribute + burst_seconds = round(1 / fs, 3) + da["duty_cycle_description"] = ( + "{} second bursts collected at {} Hz, with bursts taken every {} minutes".format( + burst_seconds, fs, self.config["burst_interval"] / 60 + ) + ) + self.burst_start = np.zeros(self.n_samp_guess, dtype="bool") + da["fs"] = self.config["fs"] + da["coord_sys"] = {"XYZ": "inst", "ENU": "earth", "beam": "beam"}[ + self.config["coord_sys_axes"] + ] + da["has_imu"] = 0 # Initiate attribute if self.debug: - logging.info('Init completed') + logging.info("Init completed") @property - def filesize(self,): - if not hasattr(self, '_filesz'): + def filesize( + self, + ): + if not hasattr(self, "_filesz"): pos = self.pos self.f.seek(0, 2) # Seek to the end of the file to determine the filesize. 
@@ -274,49 +298,61 @@ def filesize(self,): return self._filesz @property - def pos(self,): + def pos(self): return self.f.tell() - def init_ADV(self,): - dat = self.data = {'data_vars': {}, 'coords': {}, 'attrs': {}, - 'units': {}, 'long_name': {}, 'standard_name': {}, - 'sys': {}} - da = dat['attrs'] - dv = dat['data_vars'] - da['inst_make'] = 'Nortek' - da['inst_model'] = 'Vector' - da['inst_type'] = 'ADV' - da['rotate_vars'] = ['vel'] - dv['beam2inst_orientmat'] = self.config.pop('beam2inst_orientmat') - self.config['fs'] = 512 / self.config['awac']['avg_interval'] - da.update(self.config['usr']) - da.update(self.config['adv']) - da.update(self.config['head']) - da.update(self.config['hdw']) + def init_ADV(self): + dat = self.data = { + "data_vars": {}, + "coords": {}, + "attrs": {}, + "units": {}, + "long_name": {}, + "standard_name": {}, + "sys": {}, + } + da = dat["attrs"] + dv = dat["data_vars"] + da["inst_make"] = "Nortek" + da["inst_model"] = "Vector" + da["inst_type"] = "ADV" + da["rotate_vars"] = ["vel"] + dv["beam2inst_orientmat"] = self.config.pop("beam2inst_orientmat") + self.config["fs"] = 512 / self.config["awac"]["avg_interval"] + da.update(self.config["usr"]) + da.update(self.config["adv"]) + da.update(self.config["head"]) + da.update(self.config["hdw"]) # No apparent way to determine how many samples are in a file - dlta = self.code_spacing('0x11') + dlta = self.code_spacing("0x11") self.n_samp_guess = int(self.filesize / dlta + 1) - self.n_samp_guess *= int(self.config['fs']) - - def init_AWAC(self,): - dat = self.data = {'data_vars': {}, 'coords': {}, 'attrs': {}, - 'units': {}, 'long_name': {}, 'standard_name': {}, - 'sys': {}} - da = dat['attrs'] - dv = dat['data_vars'] - da['inst_make'] = 'Nortek' - da['inst_model'] = 'AWAC' - da['inst_type'] = 'ADCP' - dv['beam2inst_orientmat'] = self.config.pop('beam2inst_orientmat') - da['rotate_vars'] = ['vel'] - self.config['fs'] = 1. 
/ self.config['awac']['avg_interval'] - da.update(self.config['usr']) - da.update(self.config['awac']) - da.update(self.config['head']) - da.update(self.config['hdw']) - - space = self.code_spacing('0x20') + self.n_samp_guess *= int(self.config["fs"]) + + def init_AWAC(self): + dat = self.data = { + "data_vars": {}, + "coords": {}, + "attrs": {}, + "units": {}, + "long_name": {}, + "standard_name": {}, + "sys": {}, + } + da = dat["attrs"] + dv = dat["data_vars"] + da["inst_make"] = "Nortek" + da["inst_model"] = "AWAC" + da["inst_type"] = "ADCP" + dv["beam2inst_orientmat"] = self.config.pop("beam2inst_orientmat") + da["rotate_vars"] = ["vel"] + self.config["fs"] = 1.0 / self.config["awac"]["avg_interval"] + da.update(self.config["usr"]) + da.update(self.config["awac"]) + da.update(self.config["head"]) + da.update(self.config["hdw"]) + + space = self.code_spacing("0x20") if space == 0: # code spacing is zero if there's only 1 profile self.n_samp_guess = 1 @@ -326,62 +362,62 @@ def init_AWAC(self,): def read(self, nbyte): byts = self.f.read(nbyte) if not (len(byts) == nbyte): - raise EOFError('Reached the end of the file') + raise EOFError("Reached the end of the file") return byts def findnext(self, do_cs=True): """Find the next data block by checking the checksum and the sync byte(0xa5) """ - sum = np.uint16(int('0xb58c', 0)) # Initialize the sum + sum = np.uint16(int("0xb58c", 0)) # Initialize the sum cs = 0 func = _bitshift8 func2 = np.uint8 - if self.endian == '<': + if self.endian == "<": func = np.uint8 func2 = _bitshift8 while True: - val = unpack(self.endian + 'H', self.read(2))[0] + val = unpack(self.endian + "H", self.read(2))[0] if func(val) == 165 and (not do_cs or cs == np.uint16(sum)): self.f.seek(-2, 1) return hex(func2(val)) sum += cs cs = val - def read_id(self,): - """Read the next 'ID' from the file. 
- """ + def read_id(self): + """Read the next 'ID' from the file.""" self._thisid_bytes = bts = self.read(2) - tmp = unpack(self.endian + 'BB', bts) + tmp = unpack(self.endian + "BB", bts) if self.debug: - logging.info('Position: {}, codes: {}'.format(self.f.tell(), tmp)) + logging.info("Position: {}, codes: {}".format(self.f.tell(), tmp)) if tmp[0] != 165: # This catches a corrupted data block. if self.debug: - logging.warning("Corrupted data block sync code (%d, %d) found " - "in ping %d. Searching for next valid code..." % - (tmp[0], tmp[1], self.c)) + logging.warning( + "Corrupted data block sync code (%d, %d) found " + "in ping %d. Searching for next valid code..." + % (tmp[0], tmp[1], self.c) + ) val = int(self.findnext(do_cs=False), 0) self.f.seek(2, 1) if self.debug: - logging.debug( - ' ...FOUND {} at position: {}.'.format(val, self.pos)) + logging.debug(" ...FOUND {} at position: {}.".format(val, self.pos)) return val return tmp[1] - def readnext(self,): - id = '0x%02x' % self.read_id() + def readnext(self): + id = "0x%02x" % self.read_id() if id in self.fun_map: func_name = self.fun_map[id] out = getattr(self, func_name)() # Should return None self._lastread = [func_name[5:]] + self._lastread[:-1] return out else: - logging.warning('Unrecognized identifier: ' + id) + logging.warning("Unrecognized identifier: " + id) self.f.seek(-2, 1) return 10 def readfile(self, nlines=None): - print('Reading file %s ...' % self.fname) + print("Reading file %s ..." 
% self.fname) retval = None try: while not retval: @@ -392,7 +428,7 @@ def readfile(self, nlines=None): self.findnext() retval = None if self._npings is not None and self.c >= self._npings: - if 'microstrain' in self._dtypes: + if "microstrain" in self._dtypes: try: self.readnext() except: @@ -400,10 +436,10 @@ def readfile(self, nlines=None): break except EOFError: if self.debug: - logging.info(' end of file at {} bytes.'.format(self.pos)) + logging.info(" end of file at {} bytes.".format(self.pos)) else: if self.debug: - logging.info(' stopped at {} bytes.'.format(self.pos)) + logging.info(" stopped at {} bytes.".format(self.pos)) self.c -= 1 _crop_data(self.data, slice(0, self.c), self.n_samp_guess) @@ -416,7 +452,7 @@ def findnextid(self, id): if nowid == 16: shift = 22 else: - sz = 2 * unpack(self.endian + 'H', self.read(2))[0] + sz = 2 * unpack(self.endian + "H", self.read(2))[0] shift = sz - 4 self.f.seek(shift, 1) return self.pos @@ -434,161 +470,189 @@ def code_spacing(self, searchcode, iternum=50): except EOFError: break if self.debug: - logging.info('p0={}, pos={}, i={}'.format(p0, self.pos, i)) + logging.info("p0={}, pos={}, i={}".format(p0, self.pos, i)) # Compute the average of the data size: return (self.pos - p0) / (i + 1) def checksum(self, byts): - """Perform a checksum on `byts` and read the checksum value. 
- """ + """Perform a checksum on `byts` and read the checksum value.""" if self.do_checksum: - if not np.sum(unpack(self.endian + str(int(1 + len(byts) / 2)) + 'H', - self._thisid_bytes + byts)) + \ - 46476 - unpack(self.endian + 'H', self.read(2)): - + if ( + not np.sum( + unpack( + self.endian + str(int(1 + len(byts) / 2)) + "H", + self._thisid_bytes + byts, + ) + ) + + 46476 + - unpack(self.endian + "H", self.read(2)) + ): raise Exception("CheckSum Failed at {}".format(self.pos)) else: self.f.seek(2, 1) - def read_user_cfg(self,): + def read_user_cfg(self): # ID: '0x00 = 00 if self.debug: - logging.info('Reading user configuration (0x00) ping #{} @ {}...' - .format(self.c, self.pos)) + logging.info( + "Reading user configuration (0x00) ping #{} @ {}...".format( + self.c, self.pos + ) + ) cfg_u = self.config byts = self.read(508) # the first two bytes are the size. - tmp = unpack(self.endian + - '2x18H6s4HI9H90H80s48xH50x6H4xH2x2H2xH30x8H', - byts) - cfg_u['usr'] = {} - cfg_u['adv'] = {} - cfg_u['awac'] = {} - - cfg_u['transmit_pulse_length_m'] = tmp[0] # counts - cfg_u['blank_dist'] = tmp[1] # overridden below - cfg_u['receive_length_m'] = tmp[2] # counts - cfg_u['time_between_pings'] = tmp[3] # counts - cfg_u['time_between_bursts'] = tmp[4] # counts - cfg_u['adv']['n_pings_per_burst'] = tmp[5] - cfg_u['awac']['avg_interval'] = tmp[6] - cfg_u['usr']['n_beams'] = tmp[7] + tmp = unpack(self.endian + "2x18H6s4HI9H90H80s48xH50x6H4xH2x2H2xH30x8H", byts) + cfg_u["usr"] = {} + cfg_u["adv"] = {} + cfg_u["awac"] = {} + + cfg_u["transmit_pulse_length_m"] = tmp[0] # counts + cfg_u["blank_dist"] = tmp[1] # overridden below + cfg_u["receive_length_m"] = tmp[2] # counts + cfg_u["time_between_pings"] = tmp[3] # counts + cfg_u["time_between_bursts"] = tmp[4] # counts + cfg_u["adv"]["n_pings_per_burst"] = tmp[5] + cfg_u["awac"]["avg_interval"] = tmp[6] + cfg_u["usr"]["n_beams"] = tmp[7] TimCtrlReg = _int2binarray(tmp[8], 16).astype(int) # From the nortek system integrator manual 
# (note: bit numbering is zero-based) - cfg_u['usr']['profile_mode'] = [ - 'single', 'continuous'][TimCtrlReg[1]] - cfg_u['usr']['burst_mode'] = str(bool(~TimCtrlReg[2])) - cfg_u['usr']['power_level'] = TimCtrlReg[5] + 2 * TimCtrlReg[6] + 1 - cfg_u['usr']['sync_out_pos'] = ['middle', 'end', ][TimCtrlReg[7]] - cfg_u['usr']['sample_on_sync'] = str(bool(TimCtrlReg[8])) - cfg_u['usr']['start_on_sync'] = str(bool(TimCtrlReg[9])) - cfg_u['PwrCtrlReg'] = _int2binarray(tmp[9], 16) - cfg_u['A1'] = tmp[10] - cfg_u['B0'] = tmp[11] - cfg_u['B1'] = tmp[12] - cfg_u['usr']['compass_update_rate'] = tmp[13] - cfg_u['coord_sys_axes'] = ['ENU', 'XYZ', 'beam'][tmp[14]] - cfg_u['usr']['n_bins'] = tmp[15] - cfg_u['bin_length'] = tmp[16] - cfg_u['burst_interval'] = tmp[17] - cfg_u['usr']['deployment_name'] = tmp[18].partition(b'\x00')[ - 0].decode('utf-8') - cfg_u['usr']['wrap_mode'] = str(bool(tmp[19])) - cfg_u['deployment_time'] = np.array(tmp[20:23]) - cfg_u['diagnotics_interval'] = tmp[23] + cfg_u["usr"]["profile_mode"] = ["single", "continuous"][TimCtrlReg[1]] + cfg_u["usr"]["burst_mode"] = str(bool(~TimCtrlReg[2])) + cfg_u["usr"]["power_level"] = TimCtrlReg[5] + 2 * TimCtrlReg[6] + 1 + cfg_u["usr"]["sync_out_pos"] = [ + "middle", + "end", + ][TimCtrlReg[7]] + cfg_u["usr"]["sample_on_sync"] = str(bool(TimCtrlReg[8])) + cfg_u["usr"]["start_on_sync"] = str(bool(TimCtrlReg[9])) + cfg_u["PwrCtrlReg"] = _int2binarray(tmp[9], 16) + cfg_u["A1"] = tmp[10] + cfg_u["B0"] = tmp[11] + cfg_u["B1"] = tmp[12] + cfg_u["usr"]["compass_update_rate"] = tmp[13] + cfg_u["coord_sys_axes"] = ["ENU", "XYZ", "beam"][tmp[14]] + cfg_u["usr"]["n_bins"] = tmp[15] + cfg_u["bin_length"] = tmp[16] + cfg_u["burst_interval"] = tmp[17] + cfg_u["usr"]["deployment_name"] = tmp[18].partition(b"\x00")[0].decode("utf-8") + cfg_u["usr"]["wrap_mode"] = str(bool(tmp[19])) + cfg_u["deployment_time"] = np.array(tmp[20:23]) + cfg_u["diagnotics_interval"] = tmp[23] Mode0 = _int2binarray(tmp[24], 16) - 
cfg_u['user_soundspeed_adj_factor'] = tmp[25] - cfg_u['n_samples_diag'] = tmp[26] - cfg_u['n_beams_cells_diag'] = tmp[27] - cfg_u['n_pings_diag_wave'] = tmp[28] + cfg_u["user_soundspeed_adj_factor"] = tmp[25] + cfg_u["n_samples_diag"] = tmp[26] + cfg_u["n_beams_cells_diag"] = tmp[27] + cfg_u["n_pings_diag_wave"] = tmp[28] ModeTest = _int2binarray(tmp[29], 16) - cfg_u['usr']['analog_in'] = tmp[30] + cfg_u["usr"]["analog_in"] = tmp[30] sfw_ver = str(tmp[31]) - cfg_u['usr']['software_version'] = sfw_ver[0] + \ - '.'+sfw_ver[1:3]+'.'+sfw_ver[3:] - cfg_u['usr']['salinity'] = tmp[32]/10 - cfg_u['VelAdjTable'] = np.array(tmp[33:123]) - cfg_u['usr']['comments'] = tmp[123].partition(b'\x00')[ - 0].decode('utf-8') - cfg_u['awac']['wave_processing_method'] = [ - 'PUV', 'SUV', 'MLM', 'MLMST', 'None'][tmp[124]] + cfg_u["usr"]["software_version"] = ( + sfw_ver[0] + "." + sfw_ver[1:3] + "." + sfw_ver[3:] + ) + cfg_u["usr"]["salinity"] = tmp[32] / 10 + cfg_u["VelAdjTable"] = np.array(tmp[33:123]) + cfg_u["usr"]["comments"] = tmp[123].partition(b"\x00")[0].decode("utf-8") + cfg_u["awac"]["wave_processing_method"] = [ + "PUV", + "SUV", + "MLM", + "MLMST", + "None", + ][tmp[124]] Mode1 = _int2binarray(tmp[125], 16) - cfg_u['awac']['prc_dyn_wave_cell_pos'] = int(tmp[126]/32767 * 100) - cfg_u['wave_transmit_pulse'] = tmp[127] - cfg_u['wave_blank_dist'] = tmp[128] - cfg_u['awac']['wave_cell_size'] = tmp[129] - cfg_u['awac']['n_samples_wave'] = tmp[130] - cfg_u['n_burst'] = tmp[131] - cfg_u['analog_out_scale'] = tmp[132] - cfg_u['corr_thresh'] = tmp[133] - cfg_u['transmit_pulse_lag2'] = tmp[134] # counts - cfg_u['QualConst'] = np.array(tmp[135:143]) + cfg_u["awac"]["prc_dyn_wave_cell_pos"] = int(tmp[126] / 32767 * 100) + cfg_u["wave_transmit_pulse"] = tmp[127] + cfg_u["wave_blank_dist"] = tmp[128] + cfg_u["awac"]["wave_cell_size"] = tmp[129] + cfg_u["awac"]["n_samples_wave"] = tmp[130] + cfg_u["n_burst"] = tmp[131] + cfg_u["analog_out_scale"] = tmp[132] + cfg_u["corr_thresh"] = tmp[133] 
+ cfg_u["transmit_pulse_lag2"] = tmp[134] # counts + cfg_u["QualConst"] = np.array(tmp[135:143]) self.checksum(byts) - cfg_u['usr']['user_specified_sound_speed'] = str(Mode0[0]) - cfg_u['awac']['wave_mode'] = ['Disabled', 'Enabled'][int(Mode0[1])] - cfg_u['usr']['analog_output'] = str(Mode0[2]) - cfg_u['usr']['output_format'] = ['Vector', 'ADV'][int(Mode0[3])] # noqa - cfg_u['vel_scale_mm'] = [1, 0.1][int(Mode0[4])] - cfg_u['usr']['serial_output'] = str(Mode0[5]) - cfg_u['reserved_EasyQ'] = str(Mode0[6]) - cfg_u['usr']['power_output_analog'] = str(Mode0[8]) - cfg_u['mode_test_use_DSP'] = str(ModeTest[0]) - cfg_u['mode_test_filter_output'] = ['total', 'correction_only'][int(ModeTest[1])] # noqa - cfg_u['awac']['wave_fs'] = ['1 Hz', '2 Hz'][int(Mode1[0])] - cfg_u['awac']['wave_cell_position'] = ['fixed', 'dynamic'][int(Mode1[1])] # noqa - cfg_u['awac']['type_wave_cell_pos'] = ['pct_of_mean_pressure', 'pct_of_min_re'][int(Mode1[2])] # noqa - - def read_head_cfg(self,): + cfg_u["usr"]["user_specified_sound_speed"] = str(Mode0[0]) + cfg_u["awac"]["wave_mode"] = ["Disabled", "Enabled"][int(Mode0[1])] + cfg_u["usr"]["analog_output"] = str(Mode0[2]) + cfg_u["usr"]["output_format"] = ["Vector", "ADV"][int(Mode0[3])] # noqa + cfg_u["vel_scale_mm"] = [1, 0.1][int(Mode0[4])] + cfg_u["usr"]["serial_output"] = str(Mode0[5]) + cfg_u["reserved_EasyQ"] = str(Mode0[6]) + cfg_u["usr"]["power_output_analog"] = str(Mode0[8]) + cfg_u["mode_test_use_DSP"] = str(ModeTest[0]) + cfg_u["mode_test_filter_output"] = ["total", "correction_only"][ + int(ModeTest[1]) + ] # noqa + cfg_u["awac"]["wave_fs"] = ["1 Hz", "2 Hz"][int(Mode1[0])] + cfg_u["awac"]["wave_cell_position"] = ["fixed", "dynamic"][ + int(Mode1[1]) + ] # noqa + cfg_u["awac"]["type_wave_cell_pos"] = ["pct_of_mean_pressure", "pct_of_min_re"][ + int(Mode1[2]) + ] # noqa + + def read_head_cfg(self): # ID: '0x04 = 04 if self.debug: - logging.info('Reading head configuration (0x04) ping #{} @ {}...' 
- .format(self.c, self.pos)) + logging.info( + "Reading head configuration (0x04) ping #{} @ {}...".format( + self.c, self.pos + ) + ) cfg = self.config - cfg['head'] = {} + cfg["head"] = {} byts = self.read(220) - tmp = unpack(self.endian + '2x3H12s176s22sH', byts) + tmp = unpack(self.endian + "2x3H12s176s22sH", byts) head_config = _int2binarray(tmp[0], 16).astype(int) - cfg['head']['pressure_sensor'] = ['no', 'yes'][head_config[0]] - cfg['head']['compass'] = ['no', 'yes'][head_config[1]] - cfg['head']['tilt_sensor'] = ['no', 'yes'][head_config[2]] - cfg['head']['carrier_freq_kHz'] = tmp[1] - cfg['beam2inst_orientmat'] = np.array( - unpack(self.endian + '9h', tmp[4][8:26])).reshape(3, 3) / 4096. + cfg["head"]["pressure_sensor"] = ["no", "yes"][head_config[0]] + cfg["head"]["compass"] = ["no", "yes"][head_config[1]] + cfg["head"]["tilt_sensor"] = ["no", "yes"][head_config[2]] + cfg["head"]["carrier_freq_kHz"] = tmp[1] + cfg["beam2inst_orientmat"] = ( + np.array(unpack(self.endian + "9h", tmp[4][8:26])).reshape(3, 3) / 4096.0 + ) self.checksum(byts) - def read_hw_cfg(self,): + def read_hw_cfg(self): # ID 0x05 = 05 if self.debug: - logging.info('Reading hardware configuration (0x05) ping #{} @ {}...' 
- .format(self.c, self.pos)) + logging.info( + "Reading hardware configuration (0x05) ping #{} @ {}...".format( + self.c, self.pos + ) + ) cfg_hw = self.config - cfg_hw['hdw'] = {} + cfg_hw["hdw"] = {} byts = self.read(44) - tmp = unpack(self.endian + '2x14s6H12x4s', byts) - cfg_hw['hdw']['serial_number'] = tmp[0][:8].decode('utf-8') - cfg_hw['ProLogID'] = unpack('B', tmp[0][8:9])[0] - cfg_hw['hdw']['ProLogFWver'] = tmp[0][10:].decode('utf-8') - cfg_hw['board_config'] = tmp[1] - cfg_hw['board_freq'] = tmp[2] - cfg_hw['hdw']['PIC_version'] = tmp[3] - cfg_hw['hdw']['hardware_rev'] = tmp[4] - cfg_hw['hdw']['recorder_size_bytes'] = tmp[5] * 65536 + tmp = unpack(self.endian + "2x14s6H12x4s", byts) + cfg_hw["hdw"]["serial_number"] = tmp[0][:8].decode("utf-8") + cfg_hw["ProLogID"] = unpack("B", tmp[0][8:9])[0] + cfg_hw["hdw"]["ProLogFWver"] = tmp[0][10:].decode("utf-8") + cfg_hw["board_config"] = tmp[1] + cfg_hw["board_freq"] = tmp[2] + cfg_hw["hdw"]["PIC_version"] = tmp[3] + cfg_hw["hdw"]["hardware_rev"] = tmp[4] + cfg_hw["hdw"]["recorder_size_bytes"] = tmp[5] * 65536 status = _int2binarray(tmp[6], 16).astype(int) - cfg_hw['hdw']['vel_range'] = ['normal', 'high'][status[0]] - cfg_hw['hdw']['firmware_version'] = tmp[7].decode('utf-8') + cfg_hw["hdw"]["vel_range"] = ["normal", "high"][status[0]] + cfg_hw["hdw"]["firmware_version"] = tmp[7].decode("utf-8") self.checksum(byts) def rd_time(self, strng): - """Read the time from the first 6bytes of the input string. 
- """ - min, sec, day, hour, year, month = unpack('BBBBBB', strng[:6]) - return time.date2epoch(datetime(time._fullyear(_bcd2char(year)), - _bcd2char(month), - _bcd2char(day), - _bcd2char(hour), - _bcd2char(min), - _bcd2char(sec)))[0] + """Read the time from the first 6bytes of the input string.""" + min, sec, day, hour, year, month = unpack("BBBBBB", strng[:6]) + return time.date2epoch( + datetime( + time._fullyear(_bcd2char(year)), + _bcd2char(month), + _bcd2char(day), + _bcd2char(hour), + _bcd2char(min), + _bcd2char(sec), + ) + )[0] def _init_data(self, vardict): """Initialize the data object according to vardict. @@ -600,9 +664,9 @@ def _init_data(self, vardict): how to initialize each data variable. """ - shape_args = {'n': self.n_samp_guess} + shape_args = {"n": self.n_samp_guess} try: - shape_args['nbins'] = self.config['usr']['n_bins'] + shape_args["nbins"] = self.config["usr"]["n_bins"] except KeyError: pass for nm, va in list(vardict.items()): @@ -613,70 +677,78 @@ def _init_data(self, vardict): else: if nm not in self.data[va.group]: self.data[va.group][nm] = va._empty_array(**shape_args) - self.data['units'][nm] = va.units - self.data['long_name'][nm] = va.long_name + self.data["units"][nm] = va.units + self.data["long_name"][nm] = va.long_name if va.standard_name: - self.data['standard_name'][nm] = va.standard_name + self.data["standard_name"][nm] = va.standard_name - def read_vec_data(self,): + def read_vec_data(self): # ID: 0x10 = 16 c = self.c dat = self.data if self.debug: - logging.info('Reading vector velocity data (0x10) ping #{} @ {}...' 
- .format(self.c, self.pos)) + logging.info( + "Reading vector velocity data (0x10) ping #{} @ {}...".format( + self.c, self.pos + ) + ) - if 'vel' not in dat['data_vars']: + if "vel" not in dat["data_vars"]: self._init_data(nortek_defs.vec_data) - self._dtypes += ['vec_data'] + self._dtypes += ["vec_data"] byts = self.read(20) - ds = dat['sys'] - dv = dat['data_vars'] - (ds['AnaIn2LSB'][c], - ds['Count'][c], - dv['PressureMSB'][c], - ds['AnaIn2MSB'][c], - dv['PressureLSW'][c], - ds['AnaIn1'][c], - dv['vel'][0, c], - dv['vel'][1, c], - dv['vel'][2, c], - dv['amp'][0, c], - dv['amp'][1, c], - dv['amp'][2, c], - dv['corr'][0, c], - dv['corr'][1, c], - dv['corr'][2, c]) = unpack(self.endian + '4B2H3h6B', byts) + ds = dat["sys"] + dv = dat["data_vars"] + ( + ds["AnaIn2LSB"][c], + ds["Count"][c], + dv["PressureMSB"][c], + ds["AnaIn2MSB"][c], + dv["PressureLSW"][c], + ds["AnaIn1"][c], + dv["vel"][0, c], + dv["vel"][1, c], + dv["vel"][2, c], + dv["amp"][0, c], + dv["amp"][1, c], + dv["amp"][2, c], + dv["corr"][0, c], + dv["corr"][1, c], + dv["corr"][2, c], + ) = unpack(self.endian + "4B2H3h6B", byts) self.checksum(byts) self.c += 1 - def read_vec_checkdata(self,): + def read_vec_checkdata(self): # ID: 0x07 = 07 if self.debug: - logging.info('Reading vector check data (0x07) ping #{} @ {}...' - .format(self.c, self.pos)) + logging.info( + "Reading vector check data (0x07) ping #{} @ {}...".format( + self.c, self.pos + ) + ) byts0 = self.read(6) checknow = {} - tmp = unpack(self.endian + '2x2H', byts0) # The first two are size. - checknow['Samples'] = tmp[0] - n = checknow['Samples'] - checknow['First_samp'] = tmp[1] - checknow['Amp1'] = tbx._nans(n, dtype=np.uint8) + 8 - checknow['Amp2'] = tbx._nans(n, dtype=np.uint8) + 8 - checknow['Amp3'] = tbx._nans(n, dtype=np.uint8) + 8 + tmp = unpack(self.endian + "2x2H", byts0) # The first two are size. 
+ checknow["Samples"] = tmp[0] + n = checknow["Samples"] + checknow["First_samp"] = tmp[1] + checknow["Amp1"] = tbx._nans(n, dtype=np.uint8) + 8 + checknow["Amp2"] = tbx._nans(n, dtype=np.uint8) + 8 + checknow["Amp3"] = tbx._nans(n, dtype=np.uint8) + 8 byts1 = self.read(3 * n) - tmp = unpack(self.endian + (3 * n * 'B'), byts1) - for idx, nm in enumerate(['Amp1', 'Amp2', 'Amp3']): - checknow[nm] = np.array(tmp[idx * n:(idx + 1) * n], dtype=np.uint8) + tmp = unpack(self.endian + (3 * n * "B"), byts1) + for idx, nm in enumerate(["Amp1", "Amp2", "Amp3"]): + checknow[nm] = np.array(tmp[idx * n : (idx + 1) * n], dtype=np.uint8) self.checksum(byts0 + byts1) - if 'checkdata' not in self.config: - self.config['checkdata'] = checknow + if "checkdata" not in self.config: + self.config["checkdata"] = checknow else: - if not isinstance(self.config['checkdata'], list): - self.config['checkdata'] = [self.config['checkdata']] - self.config['checkdata'] += [checknow] + if not isinstance(self.config["checkdata"], list): + self.config["checkdata"] = [self.config["checkdata"]] + self.config["checkdata"] += [checknow] def _sci_data(self, vardict): """ @@ -700,92 +772,104 @@ def _sci_data(self, vardict): if retval is not None: dat[nm] = retval - def sci_vec_data(self,): + def sci_vec_data(self): self._sci_data(nortek_defs.vec_data) dat = self.data - dat['data_vars']['pressure'] = ( - dat['data_vars']['PressureMSB'].astype('float32') * 65536 + - dat['data_vars']['PressureLSW'].astype('float32')) / 1000. 
- dat['units']['pressure'] = 'dbar' - dat['long_name']['pressure'] = 'Pressure' - dat['standard_name']['pressure'] = 'sea_water_pressure' + dat["data_vars"]["pressure"] = ( + dat["data_vars"]["PressureMSB"].astype("float32") * 65536 + + dat["data_vars"]["PressureLSW"].astype("float32") + ) / 1000.0 + dat["units"]["pressure"] = "dbar" + dat["long_name"]["pressure"] = "Pressure" + dat["standard_name"]["pressure"] = "sea_water_pressure" - dat['data_vars'].pop('PressureMSB') - dat['data_vars'].pop('PressureLSW') + dat["data_vars"].pop("PressureMSB") + dat["data_vars"].pop("PressureLSW") # Apply velocity scaling (1 or 0.1) - dat['data_vars']['vel'] *= self.config['vel_scale_mm'] + dat["data_vars"]["vel"] *= self.config["vel_scale_mm"] - def read_vec_hdr(self,): + def read_vec_hdr(self): # ID: '0x12 = 18 if self.debug: - logging.info('Reading vector header data (0x12) ping #{} @ {}...' - .format(self.c, self.pos)) + logging.info( + "Reading vector header data (0x12) ping #{} @ {}...".format( + self.c, self.pos + ) + ) byts = self.read(38) # The first two are size, the next 6 are time. 
- tmp = unpack(self.endian + '8xH7B21x', byts) + tmp = unpack(self.endian + "8xH7B21x", byts) hdrnow = {} - hdrnow['time'] = self.rd_time(byts[2:8]) - hdrnow['NRecords'] = tmp[0] - hdrnow['Noise1'] = tmp[1] - hdrnow['Noise2'] = tmp[2] - hdrnow['Noise3'] = tmp[3] - hdrnow['Spare0'] = byts[13:14].decode('utf-8') - hdrnow['Corr1'] = tmp[5] - hdrnow['Corr2'] = tmp[6] - hdrnow['Corr3'] = tmp[7] - hdrnow['Spare1'] = byts[17:].decode('utf-8') + hdrnow["time"] = self.rd_time(byts[2:8]) + hdrnow["NRecords"] = tmp[0] + hdrnow["Noise1"] = tmp[1] + hdrnow["Noise2"] = tmp[2] + hdrnow["Noise3"] = tmp[3] + hdrnow["Spare0"] = byts[13:14].decode("utf-8") + hdrnow["Corr1"] = tmp[5] + hdrnow["Corr2"] = tmp[6] + hdrnow["Corr3"] = tmp[7] + hdrnow["Spare1"] = byts[17:].decode("utf-8") self.checksum(byts) - if 'data_header' not in self.config: - self.config['data_header'] = hdrnow + if "data_header" not in self.config: + self.config["data_header"] = hdrnow else: - if not isinstance(self.config['data_header'], list): - self.config['data_header'] = [self.config['data_header']] - self.config['data_header'] += [hdrnow] + if not isinstance(self.config["data_header"], list): + self.config["data_header"] = [self.config["data_header"]] + self.config["data_header"] += [hdrnow] - def read_vec_sysdata(self,): + def read_vec_sysdata(self): # ID: 0x11 = 17 c = self.c if self.debug: - logging.info('Reading vector system data (0x11) ping #{} @ {}...' - .format(self.c, self.pos)) + logging.info( + "Reading vector system data (0x11) ping #{} @ {}...".format( + self.c, self.pos + ) + ) dat = self.data - if self._lastread[:2] == ['vec_checkdata', 'vec_hdr', ]: + if self._lastread[:2] == [ + "vec_checkdata", + "vec_hdr", + ]: self.burst_start[c] = True - if 'time' not in dat['coords']: + if "time" not in dat["coords"]: self._init_data(nortek_defs.vec_sysdata) - self._dtypes += ['vec_sysdata'] + self._dtypes += ["vec_sysdata"] byts = self.read(24) # The first two are size (skip them). 
- dat['coords']['time'][c] = self.rd_time(byts[2:8]) - ds = dat['sys'] - dv = dat['data_vars'] - (dv['batt'][c], - dv['c_sound'][c], - dv['heading'][c], - dv['pitch'][c], - dv['roll'][c], - dv['temp'][c], - dv['error'][c], - dv['status'][c], - ds['AnaIn'][c]) = unpack(self.endian + '2H3hH2BH', byts[8:]) + dat["coords"]["time"][c] = self.rd_time(byts[2:8]) + ds = dat["sys"] + dv = dat["data_vars"] + ( + dv["batt"][c], + dv["c_sound"][c], + dv["heading"][c], + dv["pitch"][c], + dv["roll"][c], + dv["temp"][c], + dv["error"][c], + dv["status"][c], + ds["AnaIn"][c], + ) = unpack(self.endian + "3H3h2BH", byts[8:]) self.checksum(byts) - def sci_vec_sysdata(self,): + def sci_vec_sysdata(self): """Translate the data in the vec_sysdata structure into scientific units. """ dat = self.data - fs = dat['attrs']['fs'] + fs = dat["attrs"]["fs"] self._sci_data(nortek_defs.vec_sysdata) - t = dat['coords']['time'] - dv = dat['data_vars'] - dat['sys']['_sysi'] = ~np.isnan(t) + t = dat["coords"]["time"] + dv = dat["data_vars"] + dat["sys"]["_sysi"] = ~np.isnan(t) # These are the indices in the sysdata variables # that are not interpolated. 
- nburst = self.config['n_burst'] - dv['orientation_down'] = tbx._nans(len(t), dtype='bool') + nburst = self.config["n_burst"] + dv["orientation_down"] = tbx._nans(len(t), dtype="bool") if nburst == 0: num_bursts = 1 nburst = len(t) @@ -793,7 +877,7 @@ def sci_vec_sysdata(self,): num_bursts = int(len(t) // nburst + 1) for nb in range(num_bursts): iburst = slice(nb * nburst, (nb + 1) * nburst) - sysi = dat['sys']['_sysi'][iburst] + sysi = dat["sys"]["_sysi"][iburst] if len(sysi) == 0: break # Skip the first entry for the interpolation process @@ -803,242 +887,328 @@ def sci_vec_sysdata(self,): p = np.poly1d(np.polyfit(inds, t[iburst][inds], 1)) t[iburst] = p(arng) elif len(inds) == 1: - t[iburst] = ((arng - inds[0]) / (fs * 3600 * 24) + - t[iburst][inds[0]]) + t[iburst] = (arng - inds[0]) / (fs * 3600 * 24) + t[iburst][inds[0]] else: - t[iburst] = (t[iburst][0] + arng / (fs * 24 * 3600)) + t[iburst] = t[iburst][0] + arng / (fs * 24 * 3600) - tmpd = tbx._nans_like(dv['heading'][iburst]) + tmpd = tbx._nans_like(dv["heading"][iburst]) # The first status bit should be the orientation. 
- tmpd[sysi] = dv['status'][iburst][sysi] & 1 + tmpd[sysi] = dv["status"][iburst][sysi] & 1 tbx.fillgaps(tmpd, extrapFlg=True) tmpd = np.nan_to_num(tmpd, nan=0) # nans in pitch roll heading slope = np.diff(tmpd) tmpd[1:][slope < 0] = 1 tmpd[:-1][slope > 0] = 0 - dv['orientation_down'][iburst] = tmpd.astype('bool') - tbx.interpgaps(dv['batt'], t) - tbx.interpgaps(dv['c_sound'], t) - tbx.interpgaps(dv['heading'], t) - tbx.interpgaps(dv['pitch'], t) - tbx.interpgaps(dv['roll'], t) - tbx.interpgaps(dv['temp'], t) - - def read_microstrain(self,): - """Read ADV microstrain sensor (IMU) data - """ + dv["orientation_down"][iburst] = tmpd.astype("bool") + tbx.interpgaps(dv["batt"], t) + tbx.interpgaps(dv["c_sound"], t) + tbx.interpgaps(dv["heading"], t) + tbx.interpgaps(dv["pitch"], t) + tbx.interpgaps(dv["roll"], t) + tbx.interpgaps(dv["temp"], t) + + def read_microstrain(self): + """Read ADV microstrain sensor (IMU) data""" + def update_defs(dat, mag=False, orientmat=False): - imu_data = {'accel': ['m s-2', 'Acceleration'], - 'angrt': ['rad s-1', 'Angular Velocity'], - 'mag': ['gauss', 'Compass'], - 'orientmat': ['1', 'Orientation Matrix']} + imu_data = { + "accel": ["m s-2", "Acceleration"], + "angrt": ["rad s-1", "Angular Velocity"], + "mag": ["gauss", "Compass"], + "orientmat": ["1", "Orientation Matrix"], + } for ky in imu_data: - dat['units'].update({ky: imu_data[ky][0]}) - dat['long_name'].update({ky: imu_data[ky][1]}) + dat["units"].update({ky: imu_data[ky][0]}) + dat["long_name"].update({ky: imu_data[ky][1]}) if not mag: - dat['units'].pop('mag') - dat['long_name'].pop('mag') + dat["units"].pop("mag") + dat["long_name"].pop("mag") if not orientmat: - dat['units'].pop('orientmat') - dat['long_name'].pop('orientmat') + dat["units"].pop("orientmat") + dat["long_name"].pop("orientmat") # 0x71 = 113 if self.c == 0: - logging.warning('First "microstrain data" block ' - 'is before first "vector system data" block.') + logging.warning( + 'First "microstrain data" block ' 
+ 'is before first "vector system data" block.' + ) else: self.c -= 1 if self.debug: - logging.info('Reading vector microstrain data (0x71) ping #{} @ {}...' - .format(self.c, self.pos)) + logging.info( + "Reading vector microstrain data (0x71) ping #{} @ {}...".format( + self.c, self.pos + ) + ) byts0 = self.read(4) # The first 2 are the size, 3rd is count, 4th is the id. - ahrsid = unpack(self.endian + '3xB', byts0)[0] - if hasattr(self, '_ahrsid') and self._ahrsid != ahrsid: - logging.warning('AHRS_ID changes mid-file!') + ahrsid = unpack(self.endian + "3xB", byts0)[0] + if hasattr(self, "_ahrsid") and self._ahrsid != ahrsid: + logging.warning("AHRS_ID changes mid-file!") if ahrsid in [195, 204, 210, 211]: self._ahrsid = ahrsid c = self.c dat = self.data - dv = dat['data_vars'] - da = dat['attrs'] - da['has_imu'] = 1 # logical - if 'accel' not in dv: - self._dtypes += ['microstrain'] + dv = dat["data_vars"] + da = dat["attrs"] + da["has_imu"] = 1 # logical + if "accel" not in dv: + self._dtypes += ["microstrain"] if ahrsid == 195: - self._orient_dnames = ['accel', 'angrt', 'orientmat'] - dv['accel'] = tbx._nans((3, self.n_samp_guess), - dtype=np.float32) - dv['angrt'] = tbx._nans((3, self.n_samp_guess), - dtype=np.float32) - dv['orientmat'] = tbx._nans((3, 3, self.n_samp_guess), - dtype=np.float32) - rv = ['accel', 'angrt'] - if not all(x in da['rotate_vars'] for x in rv): - da['rotate_vars'].extend(rv) + self._orient_dnames = ["accel", "angrt", "orientmat"] + dv["accel"] = tbx._nans((3, self.n_samp_guess), dtype=np.float32) + dv["angrt"] = tbx._nans((3, self.n_samp_guess), dtype=np.float32) + dv["orientmat"] = tbx._nans((3, 3, self.n_samp_guess), dtype=np.float32) + rv = ["accel", "angrt"] + if not all(x in da["rotate_vars"] for x in rv): + da["rotate_vars"].extend(rv) update_defs(dat, mag=False, orientmat=True) if ahrsid in [204, 210]: - self._orient_dnames = ['accel', 'angrt', 'mag', 'orientmat'] - dv['accel'] = tbx._nans((3, self.n_samp_guess), - 
dtype=np.float32) - dv['angrt'] = tbx._nans((3, self.n_samp_guess), - dtype=np.float32) - dv['mag'] = tbx._nans((3, self.n_samp_guess), - dtype=np.float32) - rv = ['accel', 'angrt', 'mag'] - if not all(x in da['rotate_vars'] for x in rv): - da['rotate_vars'].extend(rv) + self._orient_dnames = ["accel", "angrt", "mag", "orientmat"] + dv["accel"] = tbx._nans((3, self.n_samp_guess), dtype=np.float32) + dv["angrt"] = tbx._nans((3, self.n_samp_guess), dtype=np.float32) + dv["mag"] = tbx._nans((3, self.n_samp_guess), dtype=np.float32) + rv = ["accel", "angrt", "mag"] + if not all(x in da["rotate_vars"] for x in rv): + da["rotate_vars"].extend(rv) if ahrsid == 204: - dv['orientmat'] = tbx._nans((3, 3, self.n_samp_guess), - dtype=np.float32) + dv["orientmat"] = tbx._nans( + (3, 3, self.n_samp_guess), dtype=np.float32 + ) update_defs(dat, mag=True, orientmat=True) if ahrsid == 211: - self._orient_dnames = ['angrt', 'accel', 'mag'] - dv['angrt'] = tbx._nans((3, self.n_samp_guess), - dtype=np.float32) - dv['accel'] = tbx._nans((3, self.n_samp_guess), - dtype=np.float32) - dv['mag'] = tbx._nans((3, self.n_samp_guess), - dtype=np.float32) - rv = ['angrt', 'accel', 'mag'] - if not all(x in da['rotate_vars'] for x in rv): - da['rotate_vars'].extend(rv) + self._orient_dnames = ["angrt", "accel", "mag"] + dv["angrt"] = tbx._nans((3, self.n_samp_guess), dtype=np.float32) + dv["accel"] = tbx._nans((3, self.n_samp_guess), dtype=np.float32) + dv["mag"] = tbx._nans((3, self.n_samp_guess), dtype=np.float32) + rv = ["angrt", "accel", "mag"] + if not all(x in da["rotate_vars"] for x in rv): + da["rotate_vars"].extend(rv) update_defs(dat, mag=True, orientmat=False) - byts = '' + byts = "" if ahrsid == 195: # 0xc3 byts = self.read(64) - dt = unpack(self.endian + '6f9f4x', byts) - (dv['angrt'][:, c], - dv['accel'][:, c]) = (dt[0:3], dt[3:6],) - dv['orientmat'][:, :, c] = ((dt[6:9], dt[9:12], dt[12:15])) + dt = unpack(self.endian + "6f9f4x", byts) + (dv["angrt"][:, c], dv["accel"][:, c]) = ( + 
dt[0:3], + dt[3:6], + ) + dv["orientmat"][:, :, c] = (dt[6:9], dt[9:12], dt[12:15]) elif ahrsid == 204: # 0xcc byts = self.read(78) # This skips the "DWORD" (4 bytes) and the AHRS checksum # (2 bytes) - dt = unpack(self.endian + '18f6x', byts) - (dv['accel'][:, c], - dv['angrt'][:, c], - dv['mag'][:, c]) = (dt[0:3], dt[3:6], dt[6:9],) - dv['orientmat'][:, :, c] = ((dt[9:12], dt[12:15], dt[15:18])) + dt = unpack(self.endian + "18f6x", byts) + (dv["accel"][:, c], dv["angrt"][:, c], dv["mag"][:, c]) = ( + dt[0:3], + dt[3:6], + dt[6:9], + ) + dv["orientmat"][:, :, c] = (dt[9:12], dt[12:15], dt[15:18]) elif ahrsid == 211: byts = self.read(42) - dt = unpack(self.endian + '9f6x', byts) - (dv['angrt'][:, c], - dv['accel'][:, c], - dv['mag'][:, c]) = (dt[0:3], dt[3:6], dt[6:9],) + dt = unpack(self.endian + "9f6x", byts) + (dv["angrt"][:, c], dv["accel"][:, c], dv["mag"][:, c]) = ( + dt[0:3], + dt[3:6], + dt[6:9], + ) else: - logging.warning('Unrecognized IMU identifier: ' + str(ahrsid)) + logging.warning("Unrecognized IMU identifier: " + str(ahrsid)) self.f.seek(-2, 1) return 10 self.checksum(byts0 + byts) self.c += 1 # reset the increment - def sci_microstrain(self,): - """Rotate orientation data into ADV coordinate system. - """ + def sci_microstrain(self): + """Rotate orientation data into ADV coordinate system.""" # MS = MicroStrain - dv = self.data['data_vars'] + dv = self.data["data_vars"] for nm in self._orient_dnames: # Rotate the MS orientation data (in MS coordinate system) # to be consistent with the ADV coordinate system. 
# (x,y,-z)_ms = (z,y,x)_adv - (dv[nm][2], - dv[nm][0]) = (dv[nm][0], - -dv[nm][2].copy()) - if 'orientmat' in self._orient_dnames: + (dv[nm][2], dv[nm][0]) = (dv[nm][0], -dv[nm][2].copy()) + if "orientmat" in self._orient_dnames: # MS coordinate system is in North-East-Down (NED), # we want East-North-Up (ENU) - dv['orientmat'][:, 2] *= -1 - (dv['orientmat'][:, 0], - dv['orientmat'][:, 1]) = (dv['orientmat'][:, 1], - dv['orientmat'][:, 0].copy()) - if 'accel' in dv: + dv["orientmat"][:, 2] *= -1 + (dv["orientmat"][:, 0], dv["orientmat"][:, 1]) = ( + dv["orientmat"][:, 1], + dv["orientmat"][:, 0].copy(), + ) + if "accel" in dv: # This value comes from the MS 3DM-GX3 MIP manual - dv['accel'] *= 9.80665 + dv["accel"] *= 9.80665 if self._ahrsid in [195, 211]: # These are DAng and DVel, so we convert them to angrt, accel here - dv['angrt'] *= self.config['fs'] - dv['accel'] *= self.config['fs'] + dv["angrt"] *= self.config["fs"] + dv["accel"] *= self.config["fs"] - def read_awac_profile(self,): + def read_awac_profile(self): # ID: '0x20' = 32 dat = self.data if self.debug: - logging.info('Reading AWAC velocity data (0x20) ping #{} @ {}...' 
- .format(self.c, self.pos)) - nbins = self.config['usr']['n_bins'] - if 'temp' not in dat['data_vars']: + logging.info( + "Reading AWAC velocity data (0x20) ping #{} @ {}...".format( + self.c, self.pos + ) + ) + nbins = self.config["usr"]["n_bins"] + if "temp" not in dat["data_vars"]: self._init_data(nortek_defs.awac_profile) - self._dtypes += ['awac_profile'] + self._dtypes += ["awac_profile"] # Note: docs state there is 'fill' byte at the end, if nbins is odd, # but doesn't appear to be the case - n = self.config['usr']['n_beams'] - byts = self.read(116 + n*3 * nbins) + n = self.config["usr"]["n_beams"] + byts = self.read(116 + n * 3 * nbins) c = self.c - dat['coords']['time'][c] = self.rd_time(byts[2:8]) - ds = dat['sys'] - dv = dat['data_vars'] - (dv['error'][c], - ds['AnaIn1'][c], - dv['batt'][c], - dv['c_sound'][c], - dv['heading'][c], - dv['pitch'][c], - dv['roll'][c], - p_msb, - dv['status'][c], - p_lsw, - dv['temp'][c],) = unpack(self.endian + '7HBB2H', byts[8:28]) - dv['pressure'][c] = (65536 * p_msb + p_lsw) + dat["coords"]["time"][c] = self.rd_time(byts[2:8]) + ds = dat["sys"] + dv = dat["data_vars"] + ( + dv["error"][c], + ds["AnaIn1"][c], + dv["batt"][c], + dv["c_sound"][c], + dv["heading"][c], + dv["pitch"][c], + dv["roll"][c], + p_msb, + dv["status"][c], + p_lsw, + dv["temp"][c], + ) = unpack(self.endian + "5H2hBBHh", byts[8:28]) + dv["pressure"][c] = 65536 * p_msb + p_lsw # The nortek system integrator manual specifies an 88byte 'spare' # field, therefore we start at 116. 
- tmp = unpack(self.endian + str(n * nbins) + 'h' + - str(n * nbins) + 'B', byts[116:116 + n*3 * nbins]) + tmp = unpack( + self.endian + str(n * nbins) + "h" + str(n * nbins) + "B", + byts[116 : 116 + n * 3 * nbins], + ) for idx in range(n): - dv['vel'][idx, :, c] = tmp[idx * nbins: (idx + 1) * nbins] - dv['amp'][idx, :, c] = tmp[(idx + n) * nbins: (idx + n+1) * nbins] + dv["vel"][idx, :, c] = tmp[idx * nbins : (idx + 1) * nbins] + dv["amp"][idx, :, c] = tmp[(idx + n) * nbins : (idx + n + 1) * nbins] self.checksum(byts) self.c += 1 - def sci_awac_profile(self,): + def sci_awac_profile(self): self._sci_data(nortek_defs.awac_profile) # Calculate the ranges. - cs_coefs = {2000: 0.0239, - 1000: 0.0478, - 600: 0.0797, - 400: 0.1195} + cs_coefs = {2000: 0.0239, 1000: 0.0478, 600: 0.0797, 400: 0.1195} h_ang = 25 * (np.pi / 180) # Head angle is 25 degrees for all awacs. # Cell size - cs = round(float(self.config['bin_length']) / 256. * - cs_coefs[self.config['head']['carrier_freq_kHz']] * np.cos(h_ang), ndigits=2) + cs = round( + float(self.config["bin_length"]) + / 256.0 + * cs_coefs[self.config["head"]["carrier_freq_kHz"]] + * np.cos(h_ang), + ndigits=2, + ) # Blanking distance - bd = round(self.config['blank_dist'] * - 0.0229 * np.cos(h_ang) - cs, ndigits=2) + bd = round(self.config["blank_dist"] * 0.0229 * np.cos(h_ang) - cs, ndigits=2) - r = (np.float32(np.arange(self.config['usr']['n_bins']))+1)*cs + bd - self.data['coords']['range'] = r - self.data['attrs']['cell_size'] = cs - self.data['attrs']['blank_dist'] = bd + r = (np.float32(np.arange(self.config["usr"]["n_bins"])) + 1) * cs + bd + self.data["coords"]["range"] = r + self.data["attrs"]["cell_size"] = cs + self.data["attrs"]["blank_dist"] = bd - def dat2sci(self,): + def read_awac_waves_hdr(self): + # ID: '0x31' + c = self.c + if self.debug: + print( + "Reading vector header data (0x31) ping #{} @ {}...".format( + self.c, self.pos + ) + ) + hdrnow = {} + dat = self.data + ds = dat["sys"] + dv = dat["data_vars"] 
+ if "time" not in dat["coords"]: + self._init_data(nortek_defs.waves_hdrdata) + byts = self.read(56) + # The first two are size, the next 6 are time. + tmp = unpack(self.endian + "8x4H3h2HhH4B6H5h", byts) + dat["coords"]["time"][c] = self.rd_time(byts[2:8]) + hdrnow["n_records_alt"] = tmp[0] + hdrnow["blank_dist_alt"] = tmp[1] # counts + ds["batt_alt"][c] = tmp[2] # voltage (0.1 V) + dv["c_sound_alt"][c] = tmp[3] # c (0.1 m/s) + dv["heading_alt"][c] = tmp[4] # (0.1 deg) + dv["pitch_alt"][c] = tmp[5] # (0.1 deg) + dv["roll_alt"][c] = tmp[6] # (0.1 deg) + dv["pressure1_alt"][c] = tmp[7] # min pressure previous profile (0.001 dbar) + dv["pressure2_alt"][c] = tmp[8] # max pressure previous profile (0.001 dbar) + dv["temp_alt"][c] = tmp[9] # (0.01 deg C) + hdrnow["cell_size_alt"][c] = tmp[10] # (counts of T3) + hdrnow["noise_alt"][c] = tmp[11:15] # noise amplitude beam 1-4 (counts) + hdrnow["proc_magn_alt"][c] = tmp[15:19] # processing magnitude beam 1-4 + hdrnow["n_past_window_alt"] = tmp[ + 19 + ] # number of samples of AST window past boundary + hdrnow["n_window_alt"] = tmp[20] # AST window size (# samples) + hdrnow["Spare1"] = tmp[21:] + self.checksum(byts) + if "data_header" not in self.config: + self.config["data_header"] = hdrnow + else: + if not isinstance(self.config["data_header"], list): + self.config["data_header"] = [self.config["data_header"]] + self.config["data_header"] += [hdrnow] + + def read_awac_waves(self): + """Read awac wave and suv data""" + # IDs: 0x30 & 0x36 + c = self.c + dat = self.data + if self.debug: + print( + "Reading awac wave data (0x30) ping #{} @ {}...".format( + self.c, self.pos + ) + ) + if "dist1_alt" not in dat["data_vars"]: + self._init_data(nortek_defs.wave_data) + self._dtypes += ["wave_data"] + # The first two are size + byts = self.read(20) + ds = dat["sys"] + dv = dat["data_vars"] + ( + dv["pressure"][c], # (0.001 dbar) + dv["dist1_alt"][c], # distance 1 to surface, vertical beam (mm) + ds["AnaIn_alt"][c], # analog input 1 
+ dv["vel_alt"][0, c], # velocity beam 1 (mm/s) East for SUV + dv["vel_alt"][1, c], # North for SUV + dv["vel_alt"][2, c], # Up for SUV + dv["dist2_alt"][ + c + ], # distance 2 to surface, vertical beam (mm) or vel 4 for non-AST + dv["amp_alt"][0, c], # amplitude beam 1 (counts) + dv["amp_alt"][1, c], # amplitude beam 2 (counts) + dv["amp_alt"][2, c], # amplitude beam 3 (counts) + # AST quality (counts) or amplitude beam 4 for non-AST + dv["quality_alt"][c], + ) = unpack(self.endian + "3H4h4B", byts) + self.checksum(byts) + self.c += 1 + + def dat2sci(self): for nm in self._dtypes: - getattr(self, 'sci_' + nm)() - for nm in ['data_header', 'checkdata']: + getattr(self, "sci_" + nm)() + for nm in ["data_header", "checkdata"]: if nm in self.config and isinstance(self.config[nm], list): self.config[nm] = _recatenate(self.config[nm]) - def __exit__(self, type, value, trace): - self.close() - - def __enter__(self): - return self - def _crop_data(obj, range, n_lastdim): for nm, dat in obj.items(): @@ -1049,12 +1219,11 @@ def _crop_data(obj, range, n_lastdim): def _recatenate(obj): out = type(obj[0])() for ky in list(obj[0].keys()): - if ky in ['__data_groups__', '_type']: + if ky in ["__data_groups__", "_type"]: continue val0 = obj[0][ky] if isinstance(val0, np.ndarray) and val0.size > 1: - out[ky] = np.concatenate([val[ky][..., None] for val in obj], - axis=-1) + out[ky] = np.concatenate([val[ky][..., None] for val in obj], axis=-1) else: out[ky] = np.array([val[ky] for val in obj]) return out diff --git a/mhkit/dolfyn/io/nortek2.py b/mhkit/dolfyn/io/nortek2.py index fe4e3c9e7..fd984a817 100644 --- a/mhkit/dolfyn/io/nortek2.py +++ b/mhkit/dolfyn/io/nortek2.py @@ -14,8 +14,15 @@ from ..time import epoch2dt64, _fill_time_gaps -def read_signature(filename, userdata=True, nens=None, rebuild_index=False, - debug=False, **kwargs): +def read_signature( + filename, + userdata=True, + nens=None, + rebuild_index=False, + debug=False, + dual_profile=False, + **kwargs +): """ Read 
a Nortek Signature (.ad2cp) datafile @@ -26,13 +33,15 @@ def read_signature(filename, userdata=True, nens=None, rebuild_index=False, userdata : bool To search for and use a .userdata.json or not nens : None, int or 2-element tuple (start, stop) - Number of pings or ensembles to read from the file. + Number of pings or ensembles to read from the file. Default is None, read entire file rebuild_index : bool Force rebuild of dolfyn-written datafile index. Useful for code updates. Default = False debug : bool Logs debugger ouput if true. Default = False + dual_profile : bool + Set to true if instrument is running multiple profiles. Default = False Returns ------- @@ -45,11 +54,13 @@ def read_signature(filename, userdata=True, nens=None, rebuild_index=False, for handler in logging.root.handlers[:]: logging.root.removeHandler(handler) filepath = Path(filename) - logfile = filepath.with_suffix('.dolfyn.log') - logging.basicConfig(filename=str(logfile), - filemode='w', - level=logging.NOTSET, - format='%(name)s - %(levelname)s - %(message)s') + logfile = filepath.with_suffix(".dolfyn.log") + logging.basicConfig( + filename=str(logfile), + filemode="w", + level=logging.NOTSET, + format="%(name)s - %(levelname)s - %(message)s", + ) if nens is None: nens = [0, None] @@ -61,51 +72,58 @@ def read_signature(filename, userdata=True, nens=None, rebuild_index=False, else: # passes: it's a list/tuple/array if n != 2: - raise TypeError('nens must be: None (), int, or len 2') + raise TypeError("nens must be: None (), int, or len 2") userdata = _find_userdata(filename, userdata) - rdr = _Ad2cpReader(filename, rebuild_index=rebuild_index, debug=debug) + rdr = _Ad2cpReader( + filename, rebuild_index=rebuild_index, debug=debug, dual_profile=dual_profile + ) d = rdr.readfile(nens[0], nens[1]) rdr.sci_data(d) + if rdr._dp: + _clean_dp_skips(d) out = _reorg(d) _reduce(out) # Convert time to dt64 and fill gaps - coords = out['coords'] - t_list = [t for t in coords if 'time' in t] + coords = 
out["coords"] + t_list = [t for t in coords if "time" in t] for ky in t_list: tdat = coords[ky] tdat[tdat == 0] = np.NaN if np.isnan(tdat).any(): - tag = ky.lstrip('time') - warnings.warn("Zero/NaN values found in '{}'. Interpolating and " - "extrapolating them. To identify which values were filled later, " - "look for 0 values in 'status{}'".format(ky, tag)) - tdat = _fill_time_gaps(tdat, sample_rate_hz=out['attrs']['fs']) - coords[ky] = epoch2dt64(tdat).astype('datetime64[ns]') + tag = ky.lstrip("time") + warnings.warn( + "Zero/NaN values found in '{}'. Interpolating and " + "extrapolating them. To identify which values were filled later, " + "look for 0 values in 'status{}'".format(ky, tag) + ) + tdat = _fill_time_gaps(tdat, sample_rate_hz=out["attrs"]["fs"]) + coords[ky] = epoch2dt64(tdat).astype("datetime64[ns]") declin = None for nm in userdata: - if 'dec' in nm: + if "dec" in nm: declin = userdata[nm] else: - out['attrs'][nm] = userdata[nm] + out["attrs"][nm] = userdata[nm] # Create xarray dataset from upper level dictionary ds = _create_dataset(out) ds = _set_coords(ds, ref_frame=ds.coord_sys) - if 'orientmat' not in ds: - ds['orientmat'] = _euler2orient( - ds['time'], ds['heading'], ds['pitch'], ds['roll']) + if "orientmat" not in ds: + ds["orientmat"] = _euler2orient( + ds["time"], ds["heading"], ds["pitch"], ds["roll"] + ) if declin is not None: set_declination(ds, declin, inplace=True) # Convert config dictionary to json string for key in list(ds.attrs.keys()): - if 'config' in key: + if "config" in key: ds.attrs[key] = json.dumps(ds.attrs[key]) # Close handler @@ -114,32 +132,53 @@ def read_signature(filename, userdata=True, nens=None, rebuild_index=False, logging.root.removeHandler(handler) handler.close() - return ds - - -class _Ad2cpReader(): - def __init__(self, fname, endian=None, bufsize=None, rebuild_index=False, - debug=False): + # Return two datasets if dual profile + if rdr._dp: + return split_dp_datasets(ds) + else: + return ds + + +class 
_Ad2cpReader: + def __init__( + self, + fname, + endian=None, + bufsize=None, + rebuild_index=False, + debug=False, + dual_profile=False, + ): self.fname = fname self.debug = debug self._check_nortek(endian) self.f.seek(0, 2) # Seek to end self._eof = self.f.tell() - self._index = lib.get_index(fname, - reload=rebuild_index, - debug=debug) + self.start_pos = self._check_header() + self._index, self._dp = lib.get_index( + fname, + pos=self.start_pos, + eof=self._eof, + rebuild=rebuild_index, + debug=debug, + dp=dual_profile, + ) self._reopen(bufsize) self.filehead_config = self._read_filehead_config_string() - self._ens_pos = self._index['pos'][lib._boolarray_firstensemble_ping( - self._index)] + self._ens_pos = self._index["pos"][ + lib._boolarray_firstensemble_ping(self._index) + ] self._lastblock_iswhole = self._calc_lastblock_iswhole() self._config = lib._calc_config(self._index) self._init_burst_readers() self.unknown_ID_count = {} - def _calc_lastblock_iswhole(self, ): - blocksize, blocksize_count = np.unique(np.diff(self._ens_pos), - return_counts=True) + def _calc_lastblock_iswhole( + self, + ): + blocksize, blocksize_count = np.unique( + np.diff(self._ens_pos), return_counts=True + ) standard_blocksize = blocksize[blocksize_count.argmax()] return (self._eof - self._ens_pos[-1]) == standard_blocksize @@ -147,17 +186,36 @@ def _check_nortek(self, endian): self._reopen(10) byts = self.f.read(2) if endian is None: - if unpack('<' + 'BB', byts) == (165, 10): - endian = '<' - elif unpack('>' + 'BB', byts) == (165, 10): - endian = '>' + if unpack("<" + "BB", byts) == (165, 10): + endian = "<" + elif unpack(">" + "BB", byts) == (165, 10): + endian = ">" else: raise Exception( "I/O error: could not determine the 'endianness' " "of the file. Are you sure this is a Nortek " - "AD2CP file?") + "AD2CP file?" 
+ ) self.endian = endian + def _check_header(self): + def find_all(s, c): + idx = s.find(c) + while idx != -1: + yield idx + idx = s.find(c, idx + 1) + + # Open the entire file + self._reopen(self._eof) + pk = self.f.peek(1) + # Search for multiple saved headers + found = [i for i in find_all(pk, b"GETCLOCKSTR")] + if len(found) < 2: + return 0 + else: + start_idx = found[-1] - 11 + return start_idx + def _reopen(self, bufsize=None): if bufsize is None: bufsize = 1000000 @@ -165,15 +223,17 @@ def _reopen(self, bufsize=None): self.f.close() except AttributeError: pass - self.f = open(_abspath(self.fname), 'rb', bufsize) + self.f = open(_abspath(self.fname), "rb", bufsize) - def _read_filehead_config_string(self, ): + def _read_filehead_config_string( + self, + ): hdr = self._read_hdr() out = {} - s_id, string = self._read_str(hdr['sz']) - string = string.decode('utf-8') + s_id, string = self._read_str(hdr["sz"]) + string = string.decode("utf-8") for ln in string.splitlines(): - ky, val = ln.split(',', 1) + ky, val = ln.split(",", 1) if ky in out: # There are more than one of this key if not isinstance(out[ky], list): @@ -185,11 +245,11 @@ def _read_filehead_config_string(self, ): out[ky] = val out2 = {} for ky in out: - if ky.startswith('GET'): + if ky.startswith("GET"): dat = out[ky] - d = out2[ky.lstrip('GET')] = dict() - for itm in dat.split(','): - k, val = itm.split('=') + d = out2[ky.lstrip("GET")] = dict() + for itm in dat.split(","): + k, val = itm.split("=") try: val = int(val) except ValueError: @@ -202,43 +262,60 @@ def _read_filehead_config_string(self, ): out2[ky] = out[ky] return out2 - def _init_burst_readers(self, ): + def _init_burst_readers( + self, + ): self._burst_readers = {} for rdr_id, cfg in self._config.items(): if rdr_id == 28: self._burst_readers[rdr_id] = defs._calc_echo_struct( - cfg['_config'], cfg['n_cells']) + cfg["_config"], cfg["n_cells"] + ) elif rdr_id == 23: self._burst_readers[rdr_id] = defs._calc_bt_struct( - cfg['_config'], 
cfg['n_beams']) + cfg["_config"], cfg["n_beams"] + ) else: self._burst_readers[rdr_id] = defs._calc_burst_struct( - cfg['_config'], cfg['n_beams'], cfg['n_cells']) + cfg["_config"], cfg["n_beams"], cfg["n_cells"] + ) def init_data(self, ens_start, ens_stop): outdat = {} nens = int(ens_stop - ens_start) - n26 = ((self._index['ID'] == 26) & - (self._index['ens'] >= ens_start) & - (self._index['ens'] < ens_stop)).sum() + + # ID 26 and 31 recorded infrequently + def n_id(id): + return ( + (self._index["ID"] == id) + & (self._index["ens"] >= ens_start) + & (self._index["ens"] < ens_stop) + ).sum() + + n_altraw = {26: n_id(26), 31: n_id(31)} + if not n_altraw[26] and 26 in self._burst_readers: + self._burst_readers.pop(26) + if not n_altraw[31] and 31 in self._burst_readers: + self._burst_readers.pop(31) + for ky in self._burst_readers: - if ky == 26: - n = n26 - ens = np.zeros(n, dtype='uint32') + if (ky == 26) or (ky == 31): + n = n_altraw[ky] + ens = np.zeros(n, dtype="uint32") else: - ens = np.arange(ens_start, - ens_stop).astype('uint32') + ens = np.arange(ens_start, ens_stop).astype("uint32") n = nens outdat[ky] = self._burst_readers[ky].init_data(n) - outdat[ky]['ensemble'] = ens - outdat[ky]['units'] = self._burst_readers[ky].data_units() - outdat[ky]['long_name'] = self._burst_readers[ky].data_longnames() - outdat[ky]['standard_name'] = self._burst_readers[ky].data_stdnames() + outdat[ky]["ensemble"] = ens + outdat[ky]["units"] = self._burst_readers[ky].data_units() + outdat[ky]["long_name"] = self._burst_readers[ky].data_longnames() + outdat[ky]["standard_name"] = self._burst_readers[ky].data_stdnames() + return outdat def _read_hdr(self, do_cs=False): res = defs.header.read2dict(self.f, cs=do_cs) - if res['sync'] != 165: + if res["sync"] != 165: raise Exception("Out of sync!") return res @@ -262,27 +339,30 @@ def readfile(self, ens_start=0, ens_stop=None): ens_stop = int(ens_stop) nens = ens_stop - ens_start outdat = self.init_data(ens_start, ens_stop) - 
outdat['filehead_config'] = self.filehead_config - print('Reading file %s ...' % self.fname) + outdat["filehead_config"] = self.filehead_config + print("Reading file %s ..." % self.fname) c = 0 - c26 = 0 + c_altraw = {26: 0, 31: 0} self.f.seek(self._ens_pos[ens_start], 0) while True: try: hdr = self._read_hdr() except IOError: return outdat - id = hdr['id'] - if id in [21, 22, 23, 24, 28]: # vel, bt, vel_b5, echo + id = hdr["id"] + if id in [21, 22, 23, 24, 28]: # "burst data record" (vel + ast), + # "avg data record" (vel_avg + ast_avg), "bottom track data record" (bt), + # "interleaved burst data record" (vel_b5), "echosounder record" (echo) self._read_burst(id, outdat[id], c) - elif id in [26]: # alt_raw (altimeter burst) - rdr = self._burst_readers[26] - if not hasattr(rdr, '_nsamp_index'): + elif id in [26, 31]: + # "burst altimeter raw record" (_altraw), "avg altimeter raw record" (_altraw_avg) + rdr = self._burst_readers[id] + if not hasattr(rdr, "_nsamp_index"): first_pass = True - tmp_idx = rdr._nsamp_index = rdr._names.index('altraw_nsamp') # noqa + tmp_idx = rdr._nsamp_index = rdr._names.index("nsamp_alt") shift = rdr._nsamp_shift = calcsize( - defs._format(rdr._format[:tmp_idx], - rdr._N[:tmp_idx])) + defs._format(rdr._format[:tmp_idx], rdr._N[:tmp_idx]) + ) else: first_pass = False tmp_idx = rdr._nsamp_index @@ -290,50 +370,53 @@ def readfile(self, ens_start=0, ens_stop=None): tmp_idx = tmp_idx + 2 # Don't add in-place self.f.seek(shift, 1) # Now read the num_samples - sz = unpack('= _posnow): + while self.f.tell() >= _posnow: c += 1 if c + ens_start + 1 >= nens_total: # Again check end of count list @@ -375,15 +457,42 @@ def sci_data(self, dat): continue rdr = self._burst_readers[id] rdr.sci_data(dnow) - if 'vel' in dnow and 'vel_scale' in dnow: - dnow['vel'] = (dnow['vel'] * - 10.0 ** dnow['vel_scale']).astype('float32') - - def __exit__(self, type, value, trace,): - self.f.close() - - def __enter__(self,): - return self + if "vel" in dnow and 
"vel_scale" in dnow: + dnow["vel"] = (dnow["vel"] * 10.0 ** dnow["vel_scale"]).astype( + "float32" + ) + + +def _altraw_reorg(outdat, tag=""): + """Submethod for `_reorg` particular to raw altimeter pings (ID 26 and 31)""" + for ky in list(outdat["data_vars"]): + if ky.endswith("raw" + tag) and not ky.endswith("_altraw" + tag): + outdat["data_vars"].pop(ky) + outdat["coords"]["time_altraw" + tag] = outdat["coords"].pop("timeraw" + tag) + # convert "signed fractional" to float + outdat["data_vars"]["samp_altraw" + tag] = ( + outdat["data_vars"]["samp_altraw" + tag].astype("float32") / 2**8 + ) + + # Read altimeter status + outdat["data_vars"].pop("status_altraw" + tag) + status_alt = lib._alt_status2data(outdat["data_vars"]["status_alt" + tag]) + for ky in status_alt: + outdat["attrs"][ky + tag] = lib._collapse( + status_alt[ky].astype("uint8"), name=ky + ) + outdat["data_vars"].pop("status_alt" + tag) + + # Power level index + power = {0: "high", 1: "med-high", 2: "med-low", 3: "low"} + outdat["attrs"]["power_level_alt" + tag] = power[ + outdat["attrs"].pop("power_level_idx_alt" + tag) + ] + + # Other attrs + for ky in list(outdat["attrs"]): + if ky.endswith("raw" + tag): + outdat["attrs"][ky.split("raw")[0] + "_alt" + tag] = outdat["attrs"].pop(ky) def _reorg(dat): @@ -392,17 +501,31 @@ def _reorg(dat): (organized by ID), and combines them into a single dictionary. 
""" - outdat = {'data_vars': {}, 'coords': {}, 'attrs': {}, - 'units': {}, 'long_name': {}, 'standard_name': {}, - 'sys': {}, 'altraw': {}} - cfg = outdat['attrs'] - cfh = cfg['filehead_config'] = dat['filehead_config'] - cfg['inst_model'] = (cfh['ID'].split(',')[0][5:-1]) - cfg['inst_make'] = 'Nortek' - cfg['inst_type'] = 'ADCP' - - for id, tag in [(21, ''), (22, '_avg'), (23, '_bt'), - (24, '_b5'), (26, '_ast'), (28, '_echo')]: + outdat = { + "data_vars": {}, + "coords": {}, + "attrs": {}, + "units": {}, + "long_name": {}, + "standard_name": {}, + "sys": {}, + "altraw": {}, + } + cfg = outdat["attrs"] + cfh = cfg["filehead_config"] = dat["filehead_config"] + cfg["inst_model"] = cfh["ID"].split(",")[0][5:-1] + cfg["inst_make"] = "Nortek" + cfg["inst_type"] = "ADCP" + + for id, tag in [ + (21, ""), + (22, "_avg"), + (23, "_bt"), + (24, "_b5"), + (26, "raw"), + (28, "_echo"), + (31, "raw_avg"), + ]: if id in [24, 26]: collapse_exclude = [0] else: @@ -410,211 +533,322 @@ def _reorg(dat): if id not in dat: continue dnow = dat[id] - outdat['units'].update(dnow['units']) - outdat['long_name'].update(dnow['long_name']) - for ky in dnow['units']: - if not dnow['standard_name'][ky]: - dnow['standard_name'].pop(ky) - outdat['standard_name'].update(dnow['standard_name']) - cfg['burst_config' + tag] = lib._headconfig_int2dict( - lib._collapse(dnow['config'], exclude=collapse_exclude, - name='config')) - outdat['coords']['time' + tag] = lib._calc_time( - dnow['year'] + 1900, - dnow['month'], - dnow['day'], - dnow['hour'], - dnow['minute'], - dnow['second'], - dnow['usec100'].astype('uint32') * 100) + outdat["units"].update(dnow["units"]) + outdat["long_name"].update(dnow["long_name"]) + for ky in dnow["units"]: + if not dnow["standard_name"][ky]: + dnow["standard_name"].pop(ky) + outdat["standard_name"].update(dnow["standard_name"]) + cfg["burst_config" + tag] = lib._headconfig_int2dict( + lib._collapse(dnow["config"], exclude=collapse_exclude, name="config") + ) + 
outdat["coords"]["time" + tag] = lib._calc_time( + dnow["year"] + 1900, + dnow["month"], + dnow["day"], + dnow["hour"], + dnow["minute"], + dnow["second"], + dnow["usec100"].astype("uint32") * 100, + ) tmp = lib._beams_cy_int2dict( - lib._collapse(dnow['beam_config'], exclude=collapse_exclude, - name='beam_config'), 21) - cfg['n_cells' + tag] = tmp['n_cells'] - cfg['coord_sys_axes' + tag] = tmp['cy'] - cfg['n_beams' + tag] = tmp['n_beams'] - cfg['ambig_vel' + - tag] = lib._collapse(dnow['ambig_vel'], name='ambig_vel') - - for ky in ['SerialNum', 'cell_size', 'blank_dist', 'nominal_corr', - 'power_level_dB']: - cfg[ky + tag] = lib._collapse(dnow[ky], - exclude=collapse_exclude, - name=ky) - - for ky in ['c_sound', 'temp', 'pressure', 'heading', 'pitch', 'roll', - 'mag', 'accel', 'batt', 'temp_clock', 'error', - 'status', 'ensemble', - ]: - outdat['data_vars'][ky + tag] = dnow[ky] - if 'ensemble' in ky: - outdat['data_vars'][ky + tag] += 1 - outdat['units'][ky + tag] = '#' - outdat['long_name'][ky + tag] = 'Ensemble Number' - outdat['standard_name'][ky + tag] = 'number_of_observations' - - for ky in ['vel', 'amp', 'corr', 'prcnt_gd', 'echo', 'dist', - 'orientmat', 'angrt', 'quaternions', 'ast_pressure', - 'alt_dist', 'alt_quality', 'alt_status', - 'ast_dist', 'ast_quality', 'ast_offset_time', - 'altraw_nsamp', 'altraw_dsamp', 'altraw_samp', - 'status0', 'fom', 'temp_press', 'press_std', - 'pitch_std', 'roll_std', 'heading_std', 'xmit_energy', - ]: + lib._collapse( + dnow["beam_config"], exclude=collapse_exclude, name="beam_config" + ), + 21, # always 21 here + ) + cfg["n_cells" + tag] = tmp["n_cells"] + cfg["coord_sys_axes" + tag] = tmp["cy"] + cfg["n_beams" + tag] = tmp["n_beams"] + cfg["ambig_vel" + tag] = lib._collapse(dnow["ambig_vel"], name="ambig_vel") + + for ky in [ + "SerialNum", + "cell_size", + "blank_dist", + "nominal_corr", + "power_level_dB", + ]: + cfg[ky + tag] = lib._collapse(dnow[ky], exclude=collapse_exclude, name=ky) + + for ky in [ + "c_sound", + 
"temp", + "pressure", + "heading", + "pitch", + "roll", + "mag", + "accel", + "batt", + "temp_clock", + "error", + "status", + "ensemble", + ]: + outdat["data_vars"][ky + tag] = dnow[ky] + if "ensemble" in ky: + outdat["data_vars"][ky + tag] += 1 + outdat["units"][ky + tag] = "#" + outdat["long_name"][ky + tag] = "Ensemble Number" + outdat["standard_name"][ky + tag] = "number_of_observations" + + for ky in [ + "vel", + "amp", + "corr", + "prcnt_gd", + "echo", + "dist", + "orientmat", + "angrt", + "quaternions", + "pressure_alt", + "le_dist_alt", + "le_quality_alt", + "status_alt", + "ast_dist_alt", + "ast_quality_alt", + "ast_offset_time_alt", + "nsamp_alt", + "dsamp_alt", + "samp_alt", + "status0", + "fom", + "temp_press", + "press_std", + "pitch_std", + "roll_std", + "heading_std", + "xmit_energy", + ]: if ky in dnow: - outdat['data_vars'][ky + tag] = dnow[ky] + outdat["data_vars"][ky + tag] = dnow[ky] # Move 'altimeter raw' data to its own down-sampled structure if 26 in dat: - ard = outdat['altraw'] - for ky in list(outdat['data_vars']): - if ky.endswith('_ast'): - grp = ky.split('.')[0] - if '.' 
in ky and grp not in ard: - ard[grp] = {} - ard[ky.rstrip('_ast')] = outdat['data_vars'].pop(ky) - - # Read altimeter status - alt_status = lib._alt_status2data(outdat['data_vars']['alt_status']) - for ky in alt_status: - outdat['attrs'][ky] = lib._collapse( - alt_status[ky].astype('uint8'), name=ky) - outdat['data_vars'].pop('alt_status') - - # Power level index - power = {0: 'high', 1: 'med-high', 2: 'med-low', 3: 'low'} - outdat['attrs']['power_level_alt'] = power[outdat['attrs'].pop( - 'power_level_idx_alt')] + _altraw_reorg(outdat) + if 31 in dat: + _altraw_reorg(outdat, tag="_avg") # Read status data - status0_vars = [x for x in outdat['data_vars'] if 'status0' in x] + status0_vars = [x for x in outdat["data_vars"] if "status0" in x] # Status data is the same across all tags, and there is always a 'status' and 'status0' status0_key = status0_vars[0] - status0_data = lib._status02data(outdat['data_vars'][status0_key]) - status_key = status0_key.replace('0', '') - status_data = lib._status2data(outdat['data_vars'][status_key]) + status0_data = lib._status02data(outdat["data_vars"][status0_key]) + status_key = status0_key.replace("0", "") + status_data = lib._status2data(outdat["data_vars"][status_key]) # Individual status codes # Wake up state - wake = {0: 'bad power', 1: 'power on', 2: 'break', 3: 'clock'} - outdat['attrs']['wakeup_state'] = wake[lib._collapse( - status_data.pop('wakeup_state'), name=ky)] + wake = {0: "bad power", 1: "power on", 2: "break", 3: "clock"} + outdat["attrs"]["wakeup_state"] = wake[ + lib._collapse(status_data.pop("wakeup_state"), name=ky) + ] # Instrument direction # 0: XUP, 1: XDOWN, 2: YUP, 3: YDOWN, 4: ZUP, 5: ZDOWN, # 7: AHRS, handle as ZUP - nortek_orient = {0: 'horizontal', 1: 'horizontal', 2: 'horizontal', - 3: 'horizontal', 4: 'up', 5: 'down', 7: 'AHRS'} - outdat['attrs']['orientation'] = nortek_orient[lib._collapse( - status_data.pop('orient_up'), name='orientation')] + nortek_orient = { + 0: "horizontal", + 1: 
"horizontal", + 2: "horizontal", + 3: "horizontal", + 4: "up", + 5: "down", + 7: "AHRS", + } + outdat["attrs"]["orientation"] = nortek_orient[ + lib._collapse(status_data.pop("orient_up"), name="orientation") + ] # Orientation detection - orient_status = {0: 'fixed', 1: 'auto_UD', 3: 'AHRS-3D'} - outdat['attrs']['orient_status'] = orient_status[lib._collapse( - status_data.pop('auto_orientation'), name='orient_status')] + orient_status = {0: "fixed", 1: "auto_UD", 3: "AHRS-3D"} + outdat["attrs"]["orient_status"] = orient_status[ + lib._collapse(status_data.pop("auto_orientation"), name="orient_status") + ] # Status variables - for ky in ['low_volt_skip', 'active_config', 'telemetry_data', 'boost_running']: - outdat['data_vars'][ky] = status_data[ky].astype('uint8') + for ky in ["low_volt_skip", "active_config", "telemetry_data", "boost_running"]: + outdat["data_vars"][ky] = status_data[ky].astype("uint8") # Processor idle state - need to save as 1/0 per netcdf attribute limitations for ky in status0_data: - outdat['attrs'][ky] = lib._collapse( - status0_data[ky].astype('uint8'), name=ky) + outdat["attrs"][ky] = lib._collapse(status0_data[ky].astype("uint8"), name=ky) - # Remove status0 variables - keep status variables as they useful for finding missing pings - [outdat['data_vars'].pop(var) for var in status0_vars] + # Remove status0 variables - keep status variables as they are useful for finding missing pings + [outdat["data_vars"].pop(var) for var in status0_vars] # Set coordinate system if 21 not in dat: - cfg['rotate_vars'] = [] - cy = cfg['coord_sys_axes_avg'] + cfg["rotate_vars"] = [] + cy = cfg["coord_sys_axes_avg"] else: - cfg['rotate_vars'] = ['vel', ] - cy = cfg['coord_sys_axes'] - outdat['attrs']['coord_sys'] = {'XYZ': 'inst', - 'ENU': 'earth', - 'beam': 'beam'}[cy] + cfg["rotate_vars"] = [ + "vel", + ] + cy = cfg["coord_sys_axes"] + outdat["attrs"]["coord_sys"] = {"XYZ": "inst", "ENU": "earth", "beam": "beam"}[cy] # Copy appropriate vars to rotate_vars 
- for ky in ['accel', 'angrt', 'mag']: - for dky in outdat['data_vars'].keys(): - if dky == ky or dky.startswith(ky + '_'): - outdat['attrs']['rotate_vars'].append(dky) - if 'vel_bt' in outdat['data_vars']: - outdat['attrs']['rotate_vars'].append('vel_bt') - if 'vel_avg' in outdat['data_vars']: - outdat['attrs']['rotate_vars'].append('vel_avg') + for ky in ["accel", "angrt", "mag"]: + for dky in outdat["data_vars"].keys(): + if dky == ky or dky.startswith(ky + "_"): + outdat["attrs"]["rotate_vars"].append(dky) + if "vel_bt" in outdat["data_vars"]: + outdat["attrs"]["rotate_vars"].append("vel_bt") + if "vel_avg" in outdat["data_vars"]: + outdat["attrs"]["rotate_vars"].append("vel_avg") return outdat +def _clean_dp_skips(data): + """ + Removes zeros from interwoven measurements taken in a dual profile + configuration. + """ + + for id in data: + if id == "filehead_config": + continue + # Check where 'ver' is zero (should be 1 (for bt) or 3 (everything else)) + skips = np.where(data[id]["ver"] != 0) + for var in data[id]: + if var not in ["units", "long_name", "standard_name"]: + data[id][var] = np.squeeze(data[id][var][..., skips], axis=-2) + + def _reduce(data): - """This function takes the output from `reorg`, and further simplifies the + """ + This function takes the output from `reorg`, and further simplifies the data. Mostly this is combining system, environmental, and orientation data --- from different data structures within the same ensemble --- by averaging. 
""" - - dv = data['data_vars'] - dc = data['coords'] - da = data['attrs'] + + dv = data["data_vars"] + dc = data["coords"] + da = data["attrs"] # Average these fields - for ky in ['c_sound', 'temp', 'pressure', - 'temp_press', 'temp_clock', 'batt']: - lib._reduce_by_average(dv, ky, ky + '_b5') + for ky in ["c_sound", "temp", "pressure", "temp_press", "temp_clock", "batt"]: + lib._reduce_by_average(dv, ky, ky + "_b5") # Angle-averaging is treated separately - for ky in ['heading', 'pitch', 'roll']: - lib._reduce_by_average_angle(dv, ky, ky + '_b5') - - if 'vel' in dv: - dc['range'] = ((np.arange(dv['vel'].shape[1])+1) * - da['cell_size'] + - da['blank_dist']) - da['fs'] = da['filehead_config']['BURST']['SR'] - tmat = da['filehead_config']['XFBURST'] - if 'vel_avg' in dv: - dc['range_avg'] = ((np.arange(dv['vel_avg'].shape[1])+1) * - da['cell_size_avg'] + - da['blank_dist_avg']) - dv['orientmat'] = dv.pop('orientmat_avg') - tmat = da['filehead_config']['XFAVG'] - da['fs'] = da['filehead_config']['PLAN']['MIAVG'] - da['avg_interval_sec'] = da['filehead_config']['AVG']['AI'] - da['bandwidth'] = da['filehead_config']['AVG']['BW'] - if 'vel_b5' in dv: - dc['range_b5'] = ((np.arange(dv['vel_b5'].shape[1])+1) * - da['cell_size_b5'] + - da['blank_dist_b5']) - if 'echo_echo' in dv: - dv['echo'] = dv.pop('echo_echo') - dc['range_echo'] = ((np.arange(dv['echo'].shape[0])+1) * - da['cell_size_echo'] + - da['blank_dist_echo']) - - if 'orientmat' in data['data_vars']: - da['has_imu'] = 1 # logical + for ky in ["heading", "pitch", "roll"]: + lib._reduce_by_average_angle(dv, ky, ky + "_b5") + + if "vel" in dv: + dc["range"] = (np.arange(dv["vel"].shape[1]) + 1) * da["cell_size"] + da[ + "blank_dist" + ] + da["fs"] = da["filehead_config"]["BURST"]["SR"] + tmat = da["filehead_config"]["XFBURST"] + if "vel_avg" in dv: + dc["range_avg"] = (np.arange(dv["vel_avg"].shape[1]) + 1) * da[ + "cell_size_avg" + ] + da["blank_dist_avg"] + if "orientmat" not in dv: + dv["orientmat"] = 
dv.pop("orientmat_avg") + tmat = da["filehead_config"]["XFAVG"] + da["fs"] = da["filehead_config"]["PLAN"]["MIAVG"] + da["avg_interval_sec"] = da["filehead_config"]["AVG"]["AI"] + da["bandwidth"] = da["filehead_config"]["AVG"]["BW"] + if "vel_b5" in dv: + # vel_b5 is sometimes shape 2 and sometimes shape 3 + dc["range_b5"] = (np.arange(dv["vel_b5"].shape[-2]) + 1) * da[ + "cell_size_b5" + ] + da["blank_dist_b5"] + if "echo_echo" in dv: + dv["echo"] = dv.pop("echo_echo") + dc["range_echo"] = (np.arange(dv["echo"].shape[0]) + 1) * da[ + "cell_size_echo" + ] + da["blank_dist_echo"] + + if "orientmat" in data["data_vars"]: + da["has_imu"] = 1 # logical # Signature AHRS rotation matrix returned in "inst->earth" # Change to dolfyn's "earth->inst" - dv['orientmat'] = np.rollaxis(dv['orientmat'], 1) + dv["orientmat"] = np.rollaxis(dv["orientmat"], 1) else: - da['has_imu'] = 0 - - theta = da['filehead_config']['BEAMCFGLIST'][0] - if 'THETA=' in theta: - da['beam_angle'] = int(theta[13:15]) - - tm = np.zeros((tmat['ROWS'], tmat['COLS']), dtype=np.float32) - for irow in range(tmat['ROWS']): - for icol in range(tmat['COLS']): - tm[irow, icol] = tmat['M' + str(irow + 1) + str(icol + 1)] - dv['beam2inst_orientmat'] = tm + da["has_imu"] = 0 + + theta = da["filehead_config"]["BEAMCFGLIST"][0] + if "THETA=" in theta: + da["beam_angle"] = int(theta[13:15]) + + tm = np.zeros((tmat["ROWS"], tmat["COLS"]), dtype=np.float32) + for irow in range(tmat["ROWS"]): + for icol in range(tmat["COLS"]): + tm[irow, icol] = tmat["M" + str(irow + 1) + str(icol + 1)] + dv["beam2inst_orientmat"] = tm # If burst velocity isn't used, need to copy one for 'time' - if 'time' not in dc: + if "time" not in dc: for val in dc: - if 'time' in val: + if "time" in val: time = val - dc['time'] = dc[time] + dc["time"] = dc[time] + + +def split_dp_datasets(ds): + """ + Splits a dataset containing dual profiles into individual profiles + """ + + # Figure out which variables belong to which profile based on length of 
time variables + t_dict = {} + for t in ds.coords: + if "time" in t: + t_dict[t] = ds[t].size + + other_coords = [] + for key, val in t_dict.items(): + if val != t_dict["time"]: + if key.endswith("altraw"): + # altraw goes with burst, altraw_avg goes with avg + continue + other_coords.append(key) + # Fetch variables, coordinates, and attrs for second profiling configuration + other_vars = [ + v for v in ds.data_vars if any(x in ds[v].coords for x in other_coords) + ] + other_tags = [s.split("_")[-1] for s in other_coords] + other_coords += [v for v in ds.coords if any(x in v for x in other_tags)] + other_attrs = [s for s in ds.attrs if any(x in s for x in other_tags)] + critical_attrs = [ + "inst_model", + "inst_make", + "inst_type", + "fs", + "orientation", + "orient_status", + "has_imu", + "beam_angle", + ] + + # Create second dataset + ds2 = type(ds)() + for a in other_attrs + critical_attrs: + ds2.attrs[a] = ds.attrs[a] + for v in other_vars: + ds2[v] = ds[v] + # Set rotate_vars + rotate_vars2 = [v for v in ds.attrs["rotate_vars"] if v in other_vars] + ds2.attrs["rotate_vars"] = rotate_vars2 + # Set orientation matricies + ds2["beam2inst_orientmat"] = ds["beam2inst_orientmat"] + ds2 = ds2.rename({"orientmat_" + other_tags[0]: "orientmat"}) + # Set original coordinate system + cy = ds2.attrs["coord_sys_axes_" + other_tags[0]] + ds2.attrs["coord_sys"] = {"XYZ": "inst", "ENU": "earth", "beam": "beam"}[cy] + ds2 = _set_coords(ds2, ref_frame=ds2.coord_sys) + + # Clean up first dataset + [ds.attrs.pop(ky) for ky in other_attrs] + ds = ds.drop_vars(other_vars + other_coords) + for itm in rotate_vars2: + ds.attrs["rotate_vars"].remove(itm) + + return ds, ds2 diff --git a/mhkit/dolfyn/io/nortek2_defs.py b/mhkit/dolfyn/io/nortek2_defs.py index 6b9b1d8f2..82723545c 100644 --- a/mhkit/dolfyn/io/nortek2_defs.py +++ b/mhkit/dolfyn/io/nortek2_defs.py @@ -4,15 +4,15 @@ from . 
import nortek2_lib as lib -dt32 = 'float32' +dt32 = "float32" grav = 9.81 # The starting value for the checksum: -cs0 = int('0xb58c', 0) +cs0 = int("0xb58c", 0) def _nans(*args, **kwargs): out = np.empty(*args, **kwargs) - if out.dtype.kind == 'f': + if out.dtype.kind == "f": out[:] = np.NaN else: out[:] = 0 @@ -20,15 +20,15 @@ def _nans(*args, **kwargs): def _format(form, N): - out = '' + out = "" for f, n in zip(form, N): if n > 1: - out += '{}'.format(n) + out += "{}".format(n) out += f return out -class _DataDef(): +class _DataDef: def __init__(self, list_of_defs): self._names = [] self._format = [] @@ -46,22 +46,22 @@ def __init__(self, list_of_defs): if len(itm) > 4: self._units.append(itm[4]) else: - self._units.append('1') + self._units.append("1") if len(itm) > 5: self._long_name.append(itm[5]) else: - self._long_name.append('') + self._long_name.append("") if len(itm) > 6: self._standard_name.append(itm[6]) else: - self._standard_name.append('') + self._standard_name.append("") if itm[2] == []: self._N.append(1) else: self._N.append(int(np.prod(itm[2]))) - self._struct = Struct('<' + self.format) + self._struct = Struct("<" + self.format) self.nbyte = self._struct.size - self._cs_struct = Struct('<' + '{}H'.format(int(self.nbyte // 2))) + self._cs_struct = Struct("<" + "{}H".format(int(self.nbyte // 2))) def init_data(self, npings): out = {} @@ -80,7 +80,9 @@ def read_into(self, fobj, data, ens, cs=None): data[nm][..., ens] = np.asarray(d).reshape(shp) @property - def format(self, ): + def format( + self, + ): return _format(self._format, self._N) def read(self, fobj, cs=None): @@ -99,24 +101,22 @@ def read(self, fobj, cs=None): off = cs0 cs_res = sum(self._cs_struct.unpack(bytes)) + off if csval is not False and (cs_res % 65536) != csval: - raise Exception('Checksum failed!') + raise Exception("Checksum failed!") out = [] c = 0 for idx, n in enumerate(self._N): if n == 1: out.append(data[c]) else: - out.append(data[c:(c + n)]) + out.append(data[c : (c + 
n)]) c += n return out def read2dict(self, fobj, cs=False): - return {self._names[idx]: dat - for idx, dat in enumerate(self.read(fobj, cs=cs))} + return {self._names[idx]: dat for idx, dat in enumerate(self.read(fobj, cs=cs))} def sci_data(self, data): - for ky, func in zip(self._names, - self._sci_func): + for ky, func in zip(self._names, self._sci_func): if func is None: continue data[ky] = func(data[ky]) @@ -140,7 +140,7 @@ def data_stdnames(self): return stdnms -class _LinFunc(): +class _LinFunc: """A simple linear offset and scaling object. Usage: @@ -165,129 +165,248 @@ def __call__(self, array): return array -header = _DataDef([ - ('sync', 'B', [], None), - ('hsz', 'B', [], None), - ('id', 'B', [], None), - ('fam', 'B', [], None), - ('sz', 'H', [], None), - ('cs', 'H', [], None), - ('hcs', 'H', [], None), -]) +header = _DataDef( + [ + ("sync", "B", [], None), + ("hsz", "B", [], None), + ("id", "B", [], None), + ("fam", "B", [], None), + ("sz", "H", [], None), + ("cs", "H", [], None), + ("hcs", "H", [], None), + ] +) _burst_hdr = [ - ('ver', 'B', [], None), - ('DatOffset', 'B', [], None), - ('config', 'H', [], None), - ('SerialNum', 'I', [], None), - ('year', 'B', [], None), - ('month', 'B', [], None), - ('day', 'B', [], None), - ('hour', 'B', [], None), - ('minute', 'B', [], None), - ('second', 'B', [], None), - ('usec100', 'H', [], None), - ('c_sound', 'H', [], _LinFunc(0.1, dtype=dt32), 'm s-1', - 'Speed of Sound', 'speed_of_sound_in_sea_water'), - ('temp', 'H', [], _LinFunc(0.01, dtype=dt32), - 'degree_C', 'Temperature', 'sea_water_temperature'), - ('pressure', 'I', [], _LinFunc(0.001, dtype=dt32), - 'dbar', 'Pressure', 'sea_water_pressure'), - ('heading', 'H', [], _LinFunc(0.01, dtype=dt32), - 'degree', 'Heading', 'platform_orientation'), - ('pitch', 'h', [], _LinFunc(0.01, dtype=dt32), - 'degree', 'Pitch', 'platform_pitch'), - ('roll', 'h', [], _LinFunc(0.01, dtype=dt32), 'degree', 'Roll', 'platform_roll'), - ('beam_config', 'H', [], None), - 
('cell_size', 'H', [], _LinFunc(0.001), 'm'), - ('blank_dist', 'H', [], _LinFunc(0.01), 'm'), - ('nominal_corr', 'B', [], None, '%'), - ('temp_press', 'B', [], _LinFunc(0.2, -20, dtype=dt32), - 'degree_C', 'Pressure Sensor Temperature'), - ('batt', 'H', [], _LinFunc(0.1, dtype=dt32), - 'V', 'Battery Voltage', 'battery_voltage'), - ('mag', 'h', [3], _LinFunc(0.1, dtype=dt32), 'uT', 'Compass'), - ('accel', 'h', [3], _LinFunc(1. / 16384 * grav, dtype=dt32), - 'm s-2', 'Acceleration'), - ('ambig_vel', 'h', [], _LinFunc(0.001, dtype=dt32), 'm s-1'), - ('data_desc', 'H', [], None), - ('xmit_energy', 'H', [], None, 'dB', 'Sound Pressure Level of Acoustic Signal'), - ('vel_scale', 'b', [], None), - ('power_level_dB', 'b', [], _LinFunc(dtype=dt32), 'dB', 'Power Level'), - ('temp_mag', 'h', [], None), # uncalibrated - ('temp_clock', 'h', [], _LinFunc(0.01, dtype=dt32), - 'degree_C', 'Internal Clock Temperature'), - ('error', 'H', [], None, '1', 'Error Code'), - ('status0', 'H', [], None, '1', 'Status 0 Code'), - ('status', 'I', [], None, '1', 'Status Code'), - ('_ensemble', 'I', [], None), + ("ver", "B", [], None), + ("DatOffset", "B", [], None), + ("config", "H", [], None), + ("SerialNum", "I", [], None), + ("year", "B", [], None), + ("month", "B", [], None), + ("day", "B", [], None), + ("hour", "B", [], None), + ("minute", "B", [], None), + ("second", "B", [], None), + ("usec100", "H", [], None), + ( + "c_sound", + "H", + [], + _LinFunc(0.1, dtype=dt32), + "m s-1", + "Speed of Sound", + "speed_of_sound_in_sea_water", + ), + ( + "temp", + "h", + [], + _LinFunc(0.01, dtype=dt32), + "degree_C", + "Temperature", + "sea_water_temperature", + ), + ( + "pressure", + "I", + [], + _LinFunc(0.001, dtype=dt32), + "dbar", + "Pressure", + "sea_water_pressure", + ), + ( + "heading", + "H", + [], + _LinFunc(0.01, dtype=dt32), + "degree", + "Heading", + "platform_orientation", + ), + ("pitch", "h", [], _LinFunc(0.01, dtype=dt32), "degree", "Pitch", "platform_pitch"), + ("roll", "h", [], 
_LinFunc(0.01, dtype=dt32), "degree", "Roll", "platform_roll"), + ("beam_config", "H", [], None), + ("cell_size", "H", [], _LinFunc(0.001), "m"), + ("blank_dist", "H", [], _LinFunc(0.01), "m"), + ("nominal_corr", "B", [], None, "%"), + ( + "temp_press", + "b", + [], + _LinFunc(0.2, -20, dtype=dt32), + "degree_C", + "Pressure Sensor Temperature", + ), + ( + "batt", + "H", + [], + _LinFunc(0.1, dtype=dt32), + "V", + "Battery Voltage", + "battery_voltage", + ), + ("mag", "h", [3], _LinFunc(0.1, dtype=dt32), "uT", "Compass"), + ( + "accel", + "h", + [3], + _LinFunc(1.0 / 16384 * grav, dtype=dt32), + "m s-2", + "Acceleration", + ), + ("ambig_vel", "h", [], _LinFunc(0.001, dtype=dt32), "m s-1"), + ("data_desc", "H", [], None), + ("xmit_energy", "H", [], None, "dB", "Sound Pressure Level of Acoustic Signal"), + ("vel_scale", "b", [], None), + ("power_level_dB", "b", [], _LinFunc(dtype=dt32), "dB", "Power Level"), + ("temp_mag", "h", [], None), # uncalibrated + ( + "temp_clock", + "h", + [], + _LinFunc(0.01, dtype=dt32), + "degree_C", + "Internal Clock Temperature", + ), + ("error", "H", [], None, "1", "Error Code"), + ("status0", "H", [], None, "1", "Status 0 Code"), + ("status", "I", [], None, "1", "Status Code"), + ("_ensemble", "I", [], None), ] _bt_hdr = [ - ('ver', 'B', [], None), - ('DatOffset', 'B', [], None), - ('config', 'H', [], None), - ('SerialNum', 'I', [], None), - ('year', 'B', [], None), - ('month', 'B', [], None), - ('day', 'B', [], None), - ('hour', 'B', [], None), - ('minute', 'B', [], None), - ('second', 'B', [], None), - ('usec100', 'H', [], None), - ('c_sound', 'H', [], _LinFunc(0.1, dtype=dt32), 'm s-1', - 'Speed of Sound', 'speed_of_sound_in_sea_water'), - ('temp', 'H', [], _LinFunc(0.01, dtype=dt32), - 'degree_C', 'Temperature', 'sea_water_temperature'), - ('pressure', 'I', [], _LinFunc(0.001, dtype=dt32), - 'dbar', 'Pressure', 'sea_water_pressure'), - ('heading', 'H', [], _LinFunc(0.01, dtype=dt32), - 'degree', 'Heading', 'platform_orientation'), 
- ('pitch', 'h', [], _LinFunc(0.01, dtype=dt32), - 'degree', 'Pitch', 'platform_pitch'), - ('roll', 'h', [], _LinFunc(0.01, dtype=dt32), 'degree', 'Roll', 'platform_roll'), - ('beam_config', 'H', [], None), - ('cell_size', 'H', [], _LinFunc(0.001), 'm'), - ('blank_dist', 'H', [], _LinFunc(0.01), 'm'), - ('nominal_corr', 'B', [], None, '%'), - ('unused', 'B', [], None), - ('batt', 'H', [], _LinFunc(0.1, dtype=dt32), - 'V', 'Battery Voltage', 'battery_voltage'), - ('mag', 'h', [3], None, 'uT', 'Compass'), - ('accel', 'h', [3], _LinFunc(1. / 16384 * grav, dtype=dt32), - 'm s-2', 'Acceleration', ''), - ('ambig_vel', 'I', [], _LinFunc(0.001, dtype=dt32), 'm s-1'), - ('data_desc', 'H', [], None), - ('xmit_energy', 'H', [], None, 'dB', 'Sound Pressure Level of Acoustic Signal'), - ('vel_scale', 'b', [], None), - ('power_level_dB', 'b', [], _LinFunc(dtype=dt32), 'dB'), - ('temp_mag', 'h', [], None), # uncalibrated - ('temp_clock', 'h', [], _LinFunc(0.01, dtype=dt32), - 'degree_C', 'Internal Clock Temperature'), - ('error', 'I', [], None, '1', 'Error Code'), - ('status', 'I', [], None, '1', 'Status Code'), - ('_ensemble', 'I', [], None), + ("ver", "B", [], None), + ("DatOffset", "B", [], None), + ("config", "H", [], None), + ("SerialNum", "I", [], None), + ("year", "B", [], None), + ("month", "B", [], None), + ("day", "B", [], None), + ("hour", "B", [], None), + ("minute", "B", [], None), + ("second", "B", [], None), + ("usec100", "H", [], None), + ( + "c_sound", + "H", + [], + _LinFunc(0.1, dtype=dt32), + "m s-1", + "Speed of Sound", + "speed_of_sound_in_sea_water", + ), + ( + "temp", + "h", + [], + _LinFunc(0.01, dtype=dt32), + "degree_C", + "Temperature", + "sea_water_temperature", + ), + ( + "pressure", + "I", + [], + _LinFunc(0.001, dtype=dt32), + "dbar", + "Pressure", + "sea_water_pressure", + ), + ( + "heading", + "H", + [], + _LinFunc(0.01, dtype=dt32), + "degree", + "Heading", + "platform_orientation", + ), + ("pitch", "h", [], _LinFunc(0.01, dtype=dt32), "degree", 
"Pitch", "platform_pitch"), + ("roll", "h", [], _LinFunc(0.01, dtype=dt32), "degree", "Roll", "platform_roll"), + ("beam_config", "H", [], None), + ("cell_size", "H", [], _LinFunc(0.001), "m"), + ("blank_dist", "H", [], _LinFunc(0.01), "m"), + ("nominal_corr", "B", [], None, "%"), + ("unused", "B", [], None), + ( + "batt", + "H", + [], + _LinFunc(0.1, dtype=dt32), + "V", + "Battery Voltage", + "battery_voltage", + ), + ("mag", "h", [3], None, "uT", "Compass"), + ( + "accel", + "h", + [3], + _LinFunc(1.0 / 16384 * grav, dtype=dt32), + "m s-2", + "Acceleration", + "", + ), + ("ambig_vel", "I", [], _LinFunc(0.001, dtype=dt32), "m s-1"), + ("data_desc", "H", [], None), + ("xmit_energy", "H", [], None, "dB", "Sound Pressure Level of Acoustic Signal"), + ("vel_scale", "b", [], None), + ("power_level_dB", "b", [], _LinFunc(dtype=dt32), "dB"), + ("temp_mag", "h", [], None), # uncalibrated + ( + "temp_clock", + "h", + [], + _LinFunc(0.01, dtype=dt32), + "degree_C", + "Internal Clock Temperature", + ), + ("error", "I", [], None, "1", "Error Code"), + ("status", "I", [], None, "1", "Status Code"), + ("_ensemble", "I", [], None), ] _ahrs_def = [ - ('orientmat', 'f', [3, 3], None, '1', 'Orientation Matrix'), - ('quaternions', 'f', [4], None, '1', 'Quaternions'), - ('angrt', 'f', [3], _LinFunc(np.pi / 180, dtype=dt32), 'rad s-1', 'Angular Velocity'), + ("orientmat", "f", [3, 3], None, "1", "Orientation Matrix"), + ("quaternions", "f", [4], None, "1", "Quaternions"), + ( + "angrt", + "f", + [3], + _LinFunc(np.pi / 180, dtype=dt32), + "rad s-1", + "Angular Velocity", + ), ] def _calc_bt_struct(config, nb): - flags = lib._headconfig_int2dict(config, mode='bt') + flags = lib._headconfig_int2dict(config, mode="bt") dd = copy(_bt_hdr) - if flags['vel']: + if flags["vel"]: # units handled in Ad2cpReader.sci_data - dd.append(('vel', 'i', [nb], None, 'm s-1', 'Platform Velocity from Bottom Track')) - if flags['dist']: - dd.append(('dist', 'i', [nb], _LinFunc(0.001, dtype=dt32), 'm', 
'Bottom Track Measured Depth')) - if flags['fom']: - dd.append(('fom', 'H', [nb], None, '1', 'Figure of Merit')) - if flags['ahrs']: + dd.append( + ("vel", "i", [nb], None, "m s-1", "Platform Velocity from Bottom Track") + ) + if flags["dist"]: + dd.append( + ( + "dist", + "i", + [nb], + _LinFunc(0.001, dtype=dt32), + "m", + "Bottom Track Measured Depth", + ) + ) + if flags["fom"]: + dd.append(("fom", "H", [nb], None, "1", "Figure of Merit")) + if flags["ahrs"]: dd += _ahrs_def return _DataDef(dd) @@ -295,14 +414,27 @@ def _calc_bt_struct(config, nb): def _calc_echo_struct(config, nc): flags = lib._headconfig_int2dict(config) dd = copy(_burst_hdr) - dd[19] = ('blank_dist', 'H', [], _LinFunc(0.001)) # m - if any([flags[nm] for nm in ['vel', 'amp', 'corr', 'alt', 'ast', - 'alt_raw', 'p_gd', 'std']]): + dd[19] = ("blank_dist", "H", [], _LinFunc(0.001)) # m + if any( + [ + flags[nm] + for nm in ["vel", "amp", "corr", "le", "ast", "altraw", "p_gd", "std"] + ] + ): raise Exception("Echosounder ping contains invalid data?") - if flags['echo']: - dd += [('echo', 'H', [nc], _LinFunc(0.01, dtype=dt32), 'dB', - 'Echo Sounder Acoustic Signal Backscatter', 'acoustic_target_strength_in_sea_water')] - if flags['ahrs']: + if flags["echo"]: + dd += [ + ( + "echo", + "H", + [nc], + _LinFunc(0.01, dtype=dt32), + "dB", + "Echo Sounder Acoustic Signal Backscatter", + "acoustic_target_strength_in_sea_water", + ) + ] + if flags["ahrs"]: dd += _ahrs_def return _DataDef(dd) @@ -310,53 +442,157 @@ def _calc_echo_struct(config, nc): def _calc_burst_struct(config, nb, nc): flags = lib._headconfig_int2dict(config) dd = copy(_burst_hdr) - if flags['echo']: + if flags["echo"]: raise Exception("Echosounder data found in velocity ping?") - if flags['vel']: - dd.append(('vel', 'h', [nb, nc], None, 'm s-1', 'Water Velocity')) - if flags['amp']: - dd.append(('amp', 'B', [nb, nc], _LinFunc(0.5, dtype=dt32), '1', 'Acoustic Signal Amplitude', - 
'signal_intensity_from_multibeam_acoustic_doppler_velocity_sensor_in_sea_water')) - if flags['corr']: - dd.append(('corr', 'B', [nb, nc], None, '%', 'Acoustic Signal Correlation', - 'beam_consistency_indicator_from_multibeam_acoustic_doppler_velocity_profiler_in_sea_water')) - if flags['alt']: + if flags["vel"]: + dd.append(("vel", "h", [nb, nc], None, "m s-1", "Water Velocity")) + if flags["amp"]: + dd.append( + ( + "amp", + "B", + [nb, nc], + _LinFunc(0.5, dtype=dt32), + "1", + "Acoustic Signal Amplitude", + "signal_intensity_from_multibeam_acoustic_doppler_velocity_sensor_in_sea_water", + ) + ) + if flags["corr"]: + dd.append( + ( + "corr", + "B", + [nb, nc], + None, + "%", + "Acoustic Signal Correlation", + "beam_consistency_indicator_from_multibeam_acoustic_doppler_velocity_profiler_in_sea_water", + ) + ) + if flags["le"]: # There may be a problem here with reading 32bit floats if # nb and nc are odd - dd += [('alt_dist', 'f', [], _LinFunc(dtype=dt32), 'm', 'Altimeter Range', 'altimeter_range'), - ('alt_quality', 'H', [], _LinFunc(0.01, dtype=dt32), '1', 'Altimeter Quality Indicator'), - ('alt_status', 'H', [], None, '1', 'Altimeter Status')] - if flags['ast']: dd += [ - ('ast_dist', 'f', [], _LinFunc(dtype=dt32), 'm', 'Acoustic Surface Tracking Range'), - ('ast_quality', 'H', [], _LinFunc(0.01, dtype=dt32), '1', - 'Acoustic Surface Tracking Quality Indicator'), - ('ast_offset_time', 'h', [], _LinFunc(0.0001, dtype=dt32), - 's', 'Acoustic Surface Tracking Time Offset to Velocity Ping'), - ('ast_pressure', 'f', [], None, 'dbar', 'Pressure measured during AST ping', - 'sea_water_pressure'), - ('ast_spare', 'B7x', [], None), + ( + "le_dist_alt", + "f", + [], + _LinFunc(dtype=dt32), + "m", + "Altimeter Range Leading Edge Algorithm", + "altimeter_range", + ), + ( + "le_quality_alt", + "H", + [], + _LinFunc(0.01, dtype=dt32), + "dB", + "Altimeter Quality Indicator Leading Edge Algorithm", + ), + ("status_alt", "H", [], None, "1", "Altimeter Status"), + ] + if 
flags["ast"]: + dd += [ + ( + "ast_dist_alt", + "f", + [], + _LinFunc(dtype=dt32), + "m", + "Altimeter Range Acoustic Surface Tracking", + "altimeter_range", + ), + ( + "ast_quality_alt", + "H", + [], + _LinFunc(0.01, dtype=dt32), + "dB", + "Altimeter Quality Indicator Acoustic Surface Tracking", + ), + ( + "ast_offset_time_alt", + "h", + [], + _LinFunc(0.0001, dtype=dt32), + "s", + "Acoustic Surface Tracking Time Offset to Velocity Ping", + ), + ( + "pressure_alt", + "f", + [], + None, + "dbar", + "Pressure measured during AST ping", + "sea_water_pressure", + ), + # This use of 'x' here is a hack + ("spare", "B7x", [], None), ] - if flags['alt_raw']: + if flags["altraw"]: dd += [ - ('altraw_nsamp', 'I', [], None, '1', 'Number of Altimeter Samples'), - ('altraw_dsamp', 'H', [], _LinFunc(0.0001, dtype=dt32), 'm', - 'Altimeter Distance between Samples'), - ('altraw_samp', 'h', [], None), + ("nsamp_alt", "I", [], None, "1", "Number of Altimeter Samples"), + ( + "dsamp_alt", + "H", + [], + _LinFunc(0.0001, dtype=dt32), + "m", + "Altimeter Distance between Samples", + ), + ("samp_alt", "h", [], None, "1", "Altimeter Samples"), ] - if flags['ahrs']: + if flags["ahrs"]: dd += _ahrs_def - if flags['p_gd']: - dd += [('percent_good', 'B', [nc], None, '%', 'Percent Good', - 'proportion_of_acceptable_signal_returns_from_acoustic_instrument_in_sea_water')] - if flags['std']: - dd += [('pitch_std', 'h', [], - _LinFunc(0.01, dtype=dt32), 'degree', 'Pitch Standard Deviation'), - ('roll_std', 'h', [], - _LinFunc(0.01, dtype=dt32), 'degree', 'Roll Standard Deviation'), - ('heading_std', 'h', [], - _LinFunc(0.01, dtype=dt32), 'degree', 'Heading Standard Deviation'), - ('press_std', 'h', [], - _LinFunc(0.1, dtype=dt32), 'dbar', 'Pressure Standard Deviation'), - ('std_spare', 'H22x', [], None)] + if flags["p_gd"]: + dd += [ + ( + "percent_good", + "B", + [nc], + None, + "%", + "Percent Good", + "proportion_of_acceptable_signal_returns_from_acoustic_instrument_in_sea_water", + ) + ] + 
if flags["std"]: + dd += [ + ( + "pitch_std", + "h", + [], + _LinFunc(0.01, dtype=dt32), + "degree", + "Pitch Standard Deviation", + ), + ( + "roll_std", + "h", + [], + _LinFunc(0.01, dtype=dt32), + "degree", + "Roll Standard Deviation", + ), + ( + "heading_std", + "h", + [], + _LinFunc(0.01, dtype=dt32), + "degree", + "Heading Standard Deviation", + ), + ( + "press_std", + "h", + [], + _LinFunc(0.1, dtype=dt32), + "dbar", + "Pressure Standard Deviation", + ), + ("std_spare", "H22x", [], None), + ] return _DataDef(dd) diff --git a/mhkit/dolfyn/io/nortek2_lib.py b/mhkit/dolfyn/io/nortek2_lib.py index f3575b6e6..3336651f5 100644 --- a/mhkit/dolfyn/io/nortek2_lib.py +++ b/mhkit/dolfyn/io/nortek2_lib.py @@ -26,9 +26,13 @@ def _reduce_by_average_angle(data, ky0, ky1, degrees=True): rad_fact = 1 if ky1 in data: if ky0 in data: - data[ky0] = np.angle( - np.exp(1j * data.pop(ky0) * rad_fact) + - np.exp(1j * data.pop(ky1) * rad_fact)) / rad_fact + data[ky0] = ( + np.angle( + np.exp(1j * data.pop(ky0) * rad_fact) + + np.exp(1j * data.pop(ky1) * rad_fact) + ) + / rad_fact + ) else: data[ky0] = data.pop(ky1) @@ -36,56 +40,65 @@ def _reduce_by_average_angle(data, ky0, ky1, degrees=True): # This is the data-type of the index file. # This must match what is written-out by the create_index function. _index_version = 1 -_hdr = struct.Struct(' 60) # This probably indicates a corrupted byte, so we just insert None. 
@@ -94,113 +107,174 @@ def _calc_time(year, month, day, hour, minute, second, usec, zero_is_bad=True): return dt -def _create_index(infile, outfile, N_ens, debug): +def _create_index(infile, outfile, init_pos, eof, debug): logging = getLogger() - print("Indexing {}...".format(infile), end='') - fin = open(_abspath(infile), 'rb') - fout = open(_abspath(outfile), 'wb') - fout.write(b'Index Ver:') - fout.write(struct.pack(' 0: - # Covers all id keys saved in "burst mode" - ens[idk] = last_ens[idk]+1 + if last_ens[idk] > 0: + if (ens[idk] == 1) or (ens[idk] < last_ens[idk]): + # Covers all id keys saved in "burst mode" + # Covers ID keys not saved in sequential order + ens[idk] = last_ens[idk] + 1 if last_ens[idk] > 0 and last_ens[idk] != ens[idk]: N[idk] += 1 - fout.write(struct.pack(' N_id)[0] + # Check if spacing is equal for dual profiling ADCPs + if dp: + skip_size = np.diff(ibad) + n_skip, count = np.unique(skip_size, return_counts=True) + # If multiple skips are of the same size, assume okay + for n, c in zip(n_skip, count): + if c > 1: + skip_size[skip_size == n] = 0 + # assume last "ibad" element is always good for dp's + mask = np.append(skip_size, 0).astype(bool) if any(skip_size) else [] + ibad = ibad[mask] for ib in ibad: FLAG = True # The ping number reported here may not be quite right if # the ensemble count is wrong. - warnings.warn("Skipped ping (ID: {}) in file {} at ensemble {}." - .format(id, infile, idx['ens'][inds[ib + 1] - 1])) - hwe[inds[(ib + 1):]] += 1 - ens[inds[(ib + 1):]] += 1 - - # This block fixes skips that originate from before this file. 
- delta = max(hwe[:N_id]) - hwe[:N_id] - for d, id in zip(delta, idx['ID'][:N_id]): - if d != 0: - FLAG = True - hwe[id == idx['ID']] += d - ens[id == idx['ID']] += d + warnings.warn( + "Skipped ping (ID: {}) in file {} at ensemble {}.".format( + id, infile, idx["ens"][inds[ib + 1] - 1] + ) + ) + hwe[inds[(ib + 1) :]] += 1 + ens[inds[(ib + 1) :]] += 1 - if np.any(np.diff(ens) > 1) and FLAG: - idx['ens'] = np.unwrap(hwe.astype(np.int64), period=period) - hwe[0] + return dp def _boolarray_firstensemble_ping(index): """ - Return a boolean of the index that indicates only the first ping in + Return a boolean of the index that indicates only the first ping in each ensemble. """ - dens = np.ones(index['ens'].shape, dtype='bool') - dens[1:] = np.diff(index['ens']) != 0 + dens = np.ones(index["ens"].shape, dtype="bool") + dens[1:] = np.diff(index["ens"]) != 0 return dens -def get_index(infile, reload=False, debug=False): +def get_index(infile, pos=0, eof=2**32, rebuild=False, debug=False, dp=False): """ This function reads ad2cp.index files @@ -219,21 +293,21 @@ def get_index(infile, reload=False, debug=False): Tuple containing info held within index file """ - index_file = infile + '.index' - if not path.isfile(index_file) or reload: - _create_index(infile, index_file, 2 ** 32, debug) - f = open(_abspath(index_file), 'rb') + index_file = infile + ".index" + if not path.isfile(index_file) or rebuild or debug: + _create_index(infile, index_file, pos, eof, debug) + f = open(_abspath(index_file), "rb") file_head = f.read(12) - if file_head[:10] == b'Index Ver:': - index_ver = struct.unpack('> n) & 1) -def _headconfig_int2dict(val, mode='burst'): +def _headconfig_int2dict(val, mode="burst"): """ Convert the burst Configuration bit-mask to a dict of bools. @@ -330,7 +408,7 @@ def _headconfig_int2dict(val, mode='burst'): For 'burst' configs, or 'bottom-track' configs. 
""" - if (mode == 'burst') or (mode == 'avg'): + if (mode == "burst") or (mode == "avg"): return dict( press_valid=_getbit(val, 0), temp_valid=_getbit(val, 1), @@ -340,8 +418,8 @@ def _headconfig_int2dict(val, mode='burst'): vel=_getbit(val, 5), amp=_getbit(val, 6), corr=_getbit(val, 7), - alt=_getbit(val, 8), - alt_raw=_getbit(val, 9), + le=_getbit(val, 8), + altraw=_getbit(val, 9), ast=_getbit(val, 10), echo=_getbit(val, 11), ahrs=_getbit(val, 12), @@ -349,7 +427,7 @@ def _headconfig_int2dict(val, mode='burst'): std=_getbit(val, 14), # bit 15 is unused ) - elif mode == 'bt': + elif mode == "bt": return dict( press_valid=_getbit(val, 0), temp_valid=_getbit(val, 1), @@ -371,9 +449,9 @@ def _status02data(val): bi = _BitIndexer(val) out = {} if any(bi[15]): # 'status0_in_use' - out['proc_idle_less_3pct'] = bi[0] - out['proc_idle_less_6pct'] = bi[1] - out['proc_idle_less_12pct'] = bi[2] + out["proc_idle_less_3pct"] = bi[0] + out["proc_idle_less_6pct"] = bi[1] + out["proc_idle_less_12pct"] = bi[2] return out @@ -383,18 +461,18 @@ def _status2data(val): # Integrators Guide (2017) bi = _BitIndexer(val) out = {} - out['wakeup_state'] = bi[28:32] - out['orient_up'] = bi[25:28] - out['auto_orientation'] = bi[22:25] - out['previous_wakeup_state'] = bi[18:22] - out['low_volt_skip'] = bi[17] - out['active_config'] = bi[16] - out['echo_index'] = bi[12:16] - out['telemetry_data'] = bi[11] - out['boost_running'] = bi[10] - out['echo_freq_bin'] = bi[5:10] + out["wakeup_state"] = bi[28:32] + out["orient_up"] = bi[25:28] + out["auto_orientation"] = bi[22:25] + out["previous_wakeup_state"] = bi[18:22] + out["low_volt_skip"] = bi[17] + out["active_config"] = bi[16] + out["echo_index"] = bi[12:16] + out["telemetry_data"] = bi[11] + out["boost_running"] = bi[10] + out["echo_freq_bin"] = bi[5:10] # 2,3,4 unused - out['bd_scaling'] = bi[1] # if True: cm scaling of blanking dist + out["bd_scaling"] = bi[1] # if True: cm scaling of blanking dist # 0 unused return out @@ -404,25 +482,26 @@ 
def _alt_status2data(val): # Integrators Guide (2017) bi = _BitIndexer(val) out = {} - out['tilt_over_5deg'] = bi[0] - out['tilt_over_10deg'] = bi[1] - out['multibeam_alt'] = bi[2] - out['n_beams_alt'] = bi[3:7] - out['power_level_idx_alt'] = bi[7:10] + out["tilt_over_5deg"] = bi[0] + out["tilt_over_10deg"] = bi[1] + out["multibeam_alt"] = bi[2] + out["n_beams_alt"] = bi[3:7] + out["power_level_idx_alt"] = bi[7:10] return out def _beams_cy_int2dict(val, id): - """Convert the beams/coordinate-system bytes to a dict of values. - """ + """Convert the beams/coordinate-system bytes to a dict of values.""" if id == 28: # 0x1C (echosounder) return dict(n_cells=val) - + elif id in [26, 31]: + return dict(n_cells=val & (2**10 - 1), cy="beam", n_beams=1) return dict( - n_cells=val & (2 ** 10 - 1), - cy=['ENU', 'XYZ', 'beam', None][val >> 10 & 3], - n_beams=val >> 12) + n_cells=val & (2**10 - 1), + cy=["ENU", "XYZ", "beam", None][val >> 10 & 3], + n_beams=val >> 12, + ) def _isuniform(vec, exclude=[]): @@ -442,8 +521,7 @@ def _collapse(vec, name=None, exclude=[]): elif _isuniform(vec, exclude=exclude): return list(set(np.unique(vec)) - set(exclude))[0] else: - uniq, idx, counts = np.unique( - vec, return_index=True, return_counts=True) + uniq, idx, counts = np.unique(vec, return_index=True, return_counts=True) if all(e == counts[0] for e in counts): val = max(vec) # pings saved out of order, but equal # of pings @@ -452,11 +530,14 @@ def _collapse(vec, name=None, exclude=[]): if not set(uniq) == set([0, val]) and set(counts) == set([1, np.max(counts)]): # warn when the 'wrong value' is not just a single zero. 
- warnings.warn("The variable {} is expected to be uniform, but it is not.\n" - "Values found: {} (counts: {}).\n" - "Using the most common value: {}".format( - name, list(uniq), list(counts), val)) - + warnings.warn( + "The variable {} is expected to be uniform, but it is not.\n" + "Values found: {} (counts: {}).\n" + "Using the most common value: {}".format( + name, list(uniq), list(counts), val + ) + ) + return val @@ -471,33 +552,41 @@ def _calc_config(index): A dict containing the key information for initializing arrays. """ - ids = np.unique(index['ID']) + ids = np.unique(index["ID"]) config = {} for id in ids: - if id not in [21, 22, 23, 24, 26, 28]: + if id not in [21, 22, 23, 24, 26, 28, 31]: continue if id == 23: - type = 'bt' - elif id == 22: - type = 'avg' + type = "bt" + elif (id == 22) or (id == 31): + type = "avg" else: - type = 'burst' - inds = index['ID'] == id - _config = index['config'][inds] - _beams_cy = index['beams_cy'][inds] + type = "burst" + inds = index["ID"] == id + _config = index["config"][inds] + _beams_cy = index["beams_cy"][inds] + # Check that these variables are consistent if not _isuniform(_config): - raise Exception("config are not identical for id: 0x{:X}." - .format(id)) + raise Exception("config are not identical for id: 0x{:X}.".format(id)) if not _isuniform(_beams_cy): - raise Exception("beams_cy are not identical for id: 0x{:X}." 
- .format(id)) + err = True + if id == 23: + # change in "n_cells" doesn't matter + lob = np.unique(_beams_cy) + beams = list(map(_beams_cy_int2dict, lob, 23 * np.ones(lob.size))) + if all([d["cy"] for d in beams]) and all([d["n_beams"] for d in beams]): + err = False + if err: + raise Exception("beams_cy are not identical for id: 0x{:X}.".format(id)) + # Now that we've confirmed they are the same: config[id] = _headconfig_int2dict(_config[0], mode=type) config[id].update(_beams_cy_int2dict(_beams_cy[0], id)) - config[id]['_config'] = _config[0] - config[id]['_beams_cy'] = _beams_cy[0] - config[id]['type'] = type - config[id].pop('cy', None) + config[id]["_config"] = _config[0] + config[id]["_beams_cy"] = _beams_cy[0] + config[id]["type"] = type + config[id].pop("cy", None) return config diff --git a/mhkit/dolfyn/io/nortek_defs.py b/mhkit/dolfyn/io/nortek_defs.py index 180af05eb..c3e6a9757 100644 --- a/mhkit/dolfyn/io/nortek_defs.py +++ b/mhkit/dolfyn/io/nortek_defs.py @@ -1,8 +1,9 @@ import numpy as np + nan = np.nan -class _VarAtts(): +class _VarAtts: """ A data variable attributes class. @@ -36,11 +37,21 @@ class _VarAtts(): A list of names for each dimension of the array. 
""" - def __init__(self, dims=[], dtype=None, group='data_vars', - view_type=None, default_val=None, - offset=0, factor=1, - title_name=None, units='1', dim_names=None, - long_name='', standard_name=''): + def __init__( + self, + dims=[], + dtype=None, + group="data_vars", + view_type=None, + default_val=None, + offset=0, + factor=1, + title_name=None, + units="1", + dim_names=None, + long_name="", + standard_name="", + ): self.dims = list(dims) if dtype is None: dtype = np.float32 @@ -66,7 +77,7 @@ def shape(self, **kwargs): if hit: return a else: - return self.dims + [kwargs['n']] + return self.dims + [kwargs["n"]] def _empty_array(self, **kwargs): out = np.zeros(self.shape(**kwargs), dtype=self.dtype) @@ -102,241 +113,431 @@ def sci_func(self, data): vec_data = { - 'AnaIn2LSB': _VarAtts(dims=[], - dtype=np.uint8, - group='sys', - ), - 'Count': _VarAtts(dims=[], - dtype=np.uint8, - group='sys', - units='1', - ), - 'PressureMSB': _VarAtts(dims=[], - dtype=np.uint8, - group='data_vars', - ), - 'AnaIn2MSB': _VarAtts(dims=[], - dtype=np.uint8, - group='sys', - ), - 'PressureLSW': _VarAtts(dims=[], - dtype=np.uint16, - group='data_vars', - ), - 'AnaIn1': _VarAtts(dims=[], - dtype=np.uint16, - group='sys', - ), - 'vel': _VarAtts(dims=[3], - dtype=np.float32, - group='data_vars', - factor=0.001, - default_val=nan, - units='m s-1', - long_name='Water Velocity', - ), - 'amp': _VarAtts(dims=[3], - dtype=np.uint8, - group='data_vars', - units='1', - long_name='Acoustic Signal Amplitude', - standard_name='signal_intensity_from_multibeam_acoustic_doppler_velocity_sensor_in_sea_water' - ), - 'corr': _VarAtts(dims=[3], - dtype=np.uint8, - group='data_vars', - units='%', - long_name='Acoustic Signal Correlation', - ), + "AnaIn2LSB": _VarAtts( + dims=[], + dtype=np.uint8, + group="sys", + ), + "Count": _VarAtts( + dims=[], + dtype=np.uint8, + group="sys", + units="1", + ), + "PressureMSB": _VarAtts( + dims=[], + dtype=np.uint8, + group="data_vars", + ), + "AnaIn2MSB": _VarAtts( + 
dims=[], + dtype=np.uint8, + group="sys", + ), + "PressureLSW": _VarAtts( + dims=[], + dtype=np.uint16, + group="data_vars", + ), + "AnaIn1": _VarAtts( + dims=[], + dtype=np.uint16, + group="sys", + ), + "vel": _VarAtts( + dims=[3], + dtype=np.float32, + group="data_vars", + factor=0.001, + default_val=nan, + units="m s-1", + long_name="Water Velocity", + ), + "amp": _VarAtts( + dims=[3], + dtype=np.uint8, + group="data_vars", + units="1", + long_name="Acoustic Signal Amplitude", + standard_name="signal_intensity_from_multibeam_acoustic_doppler_velocity_sensor_in_sea_water", + ), + "corr": _VarAtts( + dims=[3], + dtype=np.uint8, + group="data_vars", + units="%", + long_name="Acoustic Signal Correlation", + ), } vec_sysdata = { - 'time': _VarAtts(dims=[], - dtype=np.float64, - group='coords', - default_val=nan, - units='seconds since 1970-01-01 00:00:00', - long_name='Time', - standard_name='time', - ), - 'batt': _VarAtts(dims=[], - dtype=np.float32, - group='data_vars', - default_val=nan, - factor=0.1, - units='V', - long_name='Battery Voltage', - ), - 'c_sound': _VarAtts(dims=[], - dtype=np.float32, - group='data_vars', - default_val=nan, - factor=0.1, - units='m s-1', - long_name='Speed of Sound', - standard_name='speed_of_sound_in_sea_water', - ), - 'heading': _VarAtts(dims=[], - dtype=np.float32, - group='data_vars', - default_val=nan, - factor=0.1, - units='degree', - long_name='Heading', - standard_name='platform_orientation', - ), - 'pitch': _VarAtts(dims=[], - dtype=np.float32, - group='data_vars', - default_val=nan, - factor=0.1, - units='degree', - long_name='Pitch', - standard_name='platform_pitch', - ), - 'roll': _VarAtts(dims=[], - dtype=np.float32, - group='data_vars', - default_val=nan, - factor=0.1, - units='degree', - long_name='Roll', - standard_name='platform_roll' - ), - 'temp': _VarAtts(dims=[], - dtype=np.float32, - group='data_vars', - default_val=nan, - factor=0.01, - units='degree_C', - long_name='Temperature', - 
standard_name='sea_water_temperature', - ), - 'error': _VarAtts(dims=[], - dtype=np.uint8, - group='data_vars', - default_val=nan, - long_name='Error Code', - ), - 'status': _VarAtts(dims=[], - dtype=np.uint8, - group='data_vars', - default_val=nan, - long_name='Status Code' - ), - 'AnaIn': _VarAtts(dims=[], - dtype=np.float32, - group='sys', - default_val=nan, - ), - 'orientation_down': _VarAtts(dims=[], - dtype=bool, - group='data_vars', - default_val=nan, - long_name='Orientation of ADV Communication Cable' - ), + "time": _VarAtts( + dims=[], + dtype=np.float64, + group="coords", + default_val=nan, + units="seconds since 1970-01-01 00:00:00 UTC", + long_name="Time", + standard_name="time", + ), + "batt": _VarAtts( + dims=[], + dtype=np.float32, + group="data_vars", + default_val=nan, + factor=0.1, + units="V", + long_name="Battery Voltage", + ), + "c_sound": _VarAtts( + dims=[], + dtype=np.float32, + group="data_vars", + default_val=nan, + factor=0.1, + units="m s-1", + long_name="Speed of Sound", + standard_name="speed_of_sound_in_sea_water", + ), + "heading": _VarAtts( + dims=[], + dtype=np.float32, + group="data_vars", + default_val=nan, + factor=0.1, + units="degree", + long_name="Heading", + standard_name="platform_orientation", + ), + "pitch": _VarAtts( + dims=[], + dtype=np.float32, + group="data_vars", + default_val=nan, + factor=0.1, + units="degree", + long_name="Pitch", + standard_name="platform_pitch", + ), + "roll": _VarAtts( + dims=[], + dtype=np.float32, + group="data_vars", + default_val=nan, + factor=0.1, + units="degree", + long_name="Roll", + standard_name="platform_roll", + ), + "temp": _VarAtts( + dims=[], + dtype=np.float32, + group="data_vars", + default_val=nan, + factor=0.01, + units="degree_C", + long_name="Temperature", + standard_name="sea_water_temperature", + ), + "error": _VarAtts( + dims=[], + dtype=np.uint8, + group="data_vars", + default_val=nan, + long_name="Error Code", + ), + "status": _VarAtts( + dims=[], + dtype=np.uint8, + 
group="data_vars", + default_val=nan, + long_name="Status Code", + ), + "AnaIn": _VarAtts( + dims=[], + dtype=np.float32, + group="sys", + default_val=nan, + ), + "orientation_down": _VarAtts( + dims=[], + dtype=bool, + group="data_vars", + default_val=nan, + long_name="Orientation of ADV Communication Cable", + ), } awac_profile = { - 'time': _VarAtts(dims=[], - dtype=np.float64, - group='coords', - units='seconds since 1970-01-01 00:00:00', - long_name='Time', - standard_name='time', - ), - 'error': _VarAtts(dims=[], - dtype=np.uint16, - group='data_vars', - long_name='Error Code', - ), - 'AnaIn1': _VarAtts(dims=[], - dtype=np.float32, - group='sys', - default_val=nan, - units='n/a', - ), - 'batt': _VarAtts(dims=[], - dtype=np.float32, - group='data_vars', - default_val=nan, - factor=0.1, - units='V', - long_name='Battery Voltage', - ), - 'c_sound': _VarAtts(dims=[], - dtype=np.float32, - group='data_vars', - default_val=nan, - factor=0.1, - units='m s-1', - long_name='Speed of Sound', - standard_name='speed_of_sound_in_sea_water', - ), - 'heading': _VarAtts(dims=[], - dtype=np.float32, - group='data_vars', - default_val=nan, - factor=0.1, - units='degree', - long_name='Heading', - standard_name='platform_orientation', - ), - 'pitch': _VarAtts(dims=[], - dtype=np.float32, - group='data_vars', - default_val=nan, - factor=0.1, - units='degree', - long_name='Pitch', - standard_name='platform_pitch', - ), - 'roll': _VarAtts(dims=[], - dtype=np.float32, - group='data_vars', - default_val=nan, - factor=0.1, - units='degree', - long_name='Roll', - standard_name='platform_roll' - ), - 'pressure': _VarAtts(dims=[], - dtype=np.float32, - group='data_vars', - default_val=nan, - factor=0.001, - units='dbar', - long_name='Pressure', - standard_name='sea_water_pressure', - ), - 'status': _VarAtts(dims=[], - dtype=np.float32, - group='data_vars', - default_val=nan, - long_name='Status Code' - ), - 'temp': _VarAtts(dims=[], - dtype=np.float32, - group='data_vars', - 
default_val=nan, - factor=0.01, - units='degree_C', - long_name='Temperature', - standard_name='sea_water_temperature', - ), - 'vel': _VarAtts(dims=[3, 'nbins', 'n'], # how to change this for different # of beams? - dtype=np.float32, - group='data_vars', - default_val=nan, - factor=0.001, - units='m s-1', - long_name='Water Velocity', - ), - 'amp': _VarAtts(dims=[3, 'nbins', 'n'], - dtype=np.uint8, - group='data_vars', - units='1', - long_name='Acoustic Signal Amplitude', - standard_name='signal_intensity_from_multibeam_acoustic_doppler_velocity_sensor_in_sea_water', - ), + "time": _VarAtts( + dims=[], + dtype=np.float64, + group="coords", + units="seconds since 1970-01-01 00:00:00 UTC", + long_name="Time", + standard_name="time", + ), + "error": _VarAtts( + dims=[], + dtype=np.uint16, + group="data_vars", + long_name="Error Code", + ), + "AnaIn1": _VarAtts( + dims=[], + dtype=np.float32, + group="sys", + default_val=nan, + units="n/a", + ), + "batt": _VarAtts( + dims=[], + dtype=np.float32, + group="data_vars", + default_val=nan, + factor=0.1, + units="V", + long_name="Battery Voltage", + ), + "c_sound": _VarAtts( + dims=[], + dtype=np.float32, + group="data_vars", + default_val=nan, + factor=0.1, + units="m s-1", + long_name="Speed of Sound", + standard_name="speed_of_sound_in_sea_water", + ), + "heading": _VarAtts( + dims=[], + dtype=np.float32, + group="data_vars", + default_val=nan, + factor=0.1, + units="degree", + long_name="Heading", + standard_name="platform_orientation", + ), + "pitch": _VarAtts( + dims=[], + dtype=np.float32, + group="data_vars", + default_val=nan, + factor=0.1, + units="degree", + long_name="Pitch", + standard_name="platform_pitch", + ), + "roll": _VarAtts( + dims=[], + dtype=np.float32, + group="data_vars", + default_val=nan, + factor=0.1, + units="degree", + long_name="Roll", + standard_name="platform_roll", + ), + "pressure": _VarAtts( + dims=[], + dtype=np.float32, + group="data_vars", + default_val=nan, + factor=0.001, + 
units="dbar", + long_name="Pressure", + standard_name="sea_water_pressure", + ), + "status": _VarAtts( + dims=[], + dtype=np.float32, + group="data_vars", + default_val=nan, + long_name="Status Code", + ), + "temp": _VarAtts( + dims=[], + dtype=np.float32, + group="data_vars", + default_val=nan, + factor=0.01, + units="degree_C", + long_name="Temperature", + standard_name="sea_water_temperature", + ), + "vel": _VarAtts( + dims=[3, "nbins", "n"], # how to change this for different # of beams? + dtype=np.float32, + group="data_vars", + default_val=nan, + factor=0.001, + units="m s-1", + long_name="Water Velocity", + ), + "amp": _VarAtts( + dims=[3, "nbins", "n"], + dtype=np.uint8, + group="data_vars", + units="1", + long_name="Acoustic Signal Amplitude", + standard_name="signal_intensity_from_multibeam_acoustic_doppler_velocity_sensor_in_sea_water", + ), +} + +waves_hdrdata = { + "time_alt": _VarAtts( + dims=[], + dtype=np.float64, + group="coords", + default_val=nan, + units="seconds since 1970-01-01 00:00:00 UTC", + long_name="Time", + standard_name="time", + ), + "batt_alt": _VarAtts( + dims=[], + dtype=np.uint16, + group="data_vars", + default_val=nan, + factor=0.1, + units="V", + long_name="Battery Voltage", + ), + "c_sound_alt": _VarAtts( + dims=[], + dtype=np.float32, + group="data_vars", + default_val=nan, + factor=0.1, + units="m s-1", + long_name="Speed of Sound", + standard_name="speed_of_sound_in_sea_water", + ), + "heading_alt": _VarAtts( + dims=[], + dtype=np.float32, + group="data_vars", + default_val=nan, + factor=0.1, + units="degree", + long_name="Heading", + standard_name="platform_orientation", + ), + "pitch_alt": _VarAtts( + dims=[], + dtype=np.float32, + group="data_vars", + default_val=nan, + factor=0.1, + units="degree", + long_name="Pitch", + standard_name="platform_pitch", + ), + "roll_alt": _VarAtts( + dims=[], + dtype=np.float32, + group="data_vars", + default_val=nan, + factor=0.1, + units="degree", + long_name="Roll", + 
standard_name="platform_roll", + ), + "pressure1_alt": _VarAtts( + dims=[], + dtype=np.float32, + group="data_vars", + default_val=nan, + factor=0.001, + units="dbar", + long_name="Pressure Min", + standard_name="sea_water_pressure", + ), + "pressure2_alt": _VarAtts( + dims=[], + dtype=np.float32, + group="data_vars", + default_val=nan, + factor=0.001, + units="dbar", + long_name="Pressure Max", + standard_name="sea_water_pressure", + ), + "temp_alt": _VarAtts( + dims=[], + dtype=np.float32, + group="data_vars", + default_val=nan, + factor=0.01, + units="degree_C", + long_name="Temperature", + standard_name="sea_water_temperature", + ), +} + +waves_data = { + "pressure_alt": _VarAtts( + dims=[], + dtype=np.float32, + group="data_vars", + default_val=nan, + factor=0.001, + units="dbar", + long_name="Pressure", + standard_name="sea_water_pressure", + ), + "dist1_alt": _VarAtts( + dims=[], + dtype=np.uint16, + group="data_vars", + default_val=nan, + factor=0.001, + units="m", + long_name="AST distance1 on vertical beam", + standard_name="altimeter_range", + ), + "dist2_alt": _VarAtts( + dims=[], + dtype=np.uint16, + group="data_vars", + default_val=nan, + factor=0.001, + units="m", + long_name="AST distance2 on vertical beam", + standard_name="altimeter_range", + ), + "AnaIn1_alt": _VarAtts( + dims=[], + dtype=np.float32, + group="sys", + default_val=nan, + units="n/a", + ), + "vel_alt": _VarAtts( + dims=[4, "n"], + dtype=np.float32, + group="data_vars", + default_val=nan, + factor=0.001, + units="m s-1", + long_name="Water Velocity", + ), + "amp_alt": _VarAtts( + dims=[4, "n"], + dtype=np.uint8, + group="data_vars", + default_val=nan, + units="1", + long_name="Acoustic Signal Amplitude", + standard_name="signal_intensity_from_multibeam_acoustic_doppler_velocity_sensor_in_sea_water", + ), + "quality_alt": _VarAtts( + dims=[], + dtype=np.float32, + group="data_vars", + default_val=nan, + units="1", + long_name="Altimeter Quality Indicator", + ), } diff --git 
a/mhkit/dolfyn/io/rdi.py b/mhkit/dolfyn/io/rdi.py index 68ffac611..92996c7f3 100644 --- a/mhkit/dolfyn/io/rdi.py +++ b/mhkit/dolfyn/io/rdi.py @@ -14,8 +14,15 @@ from ..rotate.api import set_declination -def read_rdi(filename, userdata=None, nens=None, debug_level=-1, - vmdas_search=False, winriver=False, **kwargs): +def read_rdi( + filename, + userdata=None, + nens=None, + debug_level=-1, + vmdas_search=False, + winriver=False, + **kwargs, +): """ Read a TRDI binary data file. @@ -26,7 +33,7 @@ def read_rdi(filename, userdata=None, nens=None, debug_level=-1, userdata : True, False, or string of userdata.json filename Whether to read the '.userdata.json' file. Default = True nens : None, int or 2-element tuple (start, stop) - Number of pings or ensembles to read from the file. + Number of pings or ensembles to read from the file. Default is None, read entire file debug_level : int Debug level [0 - 2]. Default = -1 @@ -34,7 +41,7 @@ def read_rdi(filename, userdata=None, nens=None, debug_level=-1, Search from the end of each ensemble for the VMDAS navigation block. The byte offsets are sometimes incorrect. Default = False winriver : bool - If file is winriver or not. Automatically set by dolfyn, this is helpful + If file is winriver or not. Automatically set by dolfyn, this is helpful for debugging. 
Default = False Returns @@ -47,19 +54,20 @@ def read_rdi(filename, userdata=None, nens=None, debug_level=-1, for handler in logging.root.handlers[:]: logging.root.removeHandler(handler) filepath = Path(filename) - logfile = filepath.with_suffix('.dolfyn.log') - logging.basicConfig(filename=str(logfile), - filemode='w', - level=logging.NOTSET, - format='%(name)s - %(levelname)s - %(message)s') + logfile = filepath.with_suffix(".dolfyn.log") + logging.basicConfig( + filename=str(logfile), + filemode="w", + level=logging.NOTSET, + format="%(name)s - %(levelname)s - %(message)s", + ) # Reads into a dictionary of dictionaries using netcdf naming conventions # Should be easier to debug - with _RDIReader(filename, - debug_level=debug_level, - vmdas_search=vmdas_search, - winriver=winriver) as ldr: - datNB, datBB = ldr.load_data(nens=nens) + rdr = _RDIReader( + filename, debug_level=debug_level, vmdas_search=vmdas_search, winriver=winriver + ) + datNB, datBB = rdr.load_data(nens=nens) dats = [dat for dat in [datNB, datBB] if dat is not None] @@ -68,58 +76,57 @@ def read_rdi(filename, userdata=None, nens=None, debug_level=-1, dss = [] for dat in dats: for nm in userdata: - dat['attrs'][nm] = userdata[nm] + dat["attrs"][nm] = userdata[nm] # Pass one if only one ds returned - if not np.isfinite(dat['coords']['time'][0]): + if not np.isfinite(dat["coords"]["time"][0]): continue # GPS data not necessarily sampling at the same rate as ADCP DAQ. 
- if 'time_gps' in dat['coords']: + if "time_gps" in dat["coords"]: dat = _remove_gps_duplicates(dat) # Convert time coords to dt64 - t_coords = [t for t in dat['coords'] if 'time' in t] + t_coords = [t for t in dat["coords"] if "time" in t] for ky in t_coords: - dat['coords'][ky] = tmlib.epoch2dt64(dat['coords'][ky]) + dat["coords"][ky] = tmlib.epoch2dt64(dat["coords"][ky]) # Convert time vars to dt64 - t_data = [t for t in dat['data_vars'] if 'time' in t] + t_data = [t for t in dat["data_vars"] if "time" in t] for ky in t_data: - dat['data_vars'][ky] = tmlib.epoch2dt64(dat['data_vars'][ky]) + dat["data_vars"][ky] = tmlib.epoch2dt64(dat["data_vars"][ky]) # Create xarray dataset from upper level dictionary ds = _create_dataset(dat) ds = _set_coords(ds, ref_frame=ds.coord_sys) # Create orientation matrices - if 'beam2inst_orientmat' not in ds: - ds['beam2inst_orientmat'] = xr.DataArray( - _calc_beam_orientmat(ds.beam_angle, - ds.beam_pattern == 'convex'), - coords={'x1': [1, 2, 3, 4], - 'x2': [1, 2, 3, 4]}, - dims=['x1', 'x2'], - attrs={'units': '1', - 'long_name': 'Rotation Matrix'}) - - if 'orientmat' not in ds: - ds['orientmat'] = _calc_orientmat(ds) + if "beam2inst_orientmat" not in ds: + ds["beam2inst_orientmat"] = xr.DataArray( + _calc_beam_orientmat(ds.beam_angle, ds.beam_pattern == "convex"), + coords={"x1": [1, 2, 3, 4], "x2": [1, 2, 3, 4]}, + dims=["x1", "x2"], + attrs={"units": "1", "long_name": "Rotation Matrix"}, + ) + + if "orientmat" not in ds: + ds["orientmat"] = _calc_orientmat(ds) # Check magnetic declination if provided via software and/or userdata _set_rdi_declination(ds, filename, inplace=True) # VMDAS applies gps correction on velocity in .ENX files only - if filename.rsplit('.')[-1] == 'ENX': - ds.attrs['vel_gps_corrected'] = 1 + if filename.rsplit(".")[-1] == "ENX": + ds.attrs["vel_gps_corrected"] = 1 else: # (not ENR or ENS) or WinRiver files - ds.attrs['vel_gps_corrected'] = 0 + ds.attrs["vel_gps_corrected"] = 0 dss += [ds] if len(dss) == 
2: - warnings.warn("\nTwo profiling configurations retrieved from file" - "\nReturning first.") + warnings.warn( + "\nTwo profiling configurations retrieved from file" "\nReturning first." + ) # Close handler if debug_level >= 0: @@ -137,22 +144,23 @@ def _remove_gps_duplicates(dat): (in addition to the GPS unit's timestamp). """ - dat['data_vars']['hdwtime_gps'] = dat['coords']['time'] + dat["data_vars"]["hdwtime_gps"] = dat["coords"]["time"] # Remove duplicate timestamp values, if applicable - dat['coords']['time_gps'], idx = np.unique(dat['coords']['time_gps'], - return_index=True) + dat["coords"]["time_gps"], idx = np.unique( + dat["coords"]["time_gps"], return_index=True + ) # Remove nan values, if applicable - nan = np.zeros(dat['coords']['time'].shape, dtype=bool) - if any(np.isnan(dat['coords']['time_gps'])): - nan = np.isnan(dat['coords']['time_gps']) - dat['coords']['time_gps'] = dat['coords']['time_gps'][~nan] - - for key in dat['data_vars']: - if ('gps' in key) or ('nmea' in key): - dat['data_vars'][key] = dat['data_vars'][key][idx] + nan = np.zeros(dat["coords"]["time"].shape, dtype=bool) + if any(np.isnan(dat["coords"]["time_gps"])): + nan = np.isnan(dat["coords"]["time_gps"]) + dat["coords"]["time_gps"] = dat["coords"]["time_gps"][~nan] + + for key in dat["data_vars"]: + if ("gps" in key) or ("nmea" in key): + dat["data_vars"][key] = dat["data_vars"][key][idx] if sum(nan) > 0: - dat['data_vars'][key] = dat['data_vars'][key][~nan] + dat["data_vars"][key] = dat["data_vars"][key][~nan] return dat @@ -163,44 +171,46 @@ def _set_rdi_declination(dat, fname, inplace): included in the heading and in the velocity data. 
""" - declin = dat.attrs.pop('declination', None) # userdata declination + declin = dat.attrs.pop("declination", None) # userdata declination - if dat.attrs['magnetic_var_deg'] != 0: # from TRDI software if set - dat.attrs['declination'] = dat.attrs['magnetic_var_deg'] - dat.attrs['declination_in_orientmat'] = 1 # logical + if dat.attrs["magnetic_var_deg"] != 0: # from TRDI software if set + dat.attrs["declination"] = dat.attrs["magnetic_var_deg"] + dat.attrs["declination_in_orientmat"] = 1 # logical - if dat.attrs['magnetic_var_deg'] != 0 and declin is not None: + if dat.attrs["magnetic_var_deg"] != 0 and declin is not None: warnings.warn( "'magnetic_var_deg' is set to {:.2f} degrees in the binary " "file '{}', AND 'declination' is set in the 'userdata.json' " "file. DOLfYN WILL USE THE VALUE of {:.2f} degrees in " "userdata.json. If you want to use the value in " "'magnetic_var_deg', delete the value from userdata.json and " - "re-read the file." - .format(dat.attrs['magnetic_var_deg'], fname, declin)) - dat.attrs['declination'] = declin + "re-read the file.".format(dat.attrs["magnetic_var_deg"], fname, declin) + ) + dat.attrs["declination"] = declin if declin is not None: set_declination(dat, declin, inplace) -class _RDIReader(): - _pos = 0 - progress = 0 - _cfac = 180 / 2 ** 31 - _source = 0 - _fixoffset = 0 - _nbyte = 0 - _search_num = 30000 # Maximum distance? 
to search - _debug7f79 = None - - def __init__(self, fname, navg=1, debug_level=0, vmdas_search=False, winriver=False): +class _RDIReader: + def __init__( + self, fname, navg=1, debug_level=-1, vmdas_search=False, winriver=False + ): self.fname = _abspath(fname) - print('\nReading file {} ...'.format(fname)) + print("\nReading file {} ...".format(fname)) self._debug_level = debug_level self._vmdas_search = vmdas_search self._winrivprob = winriver - self.flag = 0 + self._vm_source = 0 + self._pos = 0 + self.progress = 0 + self._cfac = 180 / 2**31 + self._fixoffset = 0 + self._nbyte = 0 + self.n_cells_diff = 0 + self.n_cells_sl = 0 + self.cs_diff = 0 + self.cs = [] self.cfg = {} self.cfgbb = {} self.hdr = {} @@ -209,24 +219,21 @@ def __init__(self, fname, navg=1, debug_level=0, vmdas_search=False, winriver=Fa # Check header, double buffer, and get filesize self._filesize = getsize(self.fname) space = self.code_spacing() # '0x7F' - self._npings = int(self._filesize / (space + 2)) - if self._debug_level >= 0: - logging.info('Done: {}'.format(self.cfg)) - logging.info('self._bb {}'.format(self._bb)) - logging.info(self.cfgbb) + self._npings = self._filesize // space + if self._debug_level > -1: + logging.info("Done: {}".format(self.cfg)) + logging.info("self._bb {}".format(self._bb)) + logging.info("self.cfgbb: {}".format(self.cfgbb)) self.f.seek(self._pos, 0) self.n_avg = navg - self.ensemble = defs._ensemble(self.n_avg, self.cfg['n_cells']) + self.ensemble = defs._ensemble(self.n_avg, self.cfg["n_cells"]) if self._bb: - self.ensembleBB = defs._ensemble(self.n_avg, self.cfgbb['n_cells']) + self.ensembleBB = defs._ensemble(self.n_avg, self.cfgbb["n_cells"]) - self.vars_read = defs._variable_setlist(['time']) + self.vars_read = defs._variable_setlist(["time"]) if self._bb: - self.vars_readBB = defs._variable_setlist(['time']) - - if self._debug_level >= 0: - logging.info(' %d pings estimated in this file' % self._npings) + self.vars_readBB = 
defs._variable_setlist(["time"]) def code_spacing(self, iternum=50): """ @@ -237,7 +244,7 @@ def code_spacing(self, iternum=50): p0 = self._pos # Get basic header data and check dual profile if not self.read_hdr(): - raise RuntimeError('No header in this file') + raise RuntimeError("No header in this file") self._bb = self.check_for_double_buffer() # Turn off debugging to check code spacing @@ -249,52 +256,48 @@ def code_spacing(self, iternum=50): except: break # Compute the average of the data size: - size = (self._pos - p0) / (i+1) * 0.995 + size = (self._pos - p0) / (i + 1) self.f = fd self._pos = p0 self._debug_level = debug_level return size - def read_hdr(self,): - fd = self.f - cfgid = list(fd.read_ui8(2)) - nread = 0 - if self._debug_level >= 0: - logging.info('pos {}'.format(self.f.pos)) - logging.info('cfgid0: [{:x}, {:x}]'.format(*cfgid)) - while (cfgid[0] != 127 or cfgid[1] != 127) or not self.checkheader(): - nextbyte = fd.read_ui8(1) - if nextbyte is None: - return False - pos = fd.tell() - nread += 1 - cfgid[1] = cfgid[0] - cfgid[0] = nextbyte - if not pos % 1000: - if self._debug_level >= 0: - logging.info(' Still looking for valid cfgid at file ' - 'position %d ...' 
% pos) + def read_hdr(self): + """ + Scan file until 7f7f is found + """ + if not self.search_buffer(): + return False self._pos = self.f.tell() - 2 self.read_hdrseg() return True - def check_for_double_buffer(self,): + def read_hdrseg(self): + fd = self.f + hdr = self.hdr + hdr["nbyte"] = fd.read_i16(1) + spare = fd.read_ui8(1) + ndat = fd.read_ui8(1) + hdr["dat_offsets"] = fd.read_ui16(ndat) + self._nbyte = 4 + ndat * 2 + + def check_for_double_buffer(self): """ VMDAS will record two buffers in NB or NB/BB mode, so we need to figure out if that is happening here """ found = False pos = self.f.pos - if self._debug_level >= 0: + if self._debug_level > -1: logging.info(self.hdr) - logging.info('pos {}'.format(pos)) + logging.info("pos {}".format(pos)) self.id_positions = {} - for offset in self.hdr['dat_offsets']: - self.f.seek(offset+pos - self.hdr['dat_offsets'][0], rel=0) + for offset in self.hdr["dat_offsets"]: + self.f.seek(offset + pos - self.hdr["dat_offsets"][0], rel=0) id = self.f.read_ui16(1) self.id_positions[id] = offset - if self._debug_level >= 0: - logging.info('pos {} id {}'.format(offset, id)) + if self._debug_level > -1: + logging.info("id {} offset {}".format(id, offset)) if id == 1: self.read_fixed(bb=True) found = True @@ -306,21 +309,27 @@ def check_for_double_buffer(self,): self._vmdas_search = True return found - def mean(self, dat): - if self.n_avg == 1: - return dat[..., 0] - return np.nanmean(dat, axis=-1) - def load_data(self, nens=None): if nens is None: - self._nens = int(self._npings / self.n_avg) - elif (nens.__class__ is tuple or nens.__class__ is list): + # Attempt to overshoot WinRiver2 or *Pro filesize + if (self.cfg["coord_sys"] == "ship") or ( + self.cfg["inst_model"] + in [ + "RiverPro", + "StreamPro", + ] + ): + self._nens = int(self._filesize / self.hdr["nbyte"] / self.n_avg * 1.1) + else: + # Attempt to overshoot other instrument filesizes + self._nens = int(self._npings / self.n_avg) + elif nens.__class__ is tuple or 
nens.__class__ is list: raise Exception(" `nens` must be a integer") else: self._nens = nens - if self._debug_level >= 0: - logging.info(' taking data from pings 0 - %d' % self._nens) - logging.info(' %d ensembles will be produced.\n' % self._nens) + if self._debug_level > -1: + logging.info(" taking data from pings 0 - %d" % self._nens) + logging.info(" %d ensembles will be produced.\n" % self._nens) self.init_data() for iens in range(self._nens): @@ -333,97 +342,103 @@ def load_data(self, nens=None): ens = [self.ensemble] vars = [self.vars_read] datl = [self.outd] + cfgl = [self.cfg] if self._bb: ens += [self.ensembleBB] vars += [self.vars_readBB] datl += [self.outdBB] + cfgl += [self.cfgbb] for var, en, dat in zip(vars, ens, datl): + for nm in var: + dat = self.save_profiles(dat, nm, en, iens) + # reset flag after all variables run + self.n_cells_diff = 0 + + # Set clock clock = en.rtc[:, :] if clock[0, 0] < 100: clock[0, :] += defs.century - - for nm in var: - # If n_cells has increased (WinRiver transects) - ds = defs._get(dat, nm) - bn = self.mean(en[nm]) - # Check that - # 1. n_cells has changed, - # 2. nm is a beam variable - # 3. n_cells is greater than any previous - if self.flag > 0 and len(ds.shape) == 3 and (ds.shape[0] != bn.shape[0]): - # increase the size of original dataset - a = np.empty( - (self.flag, ds.shape[1], ds.shape[2]))*np.nan - ds = np.append(ds, a, axis=0) - defs._setd(dat, nm, ds) - # Copy the ensemble to the dataset. 
- ds[..., iens] = bn - # reset after all variables run - self.flag = 0 - try: dates = tmlib.date2epoch( - tmlib.datetime(*clock[:6, 0], - microsecond=clock[6, 0] * 10000))[0] + tmlib.datetime(*clock[:6, 0], microsecond=clock[6, 0] * 10000) + )[0] except ValueError: - warnings.warn("Invalid time stamp in ping {}.".format( - int(self.ensemble.number[0]))) - dat['coords']['time'][iens] = np.NaN + warnings.warn( + "Invalid time stamp in ping {}.".format( + int(self.ensemble.number[0]) + ) + ) + dat["coords"]["time"][iens] = np.NaN else: - dat['coords']['time'][iens] = np.median(dates) - - self.cleanup(self.cfg, self.outd) - if self._bb: - self.cleanup(self.cfgbb, self.outdBB) + dat["coords"]["time"][iens] = np.median(dates) # Finalize dataset (runs through both nb and bb) - for dat in datl: - self.finalize(dat) - if 'vel_bt' in dat['data_vars']: - dat['attrs']['rotate_vars'].append('vel_bt') + for dat, cfg in zip(datl, cfgl): + dat, cfg = self.cleanup(dat, cfg) + dat = self.finalize(dat) + if "vel_bt" in dat["data_vars"]: + dat["attrs"]["rotate_vars"].append("vel_bt") - dat = self.outd datbb = self.outdBB if self._bb else None - return dat, datbb - - def init_data(self,): - outd = {'data_vars': {}, 'coords': {}, - 'attrs': {}, 'units': {}, 'long_name': {}, - 'standard_name': {}, 'sys': {}} - outd['attrs']['inst_make'] = 'TRDI' - outd['attrs']['inst_type'] = 'ADCP' - outd['attrs']['rotate_vars'] = ['vel', ] + return self.outd, datbb + + def init_data(self): + outd = { + "data_vars": {}, + "coords": {}, + "attrs": {}, + "units": {}, + "long_name": {}, + "standard_name": {}, + "sys": {}, + } + outd["attrs"]["inst_make"] = "TRDI" + outd["attrs"]["inst_type"] = "ADCP" + outd["attrs"]["rotate_vars"] = [ + "vel", + ] # Currently RDI doesn't use IMUs - outd['attrs']['has_imu'] = 0 + outd["attrs"]["has_imu"] = 0 if self._bb: - outdbb = {'data_vars': {}, 'coords': {}, - 'attrs': {}, 'units': {}, 'long_name': {}, - 'standard_name': {}, 'sys': {}} - outdbb['attrs']['inst_make'] = 
'TRDI' - outdbb['attrs']['inst_type'] = 'ADCP' - outdbb['attrs']['rotate_vars'] = ['vel', ] - outdbb['attrs']['has_imu'] = 0 - + outdbb = { + "data_vars": {}, + "coords": {}, + "attrs": {}, + "units": {}, + "long_name": {}, + "standard_name": {}, + "sys": {}, + } + outdbb["attrs"]["inst_make"] = "TRDI" + outdbb["attrs"]["inst_type"] = "ADCP" + outdbb["attrs"]["rotate_vars"] = [ + "vel", + ] + outdbb["attrs"]["has_imu"] = 0 + + # Preallocate variables and data sizes for nm in defs.data_defs: - outd = defs._idata(outd, nm, - sz=defs._get_size(nm, self._nens, self.cfg['n_cells'])) + outd = defs._idata( + outd, nm, sz=defs._get_size(nm, self._nens, self.cfg["n_cells"]) + ) self.outd = outd if self._bb: for nm in defs.data_defs: - outdbb = defs._idata(outdbb, nm, - sz=defs._get_size(nm, self._nens, self.cfgbb['n_cells'])) + outdbb = defs._idata( + outdbb, nm, sz=defs._get_size(nm, self._nens, self.cfgbb["n_cells"]) + ) self.outdBB = outdbb if self._debug_level > 1: - logging.info(np.shape(outdbb['data_vars']['vel'])) + logging.info(np.shape(outdbb["data_vars"]["vel"])) if self._debug_level > 1: - logging.info('{} ncells, not BB'.format(self.cfg['n_cells'])) + logging.info("{} ncells, not BB".format(self.cfg["n_cells"])) if self._bb: - logging.info('{} ncells, BB'.format(self.cfgbb['n_cells'])) + logging.info("{} ncells, BB".format(self.cfgbb["n_cells"])) - def read_buffer(self,): + def read_buffer(self): fd = self.f self.ensemble.k = -1 # so that k+=1 gives 0 on the first loop. 
if self._bb: @@ -435,304 +450,300 @@ def read_buffer(self,): return False startpos = fd.tell() - 2 self.read_hdrseg() - if self._debug_level >= 0: - logging.info('Read Header', hdr) + if self._debug_level > -1: + logging.info("Read Header", hdr) byte_offset = self._nbyte + 2 self._read_vmdas = False - for n in range(len(hdr['dat_offsets'])): + for n in range(len(hdr["dat_offsets"])): id = fd.read_ui16(1) if self._debug_level > 0: - logging.info(f'n {n}: {id} {id:04x}') + logging.info(f"n {n}: {id} {id:04x}") self.print_pos() retval = self.read_dat(id) - if retval == 'FAIL': + if retval == "FAIL": break byte_offset += self._nbyte - if n < (len(hdr['dat_offsets']) - 1): - oset = hdr['dat_offsets'][n + 1] - byte_offset + if n < (len(hdr["dat_offsets"]) - 1): + oset = hdr["dat_offsets"][n + 1] - byte_offset if oset != 0: if self._debug_level > 0: - logging.debug( - ' %s: Adjust location by %d\n' % (id, oset)) + logging.debug(" %s: Adjust location by %d\n" % (id, oset)) fd.seek(oset, 1) - byte_offset = hdr['dat_offsets'][n + 1] + byte_offset = hdr["dat_offsets"][n + 1] else: - if hdr['nbyte'] - 2 != byte_offset: + if hdr["nbyte"] - 2 != byte_offset: if not self._winrivprob: if self._debug_level > 0: - logging.debug(' {:d}: Adjust location by {:d}\n' - .format(id, hdr['nbyte'] - 2 - byte_offset)) - self.f.seek(hdr['nbyte'] - 2 - byte_offset, 1) - byte_offset = hdr['nbyte'] - 2 + logging.debug( + " {:d}: Adjust location by {:d}\n".format( + id, hdr["nbyte"] - 2 - byte_offset + ) + ) + self.f.seek(hdr["nbyte"] - 2 - byte_offset, 1) + byte_offset = hdr["nbyte"] - 2 # Check for vmdas again because vmdas doesn't set the offsets # correctly, and we need this info: if not self._read_vmdas and self._vmdas_search: - if self._debug_level >= 1: - logging.info( - 'Searching for vmdas nav data. Going to next ensemble') + if self._debug_level > 0: + logging.info("Searching for vmdas nav data. 
Going to next ensemble") self.search_buffer() # now go back to where vmdas would be: fd.seek(-98, 1) id = self.f.read_ui16(1) if id is not None: - if self._debug_level >= 1: - logging.info(f'Found {id:04d}') + if self._debug_level > 0: + logging.info(f"Found {id:04d}") if id == 8192: self.read_dat(id) readbytes = fd.tell() - startpos - offset = hdr['nbyte'] + 2 - readbytes + offset = hdr["nbyte"] + 2 - readbytes self.check_offset(offset, readbytes) self.print_pos(byte_offset=byte_offset) return True + def print_progress(self): + self.progress = self.f.tell() + if self._debug_level > 1: + logging.debug( + " pos %0.0fmb/%0.0fmb\n" + % (self.f.tell() / 1048576.0, self._filesize / 1048576.0) + ) + if (self.f.tell() - self.progress) < 1048576: + return + def search_buffer(self): """ Check to see if the next bytes indicate the beginning of a data block. If not, search for the next data block, up to _search_num times. """ - id = self.f.read_ui8(2) + fd = self.f + id = fd.read_ui8(2) if id is None: return False - id1 = list(id) + cfgid = list(id) + pos_7f79 = False search_cnt = 0 - fd = self.f - if self._debug_level >= 2: - logging.info(' -->In search_buffer...') - while (search_cnt < self._search_num and - ((id1[0] != 127 or id1[1] != 127) or - not self.checkheader())): - search_cnt += 1 - nextbyte = fd.read_ui8(1) - if nextbyte == None: - return False - id1[1] = id1[0] - id1[0] = nextbyte - if search_cnt == self._search_num: - raise Exception( - 'Searched {} entries... Bad data encountered. 
-> {}' - .format(search_cnt, id1)) - elif search_cnt > 0: - if self._debug_level >= 1: - logging.info(' Searched {} bytes to find next ' - 'valid ensemble start [{:x}, {:x}]\n' - .format(search_cnt, *id1)) + + if self._debug_level > -1: + logging.info("pos {}".format(fd.pos)) + logging.info("cfgid0: [{:x}, {:x}]".format(*cfgid)) + # If not [127, 127] or if the file ends in the next ensemble + while (cfgid != [127, 127]) or self.check_eof(): + if cfgid == [127, 121]: + # Search for the next header or the end of the file + skipbytes = fd.read_i16(1) + fd.seek(skipbytes - 2, 1) + id = fd.read_ui8(2) + if id is None: # EOF + return False + cfgid = list(id) + pos_7f79 = True + else: + # Search til we find something or hit the end of the file + search_cnt += 1 + nextbyte = fd.read_ui8(1) + if nextbyte is None: # EOF + return False + cfgid[0] = cfgid[1] + cfgid[1] = nextbyte + + if pos_7f79 and self._debug_level > -1: + logging.info("Skipped junk data: [{:x}, {:x}]".format(*[127, 121])) + + if search_cnt > 0: + if self._debug_level > 0: + logging.info( + " Searched {} bytes to find next " + "valid ensemble start [{:x}, {:x}]\n".format(search_cnt, *cfgid) + ) + return True - def checkheader(self,): - if self._debug_level > 1: - logging.info(" ###In checkheader.") + def check_eof(self): + """ + Returns True if next header is bad or at end of file. 
+ """ fd = self.f - valid = False - if self._debug_level >= 0: - logging.info('pos {}'.format(self.f.pos)) + out = True numbytes = fd.read_i16(1) + # Search for next config id if numbytes > 0: fd.seek(numbytes - 2, 1) cfgid = fd.read_ui8(2) if cfgid is None: if self._debug_level > 1: - logging.info('EOF') - return False + logging.info("EOF") + return True + # Make sure one is found, either 7f7f or 7f79 if len(cfgid) == 2: fd.seek(-numbytes - 2, 1) if cfgid[0] == 127 and cfgid[1] in [127, 121]: - if cfgid[1] == 121 and self._debug7f79 is None: - self._debug7f79 = True - if self._debug_level > 1: - logging.warning('7f79!!!') - valid = True + out = False else: fd.seek(-2, 1) - if self._debug_level > 1: - logging.info(" ###Leaving checkheader.") - return valid - - def read_hdrseg(self,): - fd = self.f - hdr = self.hdr - hdr['nbyte'] = fd.read_i16(1) - spare = fd.read_ui8(1) - ndat = fd.read_ui8(1) - hdr['dat_offsets'] = fd.read_ui16(ndat) - self._nbyte = 4 + ndat * 2 - - def print_progress(self,): - self.progress = self.f.tell() - if self._debug_level > 1: - logging.debug(' pos %0.0fmb/%0.0fmb\n' % - (self.f.tell() / 1048576., self._filesize / 1048576.)) - if (self.f.tell() - self.progress) < 1048576: - return + return out def print_pos(self, byte_offset=-1): - """Print the position in the file, used for debugging. 
- """ - if self._debug_level >= 2: - if hasattr(self, 'ensemble'): + """Print the position in the file, used for debugging.""" + if self._debug_level > 1: + if hasattr(self, "ensemble"): k = self.ensemble.k else: k = 0 logging.debug( - f' pos: {self.f.tell()}, pos_: {self._pos}, nbyte: {self._nbyte}, k: {k}, byte_offset: {byte_offset}') - - def check_offset(self, offset, readbytes): - fd = self.f - if offset != 4 and self._fixoffset == 0: - if self._debug_level > 0: - if fd.tell() == self._filesize: - logging.error( - ' EOF reached unexpectedly - discarding this last ensemble\n') - else: - logging.debug(" Adjust location by {:d} (readbytes={:d},hdr['nbyte']={:d})\n" - .format(offset, readbytes, self.hdr['nbyte'])) - self._fixoffset = offset - 4 - fd.seek(4 + self._fixoffset, 1) - - def remove_end(self, iens): - dat = self.outd - if self._debug_level > 0: - logging.info(' Encountered end of file. Cleaning up data.') - for nm in self.vars_read: - defs._setd(dat, nm, defs._get(dat, nm)[..., :iens]) + f" pos: {self.f.tell()}, pos_: {self._pos}, nbyte: {self._nbyte}, k: {k}, byte_offset: {byte_offset}" + ) def read_dat(self, id): - function_map = {0: (self.read_fixed, []), # 0000 1st profile fixed leader - 1: (self.read_fixed, [True]), # 0001 - # 0010 Surface layer fixed leader (RiverPro & StreamPro) - 16: (self.read_fixed_sl, []), - # 0080 1st profile variable leader - 128: (self.read_var, [0]), - # 0081 2nd profile variable leader - 129: (self.read_var, [1]), - # 0100 1st profile velocity - 256: (self.read_vel, [0]), - # 0101 2nd profile velocity - 257: (self.read_vel, [1]), - # 0103 Waves first leader - 259: (self.skip_Nbyte, [74]), - # 0110 Surface layer velocity (RiverPro & StreamPro) - 272: (self.read_vel, [2]), - # 0200 1st profile correlation - 512: (self.read_corr, [0]), - # 0201 2nd profile correlation - 513: (self.read_corr, [1]), - # 0203 Waves data - 515: (self.skip_Nbyte, [186]), - # 020C Ambient sound profile - 524: (self.skip_Nbyte, [4]), - # 0210 
Surface layer correlation (RiverPro & StreamPro) - 528: (self.read_corr, [2]), - # 0300 1st profile amplitude - 768: (self.read_amp, [0]), - # 0301 2nd profile amplitude - 769: (self.read_amp, [1]), - # 0302 Beam 5 Sum of squared velocities - 770: (self.skip_Ncol, []), - # 0303 Waves last leader - 771: (self.skip_Ncol, [18]), - # 0310 Surface layer amplitude (RiverPro & StreamPro) - 784: (self.read_amp, [2]), - # 0400 1st profile % good - 1024: (self.read_prcnt_gd, [0]), - # 0401 2nd profile pct good - 1025: (self.read_prcnt_gd, [1]), - # 0403 Waves HPR data - 1027: (self.skip_Nbyte, [6]), - # 0410 Surface layer pct good (RiverPro & StreamPro) - 1040: (self.read_prcnt_gd, [2]), - # 0500 1st profile status - 1280: (self.read_status, [0]), - # 0501 2nd profile status - 1281: (self.read_status, [1]), - # 0510 Surface layer status (RiverPro & StreamPro) - 1296: (self.read_status, [2]), - 1536: (self.read_bottom, []), # 0600 bottom tracking - 1793: (self.skip_Ncol, [4]), # 0701 number of pings - 1794: (self.skip_Ncol, [4]), # 0702 sum of squared vel - 1795: (self.skip_Ncol, [4]), # 0703 sum of velocities - 2560: (self.skip_Ncol, []), # 0A00 Beam 5 velocity - 2816: (self.skip_Ncol, []), # 0B00 Beam 5 correlation - 3072: (self.skip_Ncol, []), # 0C00 Beam 5 amplitude - 3328: (self.skip_Ncol, []), # 0D00 Beam 5 pct_good - # Fixed attitude data format for Ocean Surveyor ADCPs - 3000: (self.skip_Nbyte, [32]), - 3841: (self.skip_Nbyte, [38]), # 0F01 Beam 5 leader - 8192: (self.read_vmdas, []), # 2000 - # 2013 Navigation parameter data - 8211: (self.skip_Nbyte, [83]), - 8226: (self.read_winriver2, []), # 2022 - 8448: (self.read_winriver, [38]), # 2100 - 8449: (self.read_winriver, [97]), # 2101 - 8450: (self.read_winriver, [45]), # 2102 - 8451: (self.read_winriver, [60]), # 2103 - 8452: (self.read_winriver, [38]), # 2104 - # 3200 Transformation matrix - 12800: (self.skip_Nbyte, [32]), - # 3000 Fixed attitude data format for Ocean Surveyor ADCPs - 12288: (self.skip_Nbyte, [32]), 
- 12496: (self.skip_Nbyte, [24]), # 30D0 - 12504: (self.skip_Nbyte, [48]), # 30D8 - # 4100 beam 5 range - 16640: (self.read_alt, []), - # 4400 Firmware status data (RiverPro & StreamPro) - 17408: (self.skip_Nbyte, [28]), - # 4401 Auto mode setup (RiverPro & StreamPro) - 17409: (self.skip_Nbyte, [82]), - # 5803 High resolution bottom track velocity - 22531: (self.skip_Nbyte, [68]), - # 5804 Bottom track range - 22532: (self.skip_Nbyte, [21]), - # 5901 ISM (IMU) data - 22785: (self.skip_Nbyte, [65]), - # 5902 Ping attitude - 22786: (self.skip_Nbyte, [105]), - # 7001 ADC data - 28673: (self.skip_Nbyte, [14]), - } + function_map = { + # 0000 1st profile fixed leader + 0: (self.read_fixed, []), + # 0001 2nd profile fixed leader + 1: (self.read_fixed, [True]), + # 0010 Surface layer fixed leader (RiverPro & StreamPro) + 16: (self.read_fixed_sl, []), + # 0080 1st profile variable leader + 128: (self.read_var, [0]), + # 0081 2nd profile variable leader + 129: (self.read_var, [1]), + # 0100 1st profile velocity + 256: (self.read_vel, [0]), + # 0101 2nd profile velocity + 257: (self.read_vel, [1]), + # 0103 Waves first leader + 259: (self.skip_Nbyte, [74]), + # 0110 Surface layer velocity (RiverPro & StreamPro) + 272: (self.read_vel, [2]), + # 0200 1st profile correlation + 512: (self.read_corr, [0]), + # 0201 2nd profile correlation + 513: (self.read_corr, [1]), + # 0203 Waves data + 515: (self.skip_Nbyte, [186]), + # 020C Ambient sound profile + 524: (self.skip_Nbyte, [4]), + # 0210 Surface layer correlation (RiverPro & StreamPro) + 528: (self.read_corr, [2]), + # 0300 1st profile amplitude + 768: (self.read_amp, [0]), + # 0301 2nd profile amplitude + 769: (self.read_amp, [1]), + # 0302 Beam 5 Sum of squared velocities + 770: (self.skip_Ncol, []), + # 0303 Waves last leader + 771: (self.skip_Ncol, [18]), + # 0310 Surface layer amplitude (RiverPro & StreamPro) + 784: (self.read_amp, [2]), + # 0400 1st profile % good + 1024: (self.read_prcnt_gd, [0]), + # 0401 2nd profile 
pct good + 1025: (self.read_prcnt_gd, [1]), + # 0403 Waves HPR data + 1027: (self.skip_Nbyte, [6]), + # 0410 Surface layer pct good (RiverPro & StreamPro) + 1040: (self.read_prcnt_gd, [2]), + # 0500 1st profile status + 1280: (self.read_status, [0]), + # 0501 2nd profile status + 1281: (self.read_status, [1]), + # 0510 Surface layer status (RiverPro & StreamPro) + 1296: (self.read_status, [2]), + 1536: (self.read_bottom, []), # 0600 bottom tracking + 1793: (self.skip_Ncol, [4]), # 0701 number of pings + 1794: (self.skip_Ncol, [4]), # 0702 sum of squared vel + 1795: (self.skip_Ncol, [4]), # 0703 sum of velocities + 2560: (self.skip_Ncol, []), # 0A00 Beam 5 velocity + 2816: (self.skip_Ncol, []), # 0B00 Beam 5 correlation + 3072: (self.skip_Ncol, []), # 0C00 Beam 5 amplitude + 3328: (self.skip_Ncol, []), # 0D00 Beam 5 pct_good + # Fixed attitude data format for Ocean Surveyor ADCPs + 3000: (self.skip_Nbyte, [32]), + 3841: (self.skip_Nbyte, [38]), # 0F01 Beam 5 leader + 8192: (self.read_vmdas, []), # 2000 + # 2013 Navigation parameter data + 8211: (self.skip_Nbyte, [83]), + 8226: (self.read_winriver2, []), # 2022 + 8448: (self.read_winriver, [38]), # 2100 + 8449: (self.read_winriver, [97]), # 2101 + 8450: (self.read_winriver, [45]), # 2102 + 8451: (self.read_winriver, [60]), # 2103 + 8452: (self.read_winriver, [38]), # 2104 + # 3200 Transformation matrix + 12800: (self.skip_Nbyte, [32]), + # 3000 Fixed attitude data format for Ocean Surveyor ADCPs + 12288: (self.skip_Nbyte, [32]), + 12496: (self.skip_Nbyte, [24]), # 30D0 + 12504: (self.skip_Nbyte, [48]), # 30D8 + # 4100 beam 5 range + 16640: (self.read_alt, []), + # 4400 Firmware status data (RiverPro & StreamPro) + 17408: (self.skip_Nbyte, [28]), + # 4401 Auto mode setup (RiverPro & StreamPro) + 17409: (self.skip_Nbyte, [82]), + # 5803 High resolution bottom track velocity + 22531: (self.skip_Nbyte, [68]), + # 5804 Bottom track range + 22532: (self.skip_Nbyte, [21]), + # 5901 ISM (IMU) data + 22785: (self.skip_Nbyte, 
[65]), + # 5902 Ping attitude + 22786: (self.skip_Nbyte, [105]), + # 7001 ADC data + 28673: (self.skip_Nbyte, [14]), + } # Call the correct function: - if self._debug_level >= 2: - logging.debug(f'Trying to Read {id}') + if self._debug_level > 1: + logging.debug(f"Trying to Read {id}") if id in function_map: if self._debug_level > 1: - logging.info(' Reading code {}...'.format(hex(id))) + logging.info(" Reading code {}...".format(hex(id))) retval = function_map.get(id)[0](*function_map[id][1]) if retval: return retval if self._debug_level > 1: - logging.info(' success!') + logging.info(" success!") else: self.read_nocode(id) def read_fixed(self, bb=False): self.read_cfgseg(bb=bb) self._nbyte += 2 - if self._debug_level >= 0: - logging.info('Read Fixed') - - # Check if n_cells changed (for winriver transect files) - if hasattr(self, 'ensemble') and (self.ensemble['n_cells'] != self.cfg['n_cells']): - diff = self.cfg['n_cells'] - self.ensemble['n_cells'] - if diff > 0: - self.flag = diff - self.ensemble = defs._ensemble(self.n_avg, self.cfg['n_cells']) - # Not concerned if # of cells decreases - if self._debug_level >= 1: - logging.warning('Number of cells changed to {}' - .format(self.cfg['n_cells'])) - - def read_fixed_sl(self,): + if self._debug_level > -1: + logging.info("Read Fixed") + + # Check if n_cells has increased (for winriver transect files) + if hasattr(self, "ensemble"): + self.n_cells_diff = self.cfg["n_cells"] - self.ensemble["n_cells"] + # Increase n_cells if greater than 0 + if self.n_cells_diff > 0: + self.ensemble = defs._ensemble(self.n_avg, self.cfg["n_cells"]) + if self._debug_level > 0: + logging.warning( + f"Maximum number of cells increased to {self.cfg['n_cells']}" + ) + + def read_fixed_sl(self): # Surface layer profile cfg = self.cfg - cfg['surface_layer'] = 1 - cfg['n_cells_sl'] = self.f.read_ui8(1) - cfg['cell_size_sl'] = self.f.read_ui16(1) * .01 - cfg['bin1_dist_m_sl'] = round(self.f.read_ui16(1) * .01, 4) - - if self._debug_level >= 
0: - logging.info('Read Surface Layer Config') + cfg["surface_layer"] = 1 + n_cells = self.f.read_ui8(1) + # Check if n_cells is greater than what was used in prior profiles + if n_cells > self.n_cells_sl: + self.n_cells_sl = n_cells + if self._debug_level > 0: + logging.warning( + f"Maximum number of surface layer cells increased to {n_cells}" + ) + cfg["n_cells_sl"] = n_cells + # Assuming surface layer profile cell size never changes + cfg["cell_size_sl"] = self.f.read_ui16(1) * 0.01 + cfg["bin1_dist_m_sl"] = round(self.f.read_ui16(1) * 0.01, 4) + + if self._debug_level > -1: + logging.info("Read Surface Layer Config") self._nbyte = 2 + 5 def read_cfgseg(self, bb=False): @@ -745,71 +756,79 @@ def read_cfgseg(self, bb=False): fd = self.f tmp = fd.read_ui8(5) prog_ver0 = tmp[0] - cfg['prog_ver'] = tmp[0] + tmp[1] / 100. - cfg['inst_model'] = defs.adcp_type.get(tmp[0], - 'unrecognized firmware version') + cfg["prog_ver"] = tmp[0] + tmp[1] / 100.0 + cfg["inst_model"] = defs.adcp_type.get(tmp[0], "unrecognized firmware version") config = tmp[2:4] - cfg['beam_angle'] = [15, 20, 30][(config[1] & 3)] + cfg["beam_angle"] = [15, 20, 30][(config[1] & 3)] beam5 = [0, 1][int((config[1] & 16) == 16)] - cfg['freq'] = ([75, 150, 300, 600, 1200, 2400, 38][(config[0] & 7)]) - cfg['beam_pattern'] = (['concave', - 'convex'][int((config[0] & 8) == 8)]) - cfg['orientation'] = ['down', 'up'][int((config[0] & 128) == 128)] - simflag = ['real', 'simulated'][tmp[4]] + cfg["freq"] = [75, 150, 300, 600, 1200, 2400, 38][(config[0] & 7)] + cfg["beam_pattern"] = ["concave", "convex"][int((config[0] & 8) == 8)] + cfg["orientation"] = ["down", "up"][int((config[0] & 128) == 128)] + simflag = ["real", "simulated"][tmp[4]] fd.seek(1, 1) - cfg['n_beams'] = fd.read_ui8(1) + beam5 - cfg['n_cells'] = fd.read_ui8(1) - cfg['pings_per_ensemble'] = fd.read_ui16(1) - cfg['cell_size'] = fd.read_ui16(1) * .01 - cfg['blank_dist'] = fd.read_ui16(1) * .01 - cfg['profiling_mode'] = fd.read_ui8(1) - 
cfg['min_corr_threshold'] = fd.read_ui8(1) - cfg['n_code_reps'] = fd.read_ui8(1) - cfg['min_prcnt_gd'] = fd.read_ui8(1) - cfg['max_error_vel'] = fd.read_ui16(1) / 1000 - cfg['sec_between_ping_groups'] = ( - np.sum(np.array(fd.read_ui8(3)) * - np.array([60., 1., .01]))) + cfg["n_beams"] = fd.read_ui8(1) + beam5 + # Check if number of cells has changed + n_cells = fd.read_ui8(1) + if ("n_cells" not in cfg) or (n_cells != cfg["n_cells"]): + cfg["n_cells"] = n_cells + if self._debug_level > 0: + logging.info(f"Number of cells set to {cfg['n_cells']}") + cfg["pings_per_ensemble"] = fd.read_ui16(1) + # Check if cell size has changed + cs = fd.read_ui16(1) * 0.01 + if ("cell_size" not in cfg) or (cs != cfg["cell_size"]): + self.cs_diff = cs if "cell_size" not in cfg else (cs - cfg["cell_size"]) + cfg["cell_size"] = cs + if self._debug_level > 0: + logging.info(f"Cell size set to {cfg['cell_size']}") + cfg["blank_dist"] = fd.read_ui16(1) * 0.01 + cfg["profiling_mode"] = fd.read_ui8(1) + cfg["min_corr_threshold"] = fd.read_ui8(1) + cfg["n_code_reps"] = fd.read_ui8(1) + cfg["min_prcnt_gd"] = fd.read_ui8(1) + cfg["max_error_vel"] = fd.read_ui16(1) / 1000 + cfg["sec_between_ping_groups"] = np.sum( + np.array(fd.read_ui8(3)) * np.array([60.0, 1.0, 0.01]) + ) coord_sys = fd.read_ui8(1) - cfg['coord_sys'] = (['beam', 'inst', - 'ship', 'earth'][((coord_sys >> 3) & 3)]) - cfg['use_pitchroll'] = ['no', 'yes'][(coord_sys & 4) == 4] - cfg['use_3beam'] = ['no', 'yes'][(coord_sys & 2) == 2] - cfg['bin_mapping'] = ['no', 'yes'][(coord_sys & 1) == 1] - cfg['heading_misalign_deg'] = fd.read_i16(1) * .01 - cfg['magnetic_var_deg'] = fd.read_i16(1) * .01 - cfg['sensors_src'] = np.binary_repr(fd.read_ui8(1), 8) - cfg['sensors_avail'] = np.binary_repr(fd.read_ui8(1), 8) - cfg['bin1_dist_m'] = round(fd.read_ui16(1) * .01, 4) - cfg['transmit_pulse_m'] = fd.read_ui16(1) * .01 - cfg['water_ref_cells'] = list(fd.read_ui8(2)) # list for attrs - cfg['false_target_threshold'] = fd.read_ui8(1) + 
cfg["coord_sys"] = ["beam", "inst", "ship", "earth"][((coord_sys >> 3) & 3)] + cfg["use_pitchroll"] = ["no", "yes"][(coord_sys & 4) == 4] + cfg["use_3beam"] = ["no", "yes"][(coord_sys & 2) == 2] + cfg["bin_mapping"] = ["no", "yes"][(coord_sys & 1) == 1] + cfg["heading_misalign_deg"] = fd.read_i16(1) * 0.01 + cfg["magnetic_var_deg"] = fd.read_i16(1) * 0.01 + cfg["sensors_src"] = np.binary_repr(fd.read_ui8(1), 8) + cfg["sensors_avail"] = np.binary_repr(fd.read_ui8(1), 8) + cfg["bin1_dist_m"] = round(fd.read_ui16(1) * 0.01, 4) + cfg["transmit_pulse_m"] = fd.read_ui16(1) * 0.01 + cfg["water_ref_cells"] = list(fd.read_ui8(2)) # list for attrs + cfg["false_target_threshold"] = fd.read_ui8(1) fd.seek(1, 1) - cfg['transmit_lag_m'] = fd.read_ui16(1) * .01 + cfg["transmit_lag_m"] = fd.read_ui16(1) * 0.01 self._nbyte = 40 - if cfg['prog_ver'] >= 8.14: + if cfg["prog_ver"] >= 8.14: cpu_serialnum = fd.read_ui8(8) self._nbyte += 8 - if cfg['prog_ver'] >= 8.24: - cfg['bandwidth'] = fd.read_ui16(1) + if cfg["prog_ver"] >= 8.24: + cfg["bandwidth"] = fd.read_ui16(1) self._nbyte += 2 - if cfg['prog_ver'] >= 16.05: - cfg['power_level'] = fd.read_ui8(1) + if cfg["prog_ver"] >= 16.05: + cfg["power_level"] = fd.read_ui8(1) self._nbyte += 1 - if cfg['prog_ver'] >= 16.27: + if cfg["prog_ver"] >= 16.27: # cfg['navigator_basefreqindex'] = fd.read_ui8(1) fd.seek(1, 1) - cfg['serialnum'] = fd.read_ui32(1) - cfg['beam_angle'] = fd.read_ui8(1) + cfg["serialnum"] = fd.read_ui32(1) + cfg["beam_angle"] = fd.read_ui8(1) self._nbyte += 6 self.configsize = self.f.tell() - cfgstart - if self._debug_level >= 0: - logging.info('Read Config') + if self._debug_level > -1: + logging.info("Read Config") def read_var(self, bb=False): - """ Read variable leader """ + """Read variable leader""" fd = self.f if bb: ens = self.ensembleBB @@ -818,22 +837,24 @@ def read_var(self, bb=False): ens.k += 1 ens = self.ensemble k = ens.k - self.vars_read += ['number', - 'rtc', - 'number', - 'builtin_test_fail', - 
'c_sound', - 'depth', - 'heading', - 'pitch', - 'roll', - 'salinity', - 'temp', - 'min_preping_wait', - 'heading_std', - 'pitch_std', - 'roll_std', - 'adc'] + self.vars_read += [ + "number", + "rtc", + "number", + "builtin_test_fail", + "c_sound", + "depth", + "heading", + "pitch", + "roll", + "salinity", + "temp", + "min_preping_wait", + "heading_std", + "pitch_std", + "roll_std", + "adc", + ] ens.number[k] = fd.read_ui16(1) ens.rtc[:, k] = fd.read_ui8(7) ens.number[k] += 65535 * fd.read_ui8(1) @@ -845,8 +866,7 @@ def read_var(self, bb=False): ens.roll[k] = fd.read_i16(1) * 0.01 ens.salinity[k] = fd.read_i16(1) ens.temp[k] = fd.read_i16(1) * 0.01 - ens.min_preping_wait[k] = (fd.read_ui8( - 3) * np.array([60, 1, .01])).sum() + ens.min_preping_wait[k] = (fd.read_ui8(3) * np.array([60, 1, 0.01])).sum() ens.heading_std[k] = fd.read_ui8(1) ens.pitch_std[k] = fd.read_ui8(1) * 0.1 ens.roll_std[k] = fd.read_ui8(1) * 0.1 @@ -854,45 +874,45 @@ def read_var(self, bb=False): self._nbyte = 2 + 40 cfg = self.cfg - if cfg['inst_model'].lower() == 'broadband': - if cfg['prog_ver'] >= 5.55: + if cfg["inst_model"].lower() == "broadband": + if cfg["prog_ver"] >= 5.55: fd.seek(15, 1) cent = fd.read_ui8(1) ens.rtc[:, k] = fd.read_ui8(7) ens.rtc[0, k] = ens.rtc[0, k] + cent * 100 self._nbyte += 23 - elif cfg['inst_model'].lower() == 'ocean surveyor': + elif cfg["inst_model"].lower() == "ocean surveyor": fd.seek(16, 1) # 30 bytes all set to zero, 14 read above self._nbyte += 16 - if cfg['prog_ver'] > 23: + if cfg["prog_ver"] > 23: fd.seek(2, 1) self._nbyte += 2 else: ens.error_status[k] = np.binary_repr(fd.read_ui32(1), 32) - self.vars_read += ['pressure', 'pressure_std'] + self.vars_read += ["pressure", "pressure_std"] self._nbyte += 4 - if cfg['prog_ver'] >= 8.13: + if cfg["prog_ver"] >= 8.13: # Added pressure sensor stuff in 8.13 fd.seek(2, 1) ens.pressure[k] = fd.read_ui32(1) / 1000 # dPa to dbar ens.pressure_std[k] = fd.read_ui32(1) / 1000 self._nbyte += 10 - if cfg['prog_ver'] >= 
8.24: + if cfg["prog_ver"] >= 8.24: # Spare byte added 8.24 fd.seek(1, 1) self._nbyte += 1 - if cfg['prog_ver'] >= 16.05: + if cfg["prog_ver"] >= 16.05: # Added more fields with century in clock cent = fd.read_ui8(1) ens.rtc[:, k] = fd.read_ui8(7) ens.rtc[0, k] = ens.rtc[0, k] + cent * 100 self._nbyte += 8 - if cfg['prog_ver'] >= 56: + if cfg["prog_ver"] >= 56: fd.seek(1) # lag near bottom flag self._nbyte += 1 - if self._debug_level >= 0: - logging.info('Read Var') + if self._debug_level > -1: + logging.info("Read Var") def switch_profile(self, bb): if bb == 1: @@ -900,91 +920,88 @@ def switch_profile(self, bb): cfg = self.cfgbb # Placeholder for dual profile mode # Solution for vmdas profile in bb spot (vs nb) - tag = '' + tag = "" elif bb == 2: ens = self.ensemble cfg = self.cfg - tag = '_sl' + tag = "_sl" else: ens = self.ensemble cfg = self.cfg - tag = '' + tag = "" return ens, cfg, tag def read_vel(self, bb=0): ens, cfg, tg = self.switch_profile(bb) - self.vars_read += ['vel'+tg] - n_cells = cfg['n_cells'+tg] + self.vars_read += ["vel" + tg] + n_cells = cfg["n_cells" + tg] k = ens.k - vel = np.array( - self.f.read_i16(4 * n_cells) - ).reshape((n_cells, 4)) * .001 - ens['vel'+tg][:n_cells, :, k] = vel + vel = np.array(self.f.read_i16(4 * n_cells)).reshape((n_cells, 4)) * 0.001 + ens["vel" + tg][:n_cells, :, k] = vel self._nbyte = 2 + 4 * n_cells * 2 - if self._debug_level >= 0: - logging.info('Read Vel') + if self._debug_level > -1: + logging.info("Read Vel") def read_corr(self, bb=0): ens, cfg, tg = self.switch_profile(bb) - self.vars_read += ['corr'+tg] - n_cells = cfg['n_cells'+tg] + self.vars_read += ["corr" + tg] + n_cells = cfg["n_cells" + tg] k = ens.k - ens['corr'+tg][:n_cells, :, k] = np.array( + ens["corr" + tg][:n_cells, :, k] = np.array( self.f.read_ui8(4 * n_cells) ).reshape((n_cells, 4)) self._nbyte = 2 + 4 * n_cells - if self._debug_level >= 0: - logging.info('Read Corr') + if self._debug_level > -1: + logging.info("Read Corr") def 
read_amp(self, bb=0): ens, cfg, tg = self.switch_profile(bb) - self.vars_read += ['amp'+tg] - n_cells = cfg['n_cells'+tg] + self.vars_read += ["amp" + tg] + n_cells = cfg["n_cells" + tg] k = ens.k - ens['amp'+tg][:n_cells, :, k] = np.array( + ens["amp" + tg][:n_cells, :, k] = np.array( self.f.read_ui8(4 * n_cells) ).reshape((n_cells, 4)) self._nbyte = 2 + 4 * n_cells - if self._debug_level >= 0: - logging.info('Read Amp') + if self._debug_level > -1: + logging.info("Read Amp") def read_prcnt_gd(self, bb=0): ens, cfg, tg = self.switch_profile(bb) - self.vars_read += ['prcnt_gd'+tg] - n_cells = cfg['n_cells'+tg] + self.vars_read += ["prcnt_gd" + tg] + n_cells = cfg["n_cells" + tg] - ens['prcnt_gd'+tg][:n_cells, :, ens.k] = np.array( + ens["prcnt_gd" + tg][:n_cells, :, ens.k] = np.array( self.f.read_ui8(4 * n_cells) ).reshape((n_cells, 4)) self._nbyte = 2 + 4 * n_cells - if self._debug_level >= 0: - logging.info('Read PG') + if self._debug_level > -1: + logging.info("Read PG") def read_status(self, bb=0): ens, cfg, tg = self.switch_profile(bb) - self.vars_read += ['status'+tg] - n_cells = cfg['n_cells'+tg] + self.vars_read += ["status" + tg] + n_cells = cfg["n_cells" + tg] - ens['status'+tg][:n_cells, :, ens.k] = np.array( + ens["status" + tg][:n_cells, :, ens.k] = np.array( self.f.read_ui8(4 * n_cells) ).reshape((n_cells, 4)) self._nbyte = 2 + 4 * n_cells - if self._debug_level >= 0: - logging.info('Read Status') + if self._debug_level > -1: + logging.info("Read Status") - def read_bottom(self,): - self.vars_read += ['dist_bt', 'vel_bt', 'corr_bt', 'amp_bt', - 'prcnt_gd_bt'] + def read_bottom(self): + self.vars_read += ["dist_bt", "vel_bt", "corr_bt", "amp_bt", "prcnt_gd_bt"] fd = self.f ens = self.ensemble k = ens.k cfg = self.cfg - if self._source == 2: - self.vars_read += ['latitude_gps', 'longitude_gps'] + if self._vm_source == 2: + self.vars_read += ["latitude_gps", "longitude_gps"] fd.seek(2, 1) long1 = fd.read_ui16(1) fd.seek(6, 1) @@ -998,10 +1015,9 @@ def 
read_bottom(self,): ens.corr_bt[:, k] = fd.read_ui8(4) ens.amp_bt[:, k] = fd.read_ui8(4) ens.prcnt_gd_bt[:, k] = fd.read_ui8(4) - if self._source == 2: + if self._vm_source == 2: fd.seek(2, 1) - ens.longitude_gps[k] = ( - long1 + 65536 * fd.read_ui16(1)) * self._cfac + ens.longitude_gps[k] = (long1 + 65536 * fd.read_ui16(1)) * self._cfac if ens.longitude_gps[k] > 180: ens.longitude_gps[k] = ens.longitude_gps[k] - 360 if ens.longitude_gps[k] == 0: @@ -1010,9 +1026,10 @@ def read_bottom(self,): qual = fd.read_ui8(1) if qual == 0: if self._debug_level > 0: - logging.info(' qual==%d,%f %f' % (qual, - ens.latitude_gps[k], - ens.longitude_gps[k])) + logging.info( + " qual==%d,%f %f" + % (qual, ens.latitude_gps[k], ens.longitude_gps[k]) + ) ens.latitude_gps[k] = np.NaN ens.longitude_gps[k] = np.NaN fd.seek(71 - 45 - 16 - 17, 1) @@ -1021,81 +1038,81 @@ def read_bottom(self,): # Skip reference layer data fd.seek(26, 1) self._nbyte = 2 + 68 - if cfg['prog_ver'] >= 5.3: + if cfg["prog_ver"] >= 5.3: fd.seek(7, 1) # skip to rangeMsb bytes ens.dist_bt[:, k] = ens.dist_bt[:, k] + fd.read_ui8(4) * 655.36 self._nbyte += 11 - if cfg['prog_ver'] >= 16.2 and (cfg.get('sourceprog') != 'WINRIVER'): + if cfg["prog_ver"] >= 16.2 and (cfg.get("sourceprog") != "WINRIVER"): fd.seek(4, 1) # not documented self._nbyte += 4 - if cfg['prog_ver'] >= 56.1: + if cfg["prog_ver"] >= 56.1: fd.seek(4, 1) # not documented self._nbyte += 4 - if self._debug_level >= 0: - logging.info('Read Bottom Track') + if self._debug_level > -1: + logging.info("Read Bottom Track") - def read_alt(self,): - """Read altimeter (vertical beam range) """ + def read_alt(self): + """Read altimeter (vertical beam range)""" fd = self.f ens = self.ensemble k = ens.k - self.vars_read += ['alt_dist', 'alt_rssi', 'alt_eval', 'alt_status'] + self.vars_read += ["alt_dist", "alt_rssi", "alt_eval", "alt_status"] ens.alt_eval[k] = fd.read_ui8(1) # evaluation amplitude ens.alt_rssi[k] = fd.read_ui8(1) # RSSI amplitude ens.alt_dist[k] = 
fd.read_ui32(1) / 1000 # range to surface/seafloor ens.alt_status[k] = fd.read_ui8(1) # status bit flags self._nbyte = 7 + 2 - if self._debug_level >= 0: - logging.info('Read Altimeter') + if self._debug_level > -1: + logging.info("Read Altimeter") - def read_vmdas(self,): + def read_vmdas(self): """Read VMDAS Navigation block""" fd = self.f - self.cfg['sourceprog'] = 'VMDAS' + self.cfg["sourceprog"] = "VMDAS" ens = self.ensemble k = ens.k - if self._source != 1 and self._debug_level >= 0: - logging.info(' \n***** Apparently a VMDAS file \n\n') - self._source = 1 - self.vars_read += ['time_gps', - 'clock_offset_UTC_gps', - 'latitude_gps', - 'longitude_gps', - 'avg_speed_gps', - 'avg_dir_gps', - 'speed_made_good_gps', - 'dir_made_good_gps', - 'flags_gps', - 'pitch_gps', - 'roll_gps', - 'heading_gps', - ] + if self._vm_source != 1 and self._debug_level > -1: + logging.info(" \n***** Apparently a VMDAS file \n\n") + self._vm_source = 1 + self.vars_read += [ + "time_gps", + "clock_offset_UTC_gps", + "latitude_gps", + "longitude_gps", + "avg_speed_gps", + "avg_dir_gps", + "speed_made_good_gps", + "dir_made_good_gps", + "flags_gps", + "pitch_gps", + "roll_gps", + "heading_gps", + ] # UTC date time utim = fd.read_ui8(4) date_utc = tmlib.datetime(utim[2] + utim[3] * 256, utim[1], utim[0]) # 1st lat/lon position after previous ADCP ping # This byte is in hundredths of seconds (10s of milliseconds): - utc_time_first_fix = tmlib.timedelta( - milliseconds=(int(fd.read_ui32(1) / 10))) - ens.clock_offset_UTC_gps[k] = fd.read_i32( - 1) / 1000 # "PC clock offset from UTC" in ms + utc_time_first_fix = tmlib.timedelta(milliseconds=(int(fd.read_ui32(1) / 10))) + ens.clock_offset_UTC_gps[k] = ( + fd.read_i32(1) / 1000 + ) # "PC clock offset from UTC" in ms latitude_first_gps = fd.read_i32(1) * self._cfac longitude_first_gps = fd.read_i32(1) * self._cfac # Last lat/lon position prior to current ADCP ping - utc_time_fix = tmlib.timedelta( - milliseconds=(int(fd.read_ui32(1) / 10))) + 
utc_time_fix = tmlib.timedelta(milliseconds=(int(fd.read_ui32(1) / 10))) ens.time_gps[k] = tmlib.date2epoch(date_utc + utc_time_fix)[0] ens.latitude_gps[k] = fd.read_i32(1) * self._cfac ens.longitude_gps[k] = fd.read_i32(1) * self._cfac ens.avg_speed_gps[k] = fd.read_ui16(1) / 1000 - ens.avg_dir_gps[k] = fd.read_ui16(1) * 180 / 2 ** 15 # avg true track + ens.avg_dir_gps[k] = fd.read_ui16(1) * 180 / 2**15 # avg true track fd.seek(2, 1) # avg magnetic track ens.speed_made_good_gps[k] = fd.read_ui16(1) / 1000 - ens.dir_made_good_gps[k] = fd.read_ui16(1) * 180 / 2 ** 15 + ens.dir_made_good_gps[k] = fd.read_ui16(1) * 180 / 2**15 fd.seek(2, 1) # reserved ens.flags_gps[k] = int(np.binary_repr(fd.read_ui16(1))) fd.seek(6, 1) # reserved, ADCP ensemble # @@ -1103,50 +1120,52 @@ def read_vmdas(self,): # ADCP date time utim = fd.read_ui8(4) date_adcp = tmlib.datetime(utim[0] + utim[1] * 256, utim[3], utim[2]) - time_adcp = tmlib.timedelta( - milliseconds=(int(fd.read_ui32(1) / 10))) + time_adcp = tmlib.timedelta(milliseconds=(int(fd.read_ui32(1) / 10))) - ens.pitch_gps[k] = fd.read_ui16(1) * 180 / 2 ** 15 - ens.roll_gps[k] = fd.read_ui16(1) * 180 / 2 ** 15 - ens.heading_gps[k] = fd.read_ui16(1) * 180 / 2 ** 15 + ens.pitch_gps[k] = fd.read_ui16(1) * 180 / 2**15 + ens.roll_gps[k] = fd.read_ui16(1) * 180 / 2**15 + ens.heading_gps[k] = fd.read_ui16(1) * 180 / 2**15 fd.seek(10, 1) self._nbyte = 2 + 76 - if self._debug_level >= 0: - logging.info('Read VMDAS') + if self._debug_level > -1: + logging.info("Read VMDAS") self._read_vmdas = True - def read_winriver2(self, ): + def read_winriver2(self): startpos = self.f.tell() self._winrivprob = True - self.cfg['sourceprog'] = 'WinRiver2' + self.cfg["sourceprog"] = "WinRiver2" ens = self.ensemble k = ens.k - if self._debug_level >= 0: - logging.info('Read WinRiver2') - self._source = 3 + if self._debug_level > -1: + logging.info("Read WinRiver2") + self._vm_source = 3 spid = self.f.read_ui16(1) # NMEA specific IDs if spid in [4, 104]: # 
GGA sz = self.f.read_ui16(1) dtime = self.f.read_f64(1) if sz <= 43: # If no sentence, data is still stored in nmea format - empty_gps = self.f.reads(sz-2) + empty_gps = self.f.reads(sz - 2) self.f.seek(2, 1) else: # TRDI rewrites the nmea string into their format if one is found start_string = self.f.reads(6) - if type(start_string) != str: - if self._debug_level >= 1: - logging.warning(f'Invalid GGA string found in ensemble {k},' - ' skipping...') - return 'FAIL' + if not isinstance(start_string, str): + if self._debug_level > 0: + logging.warning( + f"Invalid GGA string found in ensemble {k}," " skipping..." + ) + return "FAIL" self.f.seek(1, 1) gga_time = self.f.reads(9) - time = tmlib.timedelta(hours=int(gga_time[0:2]), - minutes=int(gga_time[2:4]), - seconds=int(gga_time[4:6]), - milliseconds=int(float(gga_time[6:])*1000)) + time = tmlib.timedelta( + hours=int(gga_time[0:2]), + minutes=int(gga_time[2:4]), + seconds=int(gga_time[4:6]), + milliseconds=int(float(gga_time[6:]) * 1000), + ) clock = self.ensemble.rtc[:, :] if clock[0, 0] < 100: clock[0, :] += defs.century @@ -1155,115 +1174,127 @@ def read_winriver2(self, ): self.f.seek(1, 1) ens.latitude_gps[k] = self.f.read_f64(1) tcNS = self.f.reads(1) # 'N' or 'S' - if tcNS == 'S': + if tcNS == "S": ens.latitude_gps[k] *= -1 ens.longitude_gps[k] = self.f.read_f64(1) tcEW = self.f.reads(1) # 'E' or 'W' - if tcEW == 'W': + if tcEW == "W": ens.longitude_gps[k] *= -1 ens.fix_gps[k] = self.f.read_ui8(1) # gps fix type/quality ens.n_sat_gps[k] = self.f.read_ui8(1) # of satellites # horizontal dilution of precision - ens.hdop_gps[k] = self.f.read_float(1) - ens.elevation_gps[k] = self.f.read_float(1) # altitude + ens.hdop_gps[k] = self.f.read_f32(1) + ens.elevation_gps[k] = self.f.read_f32(1) # altitude m = self.f.reads(1) # altitude unit, 'm' - h_geoid = self.f.read_float(1) # height of geoid + h_geoid = self.f.read_f32(1) # height of geoid m2 = self.f.reads(1) # geoid unit, 'm' - ens.rtk_age_gps[k] = 
self.f.read_float(1) + ens.rtk_age_gps[k] = self.f.read_f32(1) station_id = self.f.read_ui16(1) - self.vars_read += ['time_gps', 'longitude_gps', 'latitude_gps', 'fix_gps', - 'n_sat_gps', 'hdop_gps', 'elevation_gps', 'rtk_age_gps'] + self.vars_read += [ + "time_gps", + "longitude_gps", + "latitude_gps", + "fix_gps", + "n_sat_gps", + "hdop_gps", + "elevation_gps", + "rtk_age_gps", + ] self._nbyte = self.f.tell() - startpos + 2 elif spid in [5, 105]: # VTG sz = self.f.read_ui16(1) dtime = self.f.read_f64(1) if sz <= 22: # if no data - empty_gps = self.f.reads(sz-2) + empty_gps = self.f.reads(sz - 2) self.f.seek(2, 1) else: start_string = self.f.reads(6) - if type(start_string) != str: - if self._debug_level >= 1: - logging.warning(f'Invalid VTG string found in ensemble {k},' - ' skipping...') - return 'FAIL' + if not isinstance(start_string, str): + if self._debug_level > 0: + logging.warning( + f"Invalid VTG string found in ensemble {k}," " skipping..." + ) + return "FAIL" self.f.seek(1, 1) - true_track = self.f.read_float(1) + true_track = self.f.read_f32(1) t = self.f.reads(1) # 'T' - magn_track = self.f.read_float(1) + magn_track = self.f.read_f32(1) m = self.f.reads(1) # 'M' - speed_knot = self.f.read_float(1) + speed_knot = self.f.read_f32(1) kts = self.f.reads(1) # 'N' - speed_kph = self.f.read_float(1) + speed_kph = self.f.read_f32(1) kph = self.f.reads(1) # 'K' mode = self.f.reads(1) # knots -> m/s ens.speed_over_grnd_gps[k] = speed_knot / 1.944 ens.dir_over_grnd_gps[k] = true_track - self.vars_read += ['speed_over_grnd_gps', - 'dir_over_grnd_gps'] + self.vars_read += ["speed_over_grnd_gps", "dir_over_grnd_gps"] self._nbyte = self.f.tell() - startpos + 2 elif spid in [6, 106]: # 'DBT' depth sounder sz = self.f.read_ui16(1) dtime = self.f.read_f64(1) if sz <= 20: - empty_gps = self.f.reads(sz-2) + empty_gps = self.f.reads(sz - 2) self.f.seek(2, 1) else: start_string = self.f.reads(6) - if type(start_string) != str: - if self._debug_level >= 1: - 
logging.warning(f'Invalid DBT string found in ensemble {k},' - ' skipping...') - return 'FAIL' + if not isinstance(start_string, str): + if self._debug_level > 0: + logging.warning( + f"Invalid DBT string found in ensemble {k}," " skipping..." + ) + return "FAIL" self.f.seek(1, 1) - depth_ft = self.f.read_float(1) + depth_ft = self.f.read_f32(1) ft = self.f.reads(1) # 'f' - depth_m = self.f.read_float(1) + depth_m = self.f.read_f32(1) m = self.f.reads(1) # 'm' - depth_fathom = self.f.read_float(1) + depth_fathom = self.f.read_f32(1) f = self.f.reads(1) # 'F' ens.dist_nmea[k] = depth_m - self.vars_read += ['dist_nmea'] + self.vars_read += ["dist_nmea"] self._nbyte = self.f.tell() - startpos + 2 elif spid in [7, 107]: # 'HDT' sz = self.f.read_ui16(1) dtime = self.f.read_f64(1) if sz <= 14: - empty_gps = self.f.reads(sz-2) + empty_gps = self.f.reads(sz - 2) self.f.seek(2, 1) else: start_string = self.f.reads(6) - if type(start_string) != str: - if self._debug_level >= 1: - logging.warning(f'Invalid HDT string found in ensemble {k},' - ' skipping...') - return 'FAIL' + if not isinstance(start_string, str): + if self._debug_level > 0: + logging.warning( + f"Invalid HDT string found in ensemble {k}," " skipping..." 
+ ) + return "FAIL" self.f.seek(1, 1) ens.heading_gps[k] = self.f.read_f64(1) tt = self.f.reads(1) - self.vars_read += ['heading_gps'] + self.vars_read += ["heading_gps"] self._nbyte = self.f.tell() - startpos + 2 def read_winriver(self, nbt): self._winrivprob = True - self.cfg['sourceprog'] = 'WINRIVER' - if self._source not in [2, 3]: - if self._debug_level >= 0: - logging.warning('\n***** Apparently a WINRIVER file - ' - 'Raw NMEA data handler not yet implemented\n') - self._source = 2 + self.cfg["sourceprog"] = "WINRIVER" + if self._vm_source not in [2, 3]: + if self._debug_level > -1: + logging.warning( + "\n***** Apparently a WINRIVER file - " + "Raw NMEA data handler not yet implemented\n" + ) + self._vm_source = 2 startpos = self.f.tell() sz = self.f.read_ui16(1) - tmp = self.f.reads(sz-2) + tmp = self.f.reads(sz - 2) self._nbyte = self.f.tell() - startpos + 2 def skip_Ncol(self, n_skip=1): - self.f.seek(n_skip * self.cfg['n_cells'], 1) - self._nbyte = 2 + n_skip * self.cfg['n_cells'] + self.f.seek(n_skip * self.cfg["n_cells"], 1) + self._nbyte = 2 + n_skip * self.cfg["n_cells"] def skip_Nbyte(self, n_skip): self.f.seek(n_skip, 1) @@ -1272,76 +1303,199 @@ def skip_Nbyte(self, n_skip): def read_nocode(self, id): # Skipping bytes from codes 0340-30FC, commented if needed hxid = hex(id) - if hxid[2:4] == '30': + if hxid[2:4] == "30": logging.warning("Skipping bytes from codes 0340-30FC") # I want to count the number of 1s in the middle 4 bits # of the 2nd two bytes. 
# 60 is a 0b00111100 mask - nflds = (bin(int(hxid[3]) & 60).count('1') + - bin(int(hxid[4]) & 60).count('1')) + nflds = bin(int(hxid[3]) & 60).count("1") + bin(int(hxid[4]) & 60).count( + "1" + ) # I want to count the number of 1s in the highest # 2 bits of byte 3 # 3 is a 0b00000011 mask: - dfac = bin(int(hxid[3], 0) & 3).count('1') + dfac = bin(int(hxid[3], 0) & 3).count("1") self.skip_Nbyte(12 * nflds * dfac) else: - if self._debug_level >= 0: - logging.warning(' Unrecognized ID code: %0.4X' % id) + if self._debug_level > -1: + logging.warning(" Unrecognized ID code: %0.4X" % id) self.skip_nocode(id) def skip_nocode(self, id): # Skipping bytes if ID isn't known offsets = list(self.id_positions.values()) idx = np.where(offsets == self.id_positions[id])[0][0] - byte_len = offsets[idx+1] - offsets[idx] - 2 + byte_len = offsets[idx + 1] - offsets[idx] - 2 self.skip_Nbyte(byte_len) - if self._debug_level >= 0: + if self._debug_level > -1: logging.debug(f"Skipping ID code {id}\n") - def cleanup(self, cfg, dat): - dat['coords']['range'] = (cfg['bin1_dist_m'] + - np.arange(self.ensemble['n_cells']) * - cfg['cell_size']) + def check_offset(self, offset, readbytes): + fd = self.f + if offset != 4 and self._fixoffset == 0: + if self._debug_level > 0: + if fd.tell() == self._filesize: + logging.error( + " EOF reached unexpectedly - discarding this last ensemble\n" + ) + else: + logging.debug( + " Adjust location by {:d} (readbytes={:d},hdr['nbyte']={:d})\n".format( + offset, readbytes, self.hdr["nbyte"] + ) + ) + self._fixoffset = offset - 4 + fd.seek(4 + self._fixoffset, 1) + + def remove_end(self, iens): + dat = self.outd + if self._debug_level > 0: + logging.info(" Encountered end of file. 
Cleaning up data.") + for nm in self.vars_read: + defs._setd(dat, nm, defs._get(dat, nm)[..., :iens]) + def save_profiles(self, dat, nm, en, iens): + ds = defs._get(dat, nm) + if self.n_avg == 1: + bn = en[nm][..., 0] + else: + bn = np.nanmean(en[nm], axis=-1) + + # If n_cells has changed (RiverPro/StreamPro WinRiver transects) + if len(ds.shape) == 3: + if "_sl" in nm: + # This works here b/c the max number of surface layer cells + # is smaller than the min number of normal profile cells used. + # Extra nan cells created after this if-statement + # are trimmed off in self.cleanup. + bn = bn[: self.cfg["n_cells_sl"]] + else: + # Set bn to current ping size + bn = bn[: self.cfg["n_cells"]] + # If n_cells has increased, we also need to increment defs + if self.n_cells_diff > 0: + a = np.empty((self.n_cells_diff, ds.shape[1], ds.shape[2])) * np.nan + ds = np.append(ds, a.astype(ds.dtype), axis=0) + defs._setd(dat, nm, ds) + # If the number of cells decreases, set extra cells to nan instead of + # whatever is stuck in memory + if ds.shape[0] != bn.shape[0]: + n_cells = ds.shape[0] - bn.shape[0] + a = np.empty((n_cells, bn.shape[1])) * np.nan + bn = np.append(bn, a.astype(ds.dtype), axis=0) + + # Keep track of when the cell size changes + if self.cs_diff: + self.cs.append([iens, self.cfg["cell_size"]]) + self.cs_diff = 0 + + # Then copy the ensemble to the dataset. 
+ ds[..., iens] = bn + defs._setd(dat, nm, ds) + + return dat + + def cleanup(self, dat, cfg): + # Clean up changing cell size, if necessary + cs = np.array(self.cs) + cell_sizes = cs[:, 1] + + # If cell sizes change, depth-bin average the smaller cell sizes + if len(self.cs) > 1: + bins_to_merge = cell_sizes.max() / cell_sizes + idx_start = cs[:, 0].astype(int) + idx_end = np.append(cs[1:, 0], self._nens).astype(int) + + dv = dat["data_vars"] + for var in dv: + if (len(dv[var].shape) == 3) and ("_sl" not in var): + # Create a new NaN var to save data in + new_var = (np.zeros(dv[var].shape) * np.nan).astype(dv[var].dtype) + # For each cell size change, reshape and bin-average + for id1, id2, b in zip(idx_start, idx_end, bins_to_merge): + array = np.transpose(dv[var][..., id1:id2]) + bin_arr = np.transpose(np.mean(self.reshape(array, b), axis=-1)) + new_var[: len(bin_arr), :, id1:id2] = bin_arr + # Reset data. This often leaves nan data at farther ranges + dv[var] = new_var + + # Set cell size and range + cfg["n_cells"] = self.ensemble["n_cells"] + cfg["cell_size"] = cell_sizes.max() + dat["coords"]["range"] = ( + cfg["bin1_dist_m"] + np.arange(cfg["n_cells"]) * cfg["cell_size"] + ) + + # Save configuration data as attributes for nm in cfg: - dat['attrs'][nm] = cfg[nm] - - if 'surface_layer' in cfg: # RiverPro/StreamPro - dat['coords']['range_sl'] = (cfg['bin1_dist_m_sl'] + - np.arange(self.cfg['n_cells_sl']) * - cfg['cell_size_sl']) - # Trim surface layer profile to length - dv = dat['data_vars'] + dat["attrs"][nm] = cfg[nm] + + # Clean up surface layer profiles + if "surface_layer" in cfg: # RiverPro/StreamPro + dat["coords"]["range_sl"] = ( + cfg["bin1_dist_m_sl"] + + np.arange(0, self.n_cells_sl) * cfg["cell_size_sl"] + ) + # Trim off extra nan data + dv = dat["data_vars"] for var in dv: - if 'sl' in var: - dv[var] = dv[var][:cfg['n_cells_sl']] - dat['attrs']['rotate_vars'].append('vel_sl') + if "sl" in var: + dv[var] = dv[var][: self.n_cells_sl] + 
dat["attrs"]["rotate_vars"].append("vel_sl") + + return dat, cfg + + def reshape(self, arr, n_bin=None): + """ + Reshape the array `arr` to shape (...,n,n_bin). + """ + + out = np.zeros( + list(arr.shape[:-1]) + [int(arr.shape[-1] // n_bin), int(n_bin)], + dtype=arr.dtype, + ) + shp = out.shape + if np.mod(n_bin, 1) == 0: + # n_bin needs to be int + n_bin = int(n_bin) + # If n_bin is an integer, we can do this simply. + out[..., :n_bin] = (arr[..., : (shp[-2] * shp[-1])]).reshape(shp, order="C") + else: + inds = (np.arange(np.prod(shp[-2:])) * n_bin // int(n_bin)).astype(int) + # If there are too many indices, drop one bin + if inds[-1] >= arr.shape[-1]: + inds = inds[: -int(n_bin)] + shp[-2] -= 1 + out = out[..., 1:, :] + n_bin = int(n_bin) + out[..., :n_bin] = (arr[..., inds]).reshape(shp, order="C") + n_bin = int(n_bin) + + return out def finalize(self, dat): - """Remove the attributes from the data that were never loaded. """ + Remove the attributes from the data that were never loaded. 
+ """ + for nm in set(defs.data_defs.keys()) - self.vars_read: defs._pop(dat, nm) for nm in self.cfg: - dat['attrs'][nm] = self.cfg[nm] + dat["attrs"][nm] = self.cfg[nm] # VMDAS and WinRiver have different set sampling frequency - da = dat['attrs'] - if hasattr(da, 'sourceprog') and (da['sourceprog'].lower() in ['vmdas', 'winriver', 'winriver2']): - da['fs'] = round(np.diff(dat['coords']['time']).mean() ** -1, 2) + da = dat["attrs"] + if ("sourceprog" in da) and ( + da["sourceprog"].lower() in ["vmdas", "winriver", "winriver2"] + ): + da["fs"] = round(1 / np.median(np.diff(dat["coords"]["time"])), 2) else: - da['fs'] = (da['sec_between_ping_groups'] * - da['pings_per_ensemble']) ** (-1) - da['n_cells'] = self.ensemble['n_cells'] + da["fs"] = 1 / (da["sec_between_ping_groups"] * da["pings_per_ensemble"]) for nm in defs.data_defs: shp = defs.data_defs[nm][0] - if len(shp) and shp[0] == 'nc' and defs._in_group(dat, nm): + if len(shp) and shp[0] == "nc" and defs._in_group(dat, nm): defs._setd(dat, nm, np.swapaxes(defs._get(dat, nm), 0, 1)) - def __enter__(self,): - return self - - def __exit__(self, type, value, traceback): - self.f.close() + return dat diff --git a/mhkit/dolfyn/io/rdi_defs.py b/mhkit/dolfyn/io/rdi_defs.py index 8c65812db..a91148a53 100644 --- a/mhkit/dolfyn/io/rdi_defs.py +++ b/mhkit/dolfyn/io/rdi_defs.py @@ -1,105 +1,325 @@ import numpy as np century = 2000 -adcp_type = {4: 'Broadband', - 5: 'Broadband', - 6: 'Navigator', - 10: 'Rio Grande', - 11: 'H-ADCP', - 14: 'Ocean Surveyor', - 16: 'Workhorse', - 19: 'Navigator', - 23: 'Ocean Surveyor', - 28: 'ChannelMaster', - 31: 'StreamPro', - 34: 'Explorer', - 37: 'Navigator', - 41: 'DVS', - 43: 'Workhorse', - 44: 'RiverRay', - 47: 'SentinelV', - 50: 'Workhorse', - 51: 'Workhorse', - 52: 'Workhorse', - 53: 'Navigator', - 55: 'DVS', - 56: 'RiverPro', - 59: 'Meridian', - 61: 'Pinnacle', - 66: 'SentinelV', - 67: 'Pathfinder', - 73: 'Pioneer', - 74: 'Tasman', - 76: 'WayFinder', - 77: 'Workhorse', - 78: 
'Workhorse', - } - -data_defs = {'number': ([], 'data_vars', 'uint32', '1', 'Ensemble Number', 'number_of_observations'), - 'rtc': ([7], 'sys', 'uint16', '1', 'Real Time Clock', ''), - 'builtin_test_fail': ([], 'data_vars', 'bool', '1', 'Built-In Test Failures', ''), - 'c_sound': ([], 'data_vars', 'float32', 'm s-1', 'Speed of Sound', 'speed_of_sound_in_sea_water'), - 'depth': ([], 'data_vars', 'float32', 'm', 'Depth', 'depth'), - 'pitch': ([], 'data_vars', 'float32', 'degree', 'Pitch', 'platform_pitch'), - 'roll': ([], 'data_vars', 'float32', 'degree', 'Roll', 'platform_roll'), - 'heading': ([], 'data_vars', 'float32', 'degree', 'Heading', 'platform_orientation'), - 'temp': ([], 'data_vars', 'float32', 'degree_C', 'Temperature', 'sea_water_temperature'), - 'salinity': ([], 'data_vars', 'float32', 'psu', 'Salinity', 'sea_water_salinity'), - 'min_preping_wait': ([], 'data_vars', 'float32', 's', 'Minimum Pre-Ping Wait Time Between Measurements', ''), - 'heading_std': ([], 'data_vars', 'float32', 'degree', 'Heading Standard Deviation', ''), - 'pitch_std': ([], 'data_vars', 'float32', 'degree', 'Pitch Standard Deviation', ''), - 'roll_std': ([], 'data_vars', 'float32', 'degree', 'Roll Standard Deviation', ''), - 'adc': ([8], 'sys', 'uint8', '1', 'Analog-Digital Converter Output', ''), - 'error_status': ([], 'attrs', 'float32', '1', 'Error Status', ''), - 'pressure': ([], 'data_vars', 'float32', 'dbar', 'Pressure', 'sea_water_pressure'), - 'pressure_std': ([], 'data_vars', 'float32', 'dbar', 'Pressure Standard Deviation', ''), - 'vel': (['nc', 4], 'data_vars', 'float32', 'm s-1', 'Water Velocity', ''), - 'amp': (['nc', 4], 'data_vars', 'uint8', '1', 'Acoustic Signal Amplitude', - 'signal_intensity_from_multibeam_acoustic_doppler_velocity_sensor_in_sea_water'), - 'corr': (['nc', 4], 'data_vars', 'uint8', '1', 'Acoustic Signal Correlation', - 'beam_consistency_indicator_from_multibeam_acoustic_doppler_velocity_profiler_in_sea_water'), - 'prcnt_gd': (['nc', 4], 
'data_vars', 'uint8', '%', 'Percent Good', - 'proportion_of_acceptable_signal_returns_from_acoustic_instrument_in_sea_water'), - 'status': (['nc', 4], 'data_vars', 'float32', '1', 'Status', ''), - 'dist_bt': ([4], 'data_vars', 'float32', 'm', 'Bottom Track Measured Depth', ''), - 'vel_bt': ([4], 'data_vars', 'float32', 'm s-1', 'Platform Velocity from Bottom Track', ''), - 'corr_bt': ([4], 'data_vars', 'uint8', '1', 'Bottom Track Acoustic Signal Correlation', ''), - 'amp_bt': ([4], 'data_vars', 'uint8', '1', 'Bottom Track Acoustic Signal Amplitude', ''), - 'prcnt_gd_bt': ([4], 'data_vars', 'uint8', '%', 'Bottom Track Percent Good', ''), - 'time': ([], 'coords', 'float64', 'seconds since 1970-01-01 00:00:00', 'Time', 'time'), - 'alt_dist': ([], 'data_vars', 'float32', 'm', 'Altimeter Range', 'altimeter_range'), - 'alt_rssi': ([], 'data_vars', 'uint8', 'dB', 'Altimeter Recieved Signal Strength Indicator', ''), - 'alt_eval': ([], 'data_vars', 'uint8', 'dB', 'Altimeter Evaluation Amplitude', ''), - 'alt_status': ([], 'data_vars', 'uint8', 'bit', 'Altimeter Status', ''), - 'time_gps': ([], 'coords', 'float64', 'seconds since 1970-01-01 00:00:00', 'GPS Time', 'time'), - 'clock_offset_UTC_gps': ([], 'data_vars', 'float64', 's', 'Instrument Clock Offset from UTC', ''), - 'latitude_gps': ([], 'data_vars', 'float32', 'degrees_north', 'Latitude', 'latitude'), - 'longitude_gps': ([], 'data_vars', 'float32', 'degrees_east', 'Longitude', 'longitude'), - 'avg_speed_gps': ([], 'data_vars', 'float32', 'm s-1', 'Average Platform Speed', 'platform_speed_wrt_ground'), - 'avg_dir_gps': ([], 'data_vars', 'float32', 'degree', 'Average Platform Direction', 'platform_course'), - 'speed_made_good_gps': ([], 'data_vars', 'float32', 'm s-1', 'Platform Speed Made Good', 'platform_speed_wrt_ground'), - 'dir_made_good_gps': ([], 'data_vars', 'float32', 'degree', 'Platform Direction Made Good', 'platform_course'), - 'flags_gps': ([], 'data_vars', 'float32', 'bits', 'GPS Flags', ''), - 'fix_gps': 
([], 'data_vars', 'int8', '1', 'GPS Fix', ''), - 'n_sat_gps': ([], 'data_vars', 'int8', 'count', 'Number of Satellites', ''), - 'hdop_gps': ([], 'data_vars', 'float32', '1', 'Horizontal Dilution of Precision', ''), - 'elevation_gps': ([], 'data_vars', 'float32', 'm', 'Elevation above MLLW', ''), - 'rtk_age_gps': ([], 'data_vars', 'float32', 's', 'Age of Received Real Time Kinetic Signal', ''), - 'speed_over_grnd_gps': ([], 'data_vars', 'float32', 'm s-1', 'Platform Speed over Ground', 'platform_speed_wrt_ground'), - 'dir_over_grnd_gps': ([], 'data_vars', 'float32', 'degree', 'Platform Direction over Ground', 'platform_course'), - 'heading_gps': ([], 'data_vars', 'float32', 'degree', 'GPS Heading', 'platform_orientation'), - 'pitch_gps': ([], 'data_vars', 'float32', 'degree', 'GPS Pitch', 'platform_pitch'), - 'roll_gps': ([], 'data_vars', 'float32', 'degree', 'GPS Roll', 'platform_roll'), - 'dist_nmea': ([], 'data_vars', 'float32', 'm', 'Depth Sounder Range', ''), - 'vel_sl': (['nc', 4], 'data_vars', 'float32', 'm s-1', 'Surface Layer Water Velocity', ''), - 'corr_sl': (['nc', 4], 'data_vars', 'uint8', '1', 'Surface Layer Acoustic Signal Correlation', - 'beam_consistency_indicator_from_multibeam_acoustic_doppler_velocity_profiler_in_sea_water'), - 'amp_sl': (['nc', 4], 'data_vars', 'uint8', '1', 'Surface Layer Acoustic Signal Amplitude', - 'signal_intensity_from_multibeam_acoustic_doppler_velocity_sensor_in_sea_water'), - 'prcnt_gd_sl': (['nc', 4], 'data_vars', 'uint8', '%', 'Surface Layer Percent Good', - 'proportion_of_acceptable_signal_returns_from_acoustic_instrument_in_sea_water'), - 'status_sl': (['nc', 4], 'data_vars', 'float32', '1', 'Surface Layer Status', ''), - } +adcp_type = { + 4: "Broadband", + 5: "Broadband", + 6: "Navigator", + 10: "Rio Grande", + 11: "H-ADCP", + 14: "Ocean Surveyor", + 16: "Workhorse", + 19: "Navigator", + 23: "Ocean Surveyor", + 28: "ChannelMaster", + 31: "StreamPro", + 34: "Explorer", + 37: "Navigator", + 41: "DVS", + 43: 
"Workhorse", + 44: "RiverRay", + 47: "SentinelV", + 50: "Workhorse", + 51: "Workhorse", + 52: "Workhorse", + 53: "Navigator", + 55: "DVS", + 56: "RiverPro", + 59: "Meridian", + 61: "Pinnacle", + 66: "SentinelV", + 67: "Pathfinder", + 73: "Pioneer", + 74: "Tasman", + 76: "WayFinder", + 77: "Workhorse", + 78: "Workhorse", +} + +data_defs = { + "number": ( + [], + "data_vars", + "uint32", + "1", + "Ensemble Number", + "number_of_observations", + ), + "rtc": ([7], "sys", "uint16", "1", "Real Time Clock", ""), + "builtin_test_fail": ([], "data_vars", "bool", "1", "Built-In Test Failures", ""), + "c_sound": ( + [], + "data_vars", + "float32", + "m s-1", + "Speed of Sound", + "speed_of_sound_in_sea_water", + ), + "depth": ([], "data_vars", "float32", "m", "Depth", "depth"), + "pitch": ([], "data_vars", "float32", "degree", "Pitch", "platform_pitch"), + "roll": ([], "data_vars", "float32", "degree", "Roll", "platform_roll"), + "heading": ( + [], + "data_vars", + "float32", + "degree", + "Heading", + "platform_orientation", + ), + "temp": ( + [], + "data_vars", + "float32", + "degree_C", + "Temperature", + "sea_water_temperature", + ), + "salinity": ([], "data_vars", "float32", "psu", "Salinity", "sea_water_salinity"), + "min_preping_wait": ( + [], + "data_vars", + "float32", + "s", + "Minimum Pre-Ping Wait Time Between Measurements", + "", + ), + "heading_std": ( + [], + "data_vars", + "float32", + "degree", + "Heading Standard Deviation", + "", + ), + "pitch_std": ([], "data_vars", "float32", "degree", "Pitch Standard Deviation", ""), + "roll_std": ([], "data_vars", "float32", "degree", "Roll Standard Deviation", ""), + "adc": ([8], "sys", "uint8", "1", "Analog-Digital Converter Output", ""), + "error_status": ([], "attrs", "float32", "1", "Error Status", ""), + "pressure": ([], "data_vars", "float32", "dbar", "Pressure", "sea_water_pressure"), + "pressure_std": ( + [], + "data_vars", + "float32", + "dbar", + "Pressure Standard Deviation", + "", + ), + "vel": (["nc", 4], 
"data_vars", "float32", "m s-1", "Water Velocity", ""), + "amp": ( + ["nc", 4], + "data_vars", + "uint8", + "1", + "Acoustic Signal Amplitude", + "signal_intensity_from_multibeam_acoustic_doppler_velocity_sensor_in_sea_water", + ), + "corr": ( + ["nc", 4], + "data_vars", + "uint8", + "1", + "Acoustic Signal Correlation", + "beam_consistency_indicator_from_multibeam_acoustic_doppler_velocity_profiler_in_sea_water", + ), + "prcnt_gd": ( + ["nc", 4], + "data_vars", + "uint8", + "%", + "Percent Good", + "proportion_of_acceptable_signal_returns_from_acoustic_instrument_in_sea_water", + ), + "status": (["nc", 4], "data_vars", "float32", "1", "Status", ""), + "dist_bt": ([4], "data_vars", "float32", "m", "Bottom Track Measured Depth", ""), + "vel_bt": ( + [4], + "data_vars", + "float32", + "m s-1", + "Platform Velocity from Bottom Track", + "", + ), + "corr_bt": ( + [4], + "data_vars", + "uint8", + "1", + "Bottom Track Acoustic Signal Correlation", + "", + ), + "amp_bt": ( + [4], + "data_vars", + "uint8", + "1", + "Bottom Track Acoustic Signal Amplitude", + "", + ), + "prcnt_gd_bt": ([4], "data_vars", "uint8", "%", "Bottom Track Percent Good", ""), + "time": ( + [], + "coords", + "float64", + "seconds since 1970-01-01 00:00:00", + "Time", + "time", + ), + "alt_dist": ([], "data_vars", "float32", "m", "Altimeter Range", "altimeter_range"), + "alt_rssi": ( + [], + "data_vars", + "uint8", + "dB", + "Altimeter Recieved Signal Strength Indicator", + "", + ), + "alt_eval": ([], "data_vars", "uint8", "dB", "Altimeter Evaluation Amplitude", ""), + "alt_status": ([], "data_vars", "uint8", "bit", "Altimeter Status", ""), + "time_gps": ( + [], + "coords", + "float64", + "seconds since 1970-01-01 00:00:00", + "GPS Time", + "time", + ), + "clock_offset_UTC_gps": ( + [], + "data_vars", + "float64", + "s", + "Instrument Clock Offset from UTC", + "", + ), + "latitude_gps": ( + [], + "data_vars", + "float32", + "degrees_north", + "Latitude", + "latitude", + ), + "longitude_gps": ( + [], + 
"data_vars", + "float32", + "degrees_east", + "Longitude", + "longitude", + ), + "avg_speed_gps": ( + [], + "data_vars", + "float32", + "m s-1", + "Average Platform Speed", + "platform_speed_wrt_ground", + ), + "avg_dir_gps": ( + [], + "data_vars", + "float32", + "degree", + "Average Platform Direction", + "platform_course", + ), + "speed_made_good_gps": ( + [], + "data_vars", + "float32", + "m s-1", + "Platform Speed Made Good", + "platform_speed_wrt_ground", + ), + "dir_made_good_gps": ( + [], + "data_vars", + "float32", + "degree", + "Platform Direction Made Good", + "platform_course", + ), + "flags_gps": ([], "data_vars", "float32", "bits", "GPS Flags", ""), + "fix_gps": ([], "data_vars", "int8", "1", "GPS Fix", ""), + "n_sat_gps": ([], "data_vars", "int8", "count", "Number of Satellites", ""), + "hdop_gps": ( + [], + "data_vars", + "float32", + "1", + "Horizontal Dilution of Precision", + "", + ), + "elevation_gps": ([], "data_vars", "float32", "m", "Elevation above MLLW", ""), + "rtk_age_gps": ( + [], + "data_vars", + "float32", + "s", + "Age of Received Real Time Kinetic Signal", + "", + ), + "speed_over_grnd_gps": ( + [], + "data_vars", + "float32", + "m s-1", + "Platform Speed over Ground", + "platform_speed_wrt_ground", + ), + "dir_over_grnd_gps": ( + [], + "data_vars", + "float32", + "degree", + "Platform Direction over Ground", + "platform_course", + ), + "heading_gps": ( + [], + "data_vars", + "float32", + "degree", + "GPS Heading", + "platform_orientation", + ), + "pitch_gps": ([], "data_vars", "float32", "degree", "GPS Pitch", "platform_pitch"), + "roll_gps": ([], "data_vars", "float32", "degree", "GPS Roll", "platform_roll"), + "dist_nmea": ([], "data_vars", "float32", "m", "Depth Sounder Range", ""), + "vel_sl": ( + ["nc", 4], + "data_vars", + "float32", + "m s-1", + "Surface Layer Water Velocity", + "", + ), + "corr_sl": ( + ["nc", 4], + "data_vars", + "uint8", + "1", + "Surface Layer Acoustic Signal Correlation", + 
"beam_consistency_indicator_from_multibeam_acoustic_doppler_velocity_profiler_in_sea_water", + ), + "amp_sl": ( + ["nc", 4], + "data_vars", + "uint8", + "1", + "Surface Layer Acoustic Signal Amplitude", + "signal_intensity_from_multibeam_acoustic_doppler_velocity_sensor_in_sea_water", + ), + "prcnt_gd_sl": ( + ["nc", 4], + "data_vars", + "uint8", + "%", + "Surface Layer Percent Good", + "proportion_of_acceptable_signal_returns_from_acoustic_instrument_in_sea_water", + ), + "status_sl": (["nc", 4], "data_vars", "float32", "1", "Surface Layer Status", ""), +} def _get(dat, nm): @@ -141,21 +361,21 @@ def _idata(dat, nm, sz): long_name = data_defs[nm][4] standard_name = data_defs[nm][5] arr = np.empty(sz, dtype=dtype) - if dtype.startswith('float'): + if dtype.startswith("float"): arr[:] = np.NaN dat[group][nm] = arr - dat['units'][nm] = units - dat['long_name'][nm] = long_name + dat["units"][nm] = units + dat["long_name"][nm] = long_name if standard_name: - dat['standard_name'][nm] = standard_name + dat["standard_name"][nm] = standard_name return dat def _get_size(name, n=None, ncell=0): sz = list(data_defs[name][0]) # create a copy! 
- if 'nc' in sz: - sz.insert(sz.index('nc'), ncell) - sz.remove('nc') + if "nc" in sz: + sz.insert(sz.index("nc"), ncell) + sz.remove("nc") if n is None: return tuple(sz) return tuple(sz + [n]) @@ -168,7 +388,7 @@ def __iadd__(self, vals): return self -class _ensemble(): +class _ensemble: n_avg = 1 k = -1 # This is the counter for filling the ensemble object @@ -181,9 +401,11 @@ def __init__(self, navg, n_cells): self.n_avg = navg self.n_cells = n_cells for nm in data_defs: - setattr(self, nm, - np.zeros(_get_size(nm, n=navg, ncell=n_cells), - dtype=data_defs[nm][2])) + setattr( + self, + nm, + np.zeros(_get_size(nm, n=navg, ncell=n_cells), dtype=data_defs[nm][2]), + ) - def clean_data(self,): - self['vel'][self['vel'] == -32.768] = np.NaN + def clean_data(self): + self["vel"][self["vel"] == -32.768] = np.NaN diff --git a/mhkit/dolfyn/io/rdi_lib.py b/mhkit/dolfyn/io/rdi_lib.py index dac0b710b..df0851a0f 100644 --- a/mhkit/dolfyn/io/rdi_lib.py +++ b/mhkit/dolfyn/io/rdi_lib.py @@ -3,40 +3,40 @@ from os.path import expanduser -class bin_reader(): +class bin_reader: """ Reads binary data files. It is mostly for development purposes, to simplify learning a data file's format. Reading binary data files should minimize the number of calls to struct.unpack and file.read because many calls to these functions (i.e. using the code in this module) are slow. 
""" - _size_factor = {'B': 1, 'b': 1, 'H': 2, - 'h': 2, 'L': 4, 'l': 4, 'f': 4, 'd': 8} - _frmt = {np.uint8: 'B', np.int8: 'b', - np.uint16: 'H', np.int16: 'h', - np.uint32: 'L', np.int32: 'l', - float: 'f', np.float32: 'f', - np.double: 'd', np.float64: 'd', - } + + _size_factor = {"B": 1, "b": 1, "H": 2, "h": 2, "L": 4, "l": 4, "f": 4, "d": 8} + _frmt = { + np.uint8: "B", + np.int8: "b", + np.uint16: "H", + np.int16: "h", + np.uint32: "L", + np.int32: "l", + float: "f", + np.float32: "f", + np.double: "d", + np.float64: "d", + } @property - def pos(self,): + def pos(self): return self.f.tell() - def __enter__(self,): - return self - - def __exit__(self,): - self.close() - - def __init__(self, fname, endian='<', checksum_size=None, debug_level=0): + def __init__(self, fname, endian="<", checksum_size=None, debug_level=0): """ Default to little-endian '<'... *checksum_size* is in bytes, if it is None or False, this function does not perform checksums. """ self.endian = endian - self.f = open(expanduser(fname), 'rb') + self.f = open(expanduser(fname), "rb") self.f.seek(0, 2) self.fsize = self.tell() self.f.seek(0, 0) @@ -47,7 +47,7 @@ def __init__(self, fname, endian='<', checksum_size=None, debug_level=0): self.cs = checksum_size self.debug_level = debug_level - def checksum(self,): + def checksum(self): """ The next byte(s) are the expected checksum. Perform the checksum. 
""" @@ -55,9 +55,9 @@ def checksum(self,): cs = self.read(1, self.cs._frmt) self.cs(cs, True) else: - raise Exception('CheckSum not requested for this file') + raise Exception("CheckSum not requested for this file") - def tell(self,): + def tell(self): return self.f.tell() def seek(self, pos, rel=1): @@ -70,7 +70,7 @@ def reads(self, n): val = self.f.read(n) self.cs and self.cs.add(val) try: - val = val.decode('utf-8') + val = val.decode("utf-8") except: if self.debug_level > 5: print("ERROR DECODING: {}".format(val)) @@ -88,28 +88,25 @@ def read(self, n, frmt): return np.array(unpack(self.endian + frmt * n, val)) def read_ui8(self, n): - return self.read(n, 'B') - - def read_float(self, n): - return self.read(n, 'f') + return self.read(n, "B") - def read_double(self, n): - return self.read(n, 'd') + def read_f32(self, n): + return self.read(n, "f") - read_f32 = read_float - read_f64 = read_double + def read_f64(self, n): + return self.read(n, "d") def read_i8(self, n): - return self.read(n, 'b') + return self.read(n, "b") def read_ui16(self, n): - return self.read(n, 'H') + return self.read(n, "H") def read_i16(self, n): - return self.read(n, 'h') + return self.read(n, "h") def read_ui32(self, n): - return self.read(n, 'L') + return self.read(n, "L") def read_i32(self, n): - return self.read(n, 'l') + return self.read(n, "l") diff --git a/mhkit/dolfyn/rotate/api.py b/mhkit/dolfyn/rotate/api.py index 65a6277b1..835b170e2 100644 --- a/mhkit/dolfyn/rotate/api.py +++ b/mhkit/dolfyn/rotate/api.py @@ -9,20 +9,20 @@ # The 'rotation chain' -rc = ['beam', 'inst', 'earth', 'principal'] +rc = ["beam", "inst", "earth", "principal"] rot_module_dict = { # Nortek instruments - 'vector': r_vec, - 'awac': r_awac, - 'signature': r_sig, - 'ad2cp': r_sig, - + "vector": r_vec, + "awac": r_awac, + "signature": r_sig, + "ad2cp": r_sig, # TRDI instruments - 'rdi': r_rdi} + "rdi": r_rdi, +} -def rotate2(ds, out_frame='earth', inplace=True): +def rotate2(ds, out_frame="earth", 
inplace=True): """ Rotate a dataset to a new coordinate system. @@ -46,8 +46,8 @@ def rotate2(ds, out_frame='earth', inplace=True): ----- - This function rotates all variables in ``ds.attrs['rotate_vars']``. - - In order to rotate to the 'principal' frame, a value should exist for - ``ds.attrs['principal_heading']``. The function + - In order to rotate to the 'principal' frame, a value should exist for + ``ds.attrs['principal_heading']``. The function :func:`calc_principal_heading ` is recommended for this purpose, e.g.: @@ -62,18 +62,19 @@ def rotate2(ds, out_frame='earth', inplace=True): ds = ds.copy(deep=True) csin = ds.coord_sys.lower() - if csin == 'ship': - csin = 'inst' + if csin == "ship": + csin = "inst" # Returns True/False if head2inst_rotmat has been set/not-set. r_vec._check_inst2head_rotmat(ds) - if out_frame == 'principal' and csin != 'earth': + if out_frame == "principal" and csin != "earth": warnings.warn( "You are attempting to rotate into the 'principal' " "coordinate system, but the dataset is in the {} " "coordinate system. Be sure that 'principal_heading' is " - "defined based on the earth coordinate system.".format(csin)) + "defined based on the earth coordinate system.".format(csin) + ) rmod = None for ky in rot_module_dict: @@ -81,22 +82,26 @@ def rotate2(ds, out_frame='earth', inplace=True): rmod = rot_module_dict[ky] break if rmod is None: - raise ValueError("Rotations are not defined for " - "instrument '{}'.".format(_make_model(ds))) + raise ValueError( + "Rotations are not defined for " "instrument '{}'.".format(_make_model(ds)) + ) # Get the 'indices' of the rotation chain try: iframe_in = rc.index(csin) except ValueError: - raise Exception("The coordinate system of the input " - "dataset, '{}', is invalid." 
- .format(ds.coord_sys)) + raise Exception( + "The coordinate system of the input " + "dataset, '{}', is invalid.".format(ds.coord_sys) + ) try: iframe_out = rc.index(out_frame.lower()) except ValueError: - raise Exception("The specified output coordinate system " - "is invalid, please select one of: 'beam', 'inst', " - "'earth', 'principal'.") + raise Exception( + "The specified output coordinate system " + "is invalid, please select one of: 'beam', 'inst', " + "'earth', 'principal'." + ) if iframe_out == iframe_in: print("Data is already in the {} coordinate system".format(out_frame)) @@ -108,13 +113,13 @@ def rotate2(ds, out_frame='earth', inplace=True): while ds.coord_sys.lower() != out_frame.lower(): csin = ds.coord_sys - if csin == 'ship': - csin = 'inst' + if csin == "ship": + csin = "inst" inow = rc.index(csin) if reverse: - func = getattr(rmod, '_' + rc[inow - 1] + '2' + rc[inow]) + func = getattr(rmod, "_" + rc[inow - 1] + "2" + rc[inow]) else: - func = getattr(rmod, '_' + rc[inow] + '2' + rc[inow + 1]) + func = getattr(rmod, "_" + rc[inow] + "2" + rc[inow + 1]) ds = func(ds, reverse=reverse) if not inplace: @@ -130,7 +135,7 @@ def calc_principal_heading(vel, tidal_mode=True): vel : np.ndarray (2,...,Nt), or (3,...,Nt) The 2D or 3D velocity array (3rd-dim is ignored in this calculation) tidal_mode : bool - If true, range is set from 0 to +/-180 degrees. If false, range is 0 to + If true, range is set from 0 to +/-180 degrees. If false, range is 0 to 360 degrees. Default = True Returns @@ -165,8 +170,7 @@ def calc_principal_heading(vel, tidal_mode=True): dt = np.ma.masked_invalid(dt) # Divide the angle by 2 to remove the doubling done on the previous # line. 
- pang = np.angle( - np.nanmean(dt, -1, dtype=np.complex128)) / 2 + pang = np.angle(np.nanmean(dt, -1, dtype=np.complex128)) / 2 else: pang = np.angle(np.nanmean(dt, -1)) @@ -225,8 +229,8 @@ def set_declination(ds, declin, inplace=True): if not inplace: ds = ds.copy(deep=True) - if 'declination' in ds.attrs: - angle = declin - ds.attrs.pop('declination') + if "declination" in ds.attrs: + angle = declin - ds.attrs.pop("declination") else: angle = declin cd = np.cos(-np.deg2rad(angle)) @@ -234,28 +238,28 @@ def set_declination(ds, declin, inplace=True): # The ordering is funny here because orientmat is the # transpose of the inst->earth rotation matrix: - Rdec = np.array([[cd, -sd, 0], - [sd, cd, 0], - [0, 0, 1]]) + Rdec = np.array([[cd, -sd, 0], [sd, cd, 0], [0, 0, 1]]) - if ds.coord_sys == 'earth': + if ds.coord_sys == "earth": rotate2earth = True - rotate2(ds, 'inst', inplace=True) + rotate2(ds, "inst", inplace=True) else: rotate2earth = False - ds['orientmat'].values = np.einsum('kj...,ij->ki...', - ds['orientmat'].values, - Rdec, ) - if 'heading' in ds: - ds['heading'] += angle + ds["orientmat"].values = np.einsum( + "kj...,ij->ki...", + ds["orientmat"].values, + Rdec, + ) + if "heading" in ds: + ds["heading"] += angle if rotate2earth: - rotate2(ds, 'earth', inplace=True) - if 'principal_heading' in ds.attrs: - ds.attrs['principal_heading'] += angle + rotate2(ds, "earth", inplace=True) + if "principal_heading" in ds.attrs: + ds.attrs["principal_heading"] += angle - ds.attrs['declination'] = declin - ds.attrs['declination_in_orientmat'] = 1 # logical + ds.attrs["declination"] = declin + ds.attrs["declination_in_orientmat"] = 1 # logical if not inplace: return ds @@ -295,31 +299,32 @@ def set_inst2head_rotmat(ds, rotmat, inplace=True): if not inplace: ds = ds.copy(deep=True) - if not ds.inst_model.lower() == 'vector': - raise Exception("Setting 'inst2head_rotmat' is only supported " - "for Nortek Vector ADVs.") - if ds.get('inst2head_rotmat', None) is not None: + 
if not ds.inst_model.lower() == "vector": + raise Exception( + "Setting 'inst2head_rotmat' is only supported " "for Nortek Vector ADVs." + ) + if ds.get("inst2head_rotmat", None) is not None: raise Exception( "You are setting 'inst2head_rotmat' after it has already " - "been set. You can only set it once.") + "been set. You can only set it once." + ) csin = ds.coord_sys - if csin not in ['inst', 'beam']: - rotate2(ds, 'inst', inplace=True) + if csin not in ["inst", "beam"]: + rotate2(ds, "inst", inplace=True) - ds['inst2head_rotmat'] = xr.DataArray(np.array(rotmat), - dims=['x1', 'x2'], - coords={'x1': [1, 2, 3], - 'x2': [1, 2, 3]}) + ds["inst2head_rotmat"] = xr.DataArray( + np.array(rotmat), dims=["x1", "x2"], coords={"x1": [1, 2, 3], "x2": [1, 2, 3]} + ) - ds.attrs['inst2head_rotmat_was_set'] = 1 # logical + ds.attrs["inst2head_rotmat_was_set"] = 1 # logical # Note that there is no validation that the user doesn't # change `ds.attrs['inst2head_rotmat']` after calling this # function. - if not csin == 'beam': # csin not 'beam', then we're in inst + if not csin == "beam": # csin not 'beam', then we're in inst ds = r_vec._rotate_inst2head(ds) - if csin not in ['inst', 'beam']: + if csin not in ["inst", "beam"]: rotate2(ds, csin, inplace=True) if not inplace: diff --git a/mhkit/dolfyn/rotate/base.py b/mhkit/dolfyn/rotate/base.py index 13503e61b..d7cdef541 100644 --- a/mhkit/dolfyn/rotate/base.py +++ b/mhkit/dolfyn/rotate/base.py @@ -10,8 +10,7 @@ def _make_model(ds): The make and model of the instrument that collected the data in this data object. 
""" - return '{} {}'.format(ds.attrs['inst_make'], - ds.attrs['inst_model']).lower() + return "{} {}".format(ds.attrs["inst_make"], ds.attrs["inst_model"]).lower() def _check_rotmat_det(rotmat, thresh=1e-3): @@ -30,72 +29,81 @@ def _check_rotmat_det(rotmat, thresh=1e-3): def _check_rotate_vars(ds, rotate_vars): if rotate_vars is None: - if 'rotate_vars' in ds.attrs: + if "rotate_vars" in ds.attrs: rotate_vars = ds.rotate_vars else: - warnings.warn(" 'rotate_vars' attribute not found." - "Rotating `vel`.") - rotate_vars = ['vel'] + warnings.warn(" 'rotate_vars' attribute not found." "Rotating `vel`.") + rotate_vars = ["vel"] return rotate_vars def _set_coords(ds, ref_frame, forced=False): """ - Checks the current reference frame and adjusts xarray coords/dims + Checks the current reference frame and adjusts xarray coords/dims as necessary. Makes sure assigned dataarray coordinates match what DOLfYN is reading in. """ make = _make_model(ds) - XYZ = ['X', 'Y', 'Z'] - ENU = ['E', 'N', 'U'] + XYZ = ["X", "Y", "Z"] + ENU = ["E", "N", "U"] beam = ds.beam.values - principal = ['streamwise', 'x-stream', 'vert'] + principal = ["streamwise", "x-stream", "vert"] # check make/model - if 'rdi' in make: - inst = ['X', 'Y', 'Z', 'err'] - earth = ['E', 'N', 'U', 'err'] - princ = ['streamwise', 'x-stream', 'vert', 'err'] + if "rdi" in make: + inst = ["X", "Y", "Z", "err"] + earth = ["E", "N", "U", "err"] + princ = ["streamwise", "x-stream", "vert", "err"] - elif 'nortek' in make: - if 'signature' in make or 'ad2cp' in make: - inst = ['X', 'Y', 'Z1', 'Z2'] - earth = ['E', 'N', 'U1', 'U2'] - princ = ['streamwise', 'x-stream', 'vert1', 'vert2'] + elif "nortek" in make: + if "signature" in make or "ad2cp" in make: + inst = ["X", "Y", "Z1", "Z2"] + earth = ["E", "N", "U1", "U2"] + princ = ["streamwise", "x-stream", "vert1", "vert2"] else: # AWAC or Vector inst = XYZ earth = ENU princ = principal - orient = {'beam': beam, 'inst': inst, 'ship': inst, 'earth': earth, - 'principal': princ} - 
orientIMU = {'beam': XYZ, 'inst': XYZ, 'ship': XYZ, 'earth': ENU, - 'principal': principal} + orient = { + "beam": beam, + "inst": inst, + "ship": inst, + "earth": earth, + "principal": princ, + } + orientIMU = { + "beam": XYZ, + "inst": XYZ, + "ship": XYZ, + "earth": ENU, + "principal": principal, + } if forced: - ref_frame += '-forced' + ref_frame += "-forced" # Update 'dir' and 'dirIMU' dimensions - attrs = ds['dir'].attrs - attrs.update({'ref_frame': ref_frame}) + attrs = ds["dir"].attrs + attrs.update({"ref_frame": ref_frame}) - ds['dir'] = orient[ref_frame] - ds['dir'].attrs = attrs - if hasattr(ds, 'dirIMU'): - ds['dirIMU'] = orientIMU[ref_frame] - ds['dirIMU'].attrs = attrs + ds["dir"] = orient[ref_frame] + ds["dir"].attrs = attrs + if hasattr(ds, "dirIMU"): + ds["dirIMU"] = orientIMU[ref_frame] + ds["dirIMU"].attrs = attrs - ds.attrs['coord_sys'] = ref_frame + ds.attrs["coord_sys"] = ref_frame # These are essentially one extra line to scroll through - tag = ['', '_echo', '_bt'] + tag = ["", "_echo", "_bt"] for tg in tag: - if hasattr(ds, 'coord_sys_axes'+tg): - ds.attrs.pop('coord_sys_axes'+tg) + if hasattr(ds, "coord_sys_axes" + tg): + ds.attrs.pop("coord_sys_axes" + tg) return ds @@ -122,12 +130,12 @@ def _beam2inst(dat, reverse=False, force=False): """ if not force: - if not reverse and dat.coord_sys.lower() != 'beam': - raise ValueError('The input must be in beam coordinates.') - if reverse and dat.coord_sys != 'inst': - raise ValueError('The input must be in inst coordinates.') + if not reverse and dat.coord_sys.lower() != "beam": + raise ValueError("The input must be in beam coordinates.") + if reverse and dat.coord_sys != "inst": + raise ValueError("The input must be in inst coordinates.") - rotmat = dat['beam2inst_orientmat'] + rotmat = dat["beam2inst_orientmat"] if isinstance(force, (list, set, tuple)): # You can force a distinct set of variables to be rotated by @@ -135,16 +143,17 @@ def _beam2inst(dat, reverse=False, force=False): rotate_vars = 
force else: rotate_vars = [ - ky for ky in dat.rotate_vars if dat[ky].shape[0] == rotmat.shape[0]] + ky for ky in dat.rotate_vars if dat[ky].shape[0] == rotmat.shape[0] + ] - cs = 'inst' + cs = "inst" if reverse: # Can't use transpose because rotation is not between # orthogonal coordinate systems rotmat = inv(rotmat) - cs = 'beam' + cs = "beam" for ky in rotate_vars: - dat[ky].values = np.einsum('ij,j...->i...', rotmat, dat[ky].values) + dat[ky].values = np.einsum("ij,j...->i...", rotmat, dat[ky].values) if force: dat = _set_coords(dat, cs, forced=True) @@ -154,7 +163,7 @@ def _beam2inst(dat, reverse=False, force=False): return dat -def euler2orient(heading, pitch, roll, units='degrees'): +def euler2orient(heading, pitch, roll, units="degrees"): """ Calculate the orientation matrix from DOLfYN-defined euler angles. @@ -163,8 +172,8 @@ def euler2orient(heading, pitch, roll, units='degrees'): The matrices H, P, R are the transpose of the matrices for rotation about z, y, x as shown here https://en.wikipedia.org/wiki/Rotation_matrix. The transpose is used - because in DOLfYN the orientation matrix is organized for - rotation from EARTH --> INST, while the wiki's matrices are organized for + because in DOLfYN the orientation matrix is organized for + rotation from EARTH --> INST, while the wiki's matrices are organized for rotation from INST --> EARTH. Parameters @@ -187,7 +196,7 @@ def euler2orient(heading, pitch, roll, units='degrees'): - a "ZYX" rotation order. That is, these variables are computed assuming that rotation from the earth -> instrument frame happens by rotating around the z-axis first (heading), then rotating - around the y-axis (pitch), then rotating around the x-axis (roll). + around the y-axis (pitch), then rotating around the x-axis (roll). Note this requires matrix multiplication in the reverse order. 
- heading is defined as the direction the x-axis points, positive @@ -201,11 +210,11 @@ def euler2orient(heading, pitch, roll, units='degrees'): instrument's x-axis """ - if units.lower() == 'degrees': + if units.lower() == "degrees": pitch = np.deg2rad(pitch) roll = np.deg2rad(roll) heading = np.deg2rad(heading) - elif units.lower() == 'radians': + elif units.lower() == "radians": pass else: raise Exception("Invalid units") @@ -227,19 +236,28 @@ def euler2orient(heading, pitch, roll, units='degrees'): one = np.ones_like(sr) H = np.array( - [[ch, sh, zero], - [-sh, ch, zero], - [zero, zero, one], ]) + [ + [ch, sh, zero], + [-sh, ch, zero], + [zero, zero, one], + ] + ) P = np.array( - [[cp, zero, -sp], - [zero, one, zero], - [sp, zero, cp], ]) + [ + [cp, zero, -sp], + [zero, one, zero], + [sp, zero, cp], + ] + ) R = np.array( - [[one, zero, zero], - [zero, cr, sr], - [zero, -sr, cr], ]) + [ + [one, zero, zero], + [zero, cr, sr], + [zero, -sr, cr], + ] + ) - return np.einsum('ij...,jk...,kl...->il...', R, P, H) + return np.einsum("ij...,jk...,kl...->il...", R, P, H) def orient2euler(omat): @@ -258,18 +276,17 @@ def orient2euler(omat): positive clockwise from North (this is *opposite* the right-hand-rule around the Z-axis), range 0-360 degrees. pitch : np.ndarray - The pitch angle (degrees). Pitch is positive when the x-axis + The pitch angle (degrees). Pitch is positive when the x-axis pitches up (this is *opposite* the right-hand-rule around the Y-axis). roll : np.ndarray - The roll angle (degrees). Roll is positive according to the + The roll angle (degrees). Roll is positive according to the right-hand-rule around the instrument's x-axis. 
""" - if isinstance(omat, np.ndarray) and \ - omat.shape[:2] == (3, 3): + if isinstance(omat, np.ndarray) and omat.shape[:2] == (3, 3): pass - elif hasattr(omat, 'orientmat'): - omat = omat['orientmat'].values + elif hasattr(omat, "orientmat"): + omat = omat["orientmat"].values # Note: orientation matrix is earth->inst unless supplied by an external IMU hh = np.rad2deg(np.arctan2(omat[0, 0], omat[0, 1])) @@ -286,7 +303,7 @@ def orient2euler(omat): def quaternion2orient(quaternions): """ - Calculate orientation from Nortek AHRS quaternions, where q = [W, X, Y, Z] + Calculate orientation from Nortek AHRS quaternions, where q = [W, X, Y, Z] instead of the standard q = [X, Y, Z, W] = [q1, q2, q3, q4] Parameters @@ -305,23 +322,43 @@ def quaternion2orient(quaternions): """ omat = type(quaternions)(np.empty((3, 3, quaternions.time.size))) - omat = omat.rename({'dim_0': 'earth', 'dim_1': 'inst', 'dim_2': 'time'}) + omat = omat.rename({"dim_0": "earth", "dim_1": "inst", "dim_2": "time"}) for i in range(quaternions.time.size): - r = R.from_quat([quaternions.isel(q=1, time=i), - quaternions.isel(q=2, time=i), - quaternions.isel(q=3, time=i), - quaternions.isel(q=0, time=i)]) + r = R.from_quat( + [ + quaternions.isel(q=1, time=i), + quaternions.isel(q=2, time=i), + quaternions.isel(q=3, time=i), + quaternions.isel(q=0, time=i), + ] + ) omat[..., i] = r.as_matrix() # quaternions in inst2earth reference frame, need to rotate to earth2inst omat.values = np.rollaxis(omat.values, 1) - earth = xr.DataArray(['E', 'N', 'U'], dims=['earth'], name='earth', attrs={ - 'units': '1', 'long_name': 'Earth Reference Frame', 'coverage_content_type': 'coordinate'}) - inst = xr.DataArray(['X', 'Y', 'Z'], dims=['inst'], name='inst', attrs={ - 'units': '1', 'long_name': 'Instrument Reference Frame', 'coverage_content_type': 'coordinate'}) - return omat.assign_coords({'earth': earth, 'inst': inst, 'time': quaternions.time}) + earth = xr.DataArray( + ["E", "N", "U"], + dims=["earth"], + 
name="earth", + attrs={ + "units": "1", + "long_name": "Earth Reference Frame", + "coverage_content_type": "coordinate", + }, + ) + inst = xr.DataArray( + ["X", "Y", "Z"], + dims=["inst"], + name="inst", + attrs={ + "units": "1", + "long_name": "Instrument Reference Frame", + "coverage_content_type": "coordinate", + }, + ) + return omat.assign_coords({"earth": earth, "inst": inst, "time": quaternions.time}) def calc_tilt(pitch, roll): @@ -334,16 +371,16 @@ def calc_tilt(pitch, roll): Instrument roll in degrees pitch : numpy.ndarray or xarray.DataArray Instrument pitch in degrees - + Returns ------- tilt : numpy.ndarray Vertical inclination of the instrument in degrees """ - if 'xarray' in type(pitch).__module__: + if "xarray" in type(pitch).__module__: pitch = pitch.values - if 'xarray' in type(roll).__module__: + if "xarray" in type(roll).__module__: roll = roll.values tilt = np.arctan( diff --git a/mhkit/dolfyn/rotate/rdi.py b/mhkit/dolfyn/rotate/rdi.py index 9f58e3738..36e91c8dd 100644 --- a/mhkit/dolfyn/rotate/rdi.py +++ b/mhkit/dolfyn/rotate/rdi.py @@ -31,15 +31,16 @@ def _inst2earth(adcpo, reverse=False, rotate_vars=None, force=False): """ csin = adcpo.coord_sys.lower() - cs_allowed = ['inst', 'ship'] + cs_allowed = ["inst", "ship"] if reverse: - cs_allowed = ['earth'] + cs_allowed = ["earth"] if not force and csin not in cs_allowed: - raise ValueError("Invalid rotation for data in {}-frame " - "coordinate system.".format(csin)) + raise ValueError( + "Invalid rotation for data in {}-frame " "coordinate system.".format(csin) + ) - if 'orientmat' in adcpo: - omat = adcpo['orientmat'] + if "orientmat" in adcpo: + omat = adcpo["orientmat"] else: omat = _calc_orientmat(adcpo) @@ -52,11 +53,11 @@ def _inst2earth(adcpo, reverse=False, rotate_vars=None, force=False): # view (not a new array) rotmat = np.rollaxis(omat.data, 1) if reverse: - cs_new = 'inst' - sumstr = 'jik,j...k->i...k' + cs_new = "inst" + sumstr = "jik,j...k->i...k" else: - cs_new = 'earth' - sumstr = 
'ijk,j...k->i...k' + cs_new = "earth" + sumstr = "ijk,j...k->i...k" # Only operate on the first 3-components, b/c the 4th is err_vel for nm in rotate_vars: @@ -91,18 +92,17 @@ def _calc_beam_orientmat(theta=20, convex=True, degrees=True): c = -1 else: c = 1 - a = 1 / (2. * np.sin(theta)) - b = 1 / (4. * np.cos(theta)) - d = a / (2. ** 0.5) - return np.array([[c * a, -c * a, 0, 0], - [0, 0, -c * a, c * a], - [b, b, b, b], - [d, d, -d, -d]]) + a = 1 / (2.0 * np.sin(theta)) + b = 1 / (4.0 * np.cos(theta)) + d = a / (2.0**0.5) + return np.array( + [[c * a, -c * a, 0, 0], [0, 0, -c * a, c * a], [b, b, b, b], [d, d, -d, -d]] + ) def _calc_orientmat(adcpo): """ - Calculate the orientation matrix using the raw + Calculate the orientation matrix using the raw heading, pitch, roll values from the RDI binary file. Parameters @@ -123,12 +123,12 @@ def _calc_orientmat(adcpo): (Tilt 1) is recorded in the variable leader. P is set to 0 if the "use tilt" bit of the EX command is not set.""" - r = np.deg2rad(adcpo['roll'].values) - p = np.arctan(np.tan(np.deg2rad(adcpo['pitch'].values)) * np.cos(r)) - h = np.deg2rad(adcpo['heading'].values) + r = np.deg2rad(adcpo["roll"].values) + p = np.arctan(np.tan(np.deg2rad(adcpo["pitch"].values)) * np.cos(r)) + h = np.deg2rad(adcpo["heading"].values) - if 'rdi' in adcpo.inst_make.lower(): - if adcpo.orientation == 'up': + if "rdi" in adcpo.inst_make.lower(): + if adcpo.orientation == "up": """ ## RDI-ADCP-MANUAL (Jan 08, section 5.6 page 18) Since the roll describes the ship axes rather than the @@ -139,7 +139,7 @@ def _calc_orientmat(adcpo): to 0 if the "use tilt" bit of the EX command is not set. """ r += np.pi - if (adcpo.coord_sys == 'ship' and adcpo.use_pitchroll == 'yes'): + if adcpo.coord_sys == "ship" and adcpo.use_pitchroll == "yes": r[:] = 0 p[:] = 0 @@ -163,14 +163,29 @@ def _calc_orientmat(adcpo): # The 'orientation matrix' is the transpose of the 'rotation matrix'. 
omat = np.rollaxis(rotmat, 1) - earth = xr.DataArray(['E', 'N', 'U'], dims=['earth'], name='earth', attrs={ - 'units': '1', 'long_name': 'Earth Reference Frame', 'coverage_content_type': 'coordinate'}) - inst = xr.DataArray(['X', 'Y', 'Z'], dims=['inst'], name='inst', attrs={ - 'units': '1', 'long_name': 'Instrument Reference Frame', 'coverage_content_type': 'coordinate'}) - return xr.DataArray(omat, - coords={'earth': earth, - 'inst': inst, - 'time': adcpo.time}, - dims=['earth', 'inst', 'time'], - attrs={'units': '1', - 'long_name': 'Orientation Matrix'}) + earth = xr.DataArray( + ["E", "N", "U"], + dims=["earth"], + name="earth", + attrs={ + "units": "1", + "long_name": "Earth Reference Frame", + "coverage_content_type": "coordinate", + }, + ) + inst = xr.DataArray( + ["X", "Y", "Z"], + dims=["inst"], + name="inst", + attrs={ + "units": "1", + "long_name": "Instrument Reference Frame", + "coverage_content_type": "coordinate", + }, + ) + return xr.DataArray( + omat, + coords={"earth": earth, "inst": inst, "time": adcpo.time}, + dims=["earth", "inst", "time"], + attrs={"units": "1", "long_name": "Orientation Matrix"}, + ) diff --git a/mhkit/dolfyn/rotate/signature.py b/mhkit/dolfyn/rotate/signature.py index 8d333a136..771842842 100644 --- a/mhkit/dolfyn/rotate/signature.py +++ b/mhkit/dolfyn/rotate/signature.py @@ -22,23 +22,23 @@ def _inst2earth(adcpo, reverse=False, rotate_vars=None, force=False): The list of variables to rotate. By default this is taken from adcpo.rotate_vars. force : bool - Do not check which frame the data is in prior to performing + Do not check which frame the data is in prior to performing this rotation. 
Default = False """ if reverse: # The transpose of the rotation matrix gives the inverse # rotation, so we simply reverse the order of the einsum: - sumstr = 'jik,j...k->i...k' - cs_now = 'earth' - cs_new = 'inst' + sumstr = "jik,j...k->i...k" + cs_now = "earth" + cs_new = "inst" else: - sumstr = 'ijk,j...k->i...k' - cs_now = 'inst' - cs_new = 'earth' + sumstr = "ijk,j...k->i...k" + cs_now = "inst" + cs_new = "earth" # if ADCP is upside down - if adcpo.orientation == 'down': + if adcpo.orientation == "down": down = True else: # orientation = 'up' or 'AHRS' down = False @@ -52,14 +52,18 @@ def _inst2earth(adcpo, reverse=False, rotate_vars=None, force=False): return elif cs != cs_now: raise ValueError( - "Data must be in the '%s' frame when using this function" % - cs_now) + "Data must be in the '%s' frame when using this function" % cs_now + ) - if 'orientmat' in adcpo: - omat = adcpo['orientmat'] + if "orientmat" in adcpo: + omat = adcpo["orientmat"] else: - omat = _euler2orient(adcpo['time'], adcpo['heading'].values, adcpo['pitch'].values, - adcpo['roll'].values) + omat = _euler2orient( + adcpo["time"], + adcpo["heading"].values, + adcpo["pitch"].values, + adcpo["roll"].values, + ) # Take the transpose of the orientation to get the inst->earth rotation # matrix. @@ -67,12 +71,18 @@ def _inst2earth(adcpo, reverse=False, rotate_vars=None, force=False): _dcheck = rotb._check_rotmat_det(rmat) if not _dcheck.all(): - warnings.warn("Invalid orientation matrix (determinant != 1) at indices: {}. " - "If rotated, data at these indices will be erroneous." - .format(np.nonzero(~_dcheck)[0]), UserWarning) + warnings.warn( + "Invalid orientation matrix (determinant != 1) at indices: {}. " + "If rotated, data at these indices will be erroneous.".format( + np.nonzero(~_dcheck)[0] + ), + UserWarning, + ) # The dictionary of rotation matrices for different sized arrays. 
- rmd = {3: rmat, } + rmd = { + 3: rmat, + } # The 4-row rotation matrix assume that rows 0,1 are u,v, # and 2,3 are independent estimates of w. @@ -99,30 +109,35 @@ def _inst2earth(adcpo, reverse=False, rotate_vars=None, force=False): signIMU = np.array([1, -1, -1], ndmin=dat.ndim).T if not reverse: if n == 3: - dat = np.einsum(sumstr, rmd[3], signIMU*dat) + dat = np.einsum(sumstr, rmd[3], signIMU * dat) elif n == 4: - dat = np.einsum('ijk,j...k->i...k', rmd[4], sign*dat) + dat = np.einsum("ijk,j...k->i...k", rmd[4], sign * dat) else: - raise Exception("The entry {} is not a vector, it cannot" - "be rotated.".format(nm)) + raise Exception( + "The entry {} is not a vector, it cannot" + "be rotated.".format(nm) + ) elif reverse: if n == 3: - dat = signIMU*np.einsum(sumstr, rmd[3], dat) + dat = signIMU * np.einsum(sumstr, rmd[3], dat) elif n == 4: - dat = sign*np.einsum('ijk,j...k->i...k', rmd[4], dat) + dat = sign * np.einsum("ijk,j...k->i...k", rmd[4], dat) else: - raise Exception("The entry {} is not a vector, it cannot" - "be rotated.".format(nm)) + raise Exception( + "The entry {} is not a vector, it cannot" + "be rotated.".format(nm) + ) else: # 'up' and AHRS if n == 3: dat = np.einsum(sumstr, rmd[3], dat) elif n == 4: - dat = np.einsum('ijk,j...k->i...k', rmd[4], dat) + dat = np.einsum("ijk,j...k->i...k", rmd[4], dat) else: - raise Exception("The entry {} is not a vector, it cannot" - "be rotated.".format(nm)) + raise Exception( + "The entry {} is not a vector, it cannot" "be rotated.".format(nm) + ) adcpo[nm].values = dat.copy() adcpo = rotb._set_coords(adcpo, cs_new) diff --git a/mhkit/dolfyn/rotate/vector.py b/mhkit/dolfyn/rotate/vector.py index bc833d7dd..3fcd856a3 100644 --- a/mhkit/dolfyn/rotate/vector.py +++ b/mhkit/dolfyn/rotate/vector.py @@ -28,28 +28,28 @@ def _beam2inst(dat, reverse=False, force=False): def _rotate_inst2head(advo, reverse=False): """ - Rotates the velocity vector from the instrument frame to the ADV probe (head) frame or + Rotates 
the velocity vector from the instrument frame to the ADV probe (head) frame or vice versa. - This function uses the rotation matrix 'inst2head_rotmat' to rotate the velocity vector 'vel' - from the instrument frame to the head frame ('inst->head') or from the head frame to the + This function uses the rotation matrix 'inst2head_rotmat' to rotate the velocity vector 'vel' + from the instrument frame to the head frame ('inst->head') or from the head frame to the instrument frame ('head->inst'). Parameters ---------- advo: dict - A dictionary-like object that includes the rotation matrix 'inst2head_rotmat' + A dictionary-like object that includes the rotation matrix 'inst2head_rotmat' and the velocity vector 'vel' to be rotated. reverse: bool, optional - A boolean value indicating the direction of the rotation. - If False (default), the function rotates 'vel' from the instrument frame to the head frame. + A boolean value indicating the direction of the rotation. + If False (default), the function rotates 'vel' from the instrument frame to the head frame. If True, the function rotates 'vel' from the head frame to the instrument frame. Returns ------- advo: dict - The input dictionary-like object with the rotated velocity vector. + The input dictionary-like object with the rotated velocity vector. If 'inst2head_rotmat' doesn't exist in 'advo', the function returns the input 'advo' unmodified. """ @@ -57,9 +57,9 @@ def _rotate_inst2head(advo, reverse=False): # This object doesn't have a head2inst_rotmat, so we do nothing. 
return advo if reverse: # head->inst - advo['vel'].values = np.dot(advo['inst2head_rotmat'].T, advo['vel']) + advo["vel"].values = np.dot(advo["inst2head_rotmat"].T, advo["vel"]) else: # inst->head - advo['vel'].values = np.dot(advo['inst2head_rotmat'], advo['vel']) + advo["vel"].values = np.dot(advo["inst2head_rotmat"], advo["vel"]) return advo @@ -80,12 +80,14 @@ def _check_inst2head_rotmat(advo): Returns True if 'inst2head_rotmat' exists, was set correctly, and is valid (False if not). """ - if advo.get('inst2head_rotmat', None) is None: + if advo.get("inst2head_rotmat", None) is None: # This is the default value, and we do nothing. return False if not advo.inst2head_rotmat_was_set: - raise Exception("The inst2head rotation matrix exists in props, " - "but it was not set using `set_inst2head_rotmat.") + raise Exception( + "The inst2head rotation matrix exists in props, " + "but it was not set using `set_inst2head_rotmat." + ) if not rotb._check_rotmat_det(advo.inst2head_rotmat.values): raise ValueError("Invalid inst2head_rotmat (determinant != 1).") return True @@ -107,20 +109,20 @@ def _inst2earth(advo, reverse=False, rotate_vars=None, force=False): The list of variables to rotate. By default this is taken from advo.attrs['rotate_vars']. force : bool - Do not check which frame the data is in prior to performing + Do not check which frame the data is in prior to performing this rotation. 
Default = False """ if reverse: # earth->inst # The transpose of the rotation matrix gives the inverse # rotation, so we simply reverse the order of the einsum: - sumstr = 'jik,j...k->i...k' - cs_now = 'earth' - cs_new = 'inst' + sumstr = "jik,j...k->i...k" + cs_now = "earth" + cs_new = "inst" else: # inst->earth - sumstr = 'ijk,j...k->i...k' - cs_now = 'inst' - cs_new = 'earth' + sumstr = "ijk,j...k->i...k" + cs_now = "inst" + cs_new = "earth" rotate_vars = rotb._check_rotate_vars(advo, rotate_vars) @@ -131,17 +133,18 @@ def _inst2earth(advo, reverse=False, rotate_vars=None, force=False): return elif cs != cs_now: raise ValueError( - "Data must be in the '%s' frame when using this function" % - cs_now) + "Data must be in the '%s' frame when using this function" % cs_now + ) - if hasattr(advo, 'orientmat'): - omat = advo['orientmat'] + if hasattr(advo, "orientmat"): + omat = advo["orientmat"] else: - if 'vector' in advo.inst_model.lower(): - orientation_down = advo['orientation_down'] + if "vector" in advo.inst_model.lower(): + orientation_down = advo["orientation_down"] - omat = _calc_omat(advo['time'], advo['heading'], advo['pitch'], - advo['roll'], orientation_down) + omat = _calc_omat( + advo["time"], advo["heading"], advo["pitch"], advo["roll"], orientation_down + ) # Take the transpose of the orientation to get the inst->earth rotation # matrix. @@ -149,15 +152,20 @@ def _inst2earth(advo, reverse=False, rotate_vars=None, force=False): _dcheck = rotb._check_rotmat_det(rmat) if not _dcheck.all(): - warnings.warn("Invalid orientation matrix (determinant != 1) at indices: {}. " - "If rotated, data at these indices will be erroneous." - .format(np.nonzero(~_dcheck)[0]), UserWarning) + warnings.warn( + "Invalid orientation matrix (determinant != 1) at indices: {}. 
" + "If rotated, data at these indices will be erroneous.".format( + np.nonzero(~_dcheck)[0] + ), + UserWarning, + ) for nm in rotate_vars: n = advo[nm].shape[0] if n != 3: - raise Exception("The entry {} is not a vector, it cannot " - "be rotated.".format(nm)) + raise Exception( + "The entry {} is not a vector, it cannot " "be rotated.".format(nm) + ) advo[nm].values = np.einsum(sumstr, rmat, advo[nm]) advo = rotb._set_coords(advo, cs_new) @@ -191,34 +199,32 @@ def _earth2principal(advo, reverse=False, rotate_vars=None): # the rest of the function) if reverse: - cs_now = 'principal' - cs_new = 'earth' + cs_now = "principal" + cs_new = "earth" else: ang *= -1 - cs_now = 'earth' - cs_new = 'principal' + cs_now = "earth" + cs_new = "principal" rotate_vars = rotb._check_rotate_vars(advo, rotate_vars) cs = advo.coord_sys.lower() if cs == cs_new: - print('Data is already in the %s coordinate system' % cs_new) + print("Data is already in the %s coordinate system" % cs_new) return elif cs != cs_now: raise ValueError( - 'Data must be in the {} frame ' - 'to use this function'.format(cs_now)) + "Data must be in the {} frame " "to use this function".format(cs_now) + ) # Calculate the rotation matrix: cp, sp = np.cos(ang), np.sin(ang) - rotmat = np.array([[cp, -sp, 0], - [sp, cp, 0], - [0, 0, 1]], dtype=np.float32) + rotmat = np.array([[cp, -sp, 0], [sp, cp, 0], [0, 0, 1]], dtype=np.float32) # Perform the rotation: for nm in rotate_vars: dat = advo[nm].values - dat[:2] = np.einsum('ij,j...->i...', rotmat[:2, :2], dat[:2]) + dat[:2] = np.einsum("ij,j...->i...", rotmat[:2, :2], dat[:2]) advo[nm].values = dat.copy() # Finalize the output. @@ -273,7 +279,7 @@ def _calc_omat(time, hh, pp, rr, orientation_down=None): return _euler2orient(time, hh, pp, rr) -def _euler2orient(time, heading, pitch, roll, units='degrees'): +def _euler2orient(time, heading, pitch, roll, units="degrees"): # For Nortek data only. # The heading, pitch, roll used here are from the Nortek binary files. 
@@ -281,7 +287,7 @@ def _euler2orient(time, heading, pitch, roll, units='degrees'): # Returns a rotation matrix that rotates earth (ENU) -> inst. # This is based on the Nortek `Transforms.m` file, available in # the refs folder. - if units.lower() == 'degrees': + if units.lower() == "degrees": pitch = np.deg2rad(pitch) roll = np.deg2rad(roll) heading = np.deg2rad(heading) @@ -291,7 +297,7 @@ def _euler2orient(time, heading, pitch, roll, units='degrees'): # This also involved swapping the sign on sh in the def of omat # below from the values provided in the Nortek Matlab script. - heading = (np.pi / 2 - heading) + heading = np.pi / 2 - heading ch = np.cos(heading) sh = np.sin(heading) @@ -313,14 +319,29 @@ def _euler2orient(time, heading, pitch, roll, units='degrees'): omat[1, 2, :] = sr * cp omat[2, 2, :] = cp * cr - earth = xr.DataArray(['E', 'N', 'U'], dims=['earth'], name='earth', attrs={ - 'units': '1', 'long_name': 'Earth Reference Frame', 'coverage_content_type': 'coordinate'}) - inst = xr.DataArray(['X', 'Y', 'Z'], dims=['inst'], name='inst', attrs={ - 'units': '1', 'long_name': 'Instrument Reference Frame', 'coverage_content_type': 'coordinate'}) - return xr.DataArray(omat, - coords={'earth': earth, - 'inst': inst, - 'time': time}, - dims=['earth', 'inst', 'time'], - attrs={'units': '1', - 'long_name': 'Orientation Matrix'}) + earth = xr.DataArray( + ["E", "N", "U"], + dims=["earth"], + name="earth", + attrs={ + "units": "1", + "long_name": "Earth Reference Frame", + "coverage_content_type": "coordinate", + }, + ) + inst = xr.DataArray( + ["X", "Y", "Z"], + dims=["inst"], + name="inst", + attrs={ + "units": "1", + "long_name": "Instrument Reference Frame", + "coverage_content_type": "coordinate", + }, + ) + return xr.DataArray( + omat, + coords={"earth": earth, "inst": inst, "time": time}, + dims=["earth", "inst", "time"], + attrs={"units": "1", "long_name": "Orientation Matrix"}, + ) diff --git a/mhkit/dolfyn/time.py b/mhkit/dolfyn/time.py index 
576c395d1..ed25b23a5 100644 --- a/mhkit/dolfyn/time.py +++ b/mhkit/dolfyn/time.py @@ -12,7 +12,7 @@ def _fullyear(year): def epoch2dt64(ep_time): """ - Convert from epoch time (seconds since 1/1/1970 00:00:00) to + Convert from epoch time (seconds since 1/1/1970 00:00:00) to numpy.datetime64 array Parameters @@ -27,14 +27,14 @@ def epoch2dt64(ep_time): """ # assumes t0=1970-01-01 00:00:00 - out = np.array(ep_time.astype('int')).astype('datetime64[s]') - out = out + ((ep_time % 1) * 1e9).astype('timedelta64[ns]') + out = np.array(ep_time.astype("int")).astype("datetime64[s]") + out = out + ((ep_time % 1) * 1e9).astype("timedelta64[ns]") return out def dt642epoch(dt64): """ - Convert numpy.datetime64 array to epoch time + Convert numpy.datetime64 array to epoch time (seconds since 1/1/1970 00:00:00) Parameters @@ -48,7 +48,7 @@ def dt642epoch(dt64): Epoch time (seconds since 1/1/1970 00:00:00) """ - return dt64.astype('datetime64[ns]').astype('float') / 1e9 + return dt64.astype("datetime64[ns]").astype("float") / 1e9 def date2dt64(dt): @@ -66,7 +66,7 @@ def date2dt64(dt): Single or array of datetime64 object(s) """ - return np.array(dt).astype('datetime64[ns]') + return np.array(dt).astype("datetime64[ns]") def dt642date(dt64): @@ -89,7 +89,7 @@ def dt642date(dt64): def epoch2date(ep_time, offset_hr=0, to_str=False): """ - Convert from epoch time (seconds since 1/1/1970 00:00:00) to a list + Convert from epoch time (seconds since 1/1/1970 00:00:00) to a list of datetime objects Parameters @@ -104,12 +104,12 @@ def epoch2date(ep_time, offset_hr=0, to_str=False): Returns ------- time : datetime.datetime - The converted datetime object or list(strings) + The converted datetime object or list(strings) Notes ----- The specific time instance is set during deployment, usually sync'd to the - deployment computer. The time seen by DOLfYN is in the timezone of the + deployment computer. 
The time seen by DOLfYN is in the timezone of the deployment computer, which is unknown to DOLfYN. """ @@ -161,7 +161,7 @@ def date2str(dt, format_str=None): """ if format_str is None: - format_str = '%Y-%m-%d %H:%M:%S.%f' + format_str = "%Y-%m-%d %H:%M:%S.%f" if not isinstance(dt, list): dt = [dt] @@ -208,9 +208,10 @@ def date2matlab(dt): time = list() for i in range(len(dt)): mdn = dt[i] + timedelta(days=366) - frac_seconds = (dt[i]-datetime(dt[i].year, dt[i].month, - dt[i].day, 0, 0, 0)).seconds / (24*60*60) - frac_microseconds = dt[i].microsecond / (24*60*60*1000000) + frac_seconds = ( + dt[i] - datetime(dt[i].year, dt[i].month, dt[i].day, 0, 0, 0) + ).seconds / (24 * 60 * 60) + frac_microseconds = dt[i].microsecond / (24 * 60 * 60 * 1000000) time.append(mdn.toordinal() + frac_seconds + frac_microseconds) return time @@ -238,9 +239,10 @@ def matlab2date(matlab_dn): time.append(day + dayfrac) # Datenum is precise down to 100 microseconds - add difference to round - us = int(round(time[i].microsecond/100, 0))*100 - time[i] = time[i].replace(microsecond=time[i].microsecond) + \ - timedelta(microseconds=us-time[i].microsecond) + us = int(round(time[i].microsecond / 100, 0)) * 100 + time[i] = time[i].replace(microsecond=time[i].microsecond) + timedelta( + microseconds=us - time[i].microsecond + ) return time @@ -253,7 +255,7 @@ def _fill_time_gaps(epoch, sample_rate_hz): """ # epoch is seconds since 1970 - dt = 1. 
/ sample_rate_hz + dt = 1.0 / sample_rate_hz epoch = fillgaps(epoch) if np.isnan(epoch[0]): i0 = np.nonzero(~np.isnan(epoch))[0][0] @@ -263,6 +265,6 @@ def _fill_time_gaps(epoch, sample_rate_hz): # Search backward through the array to get the 'negative index' ie = -np.nonzero(~np.isnan(epoch[::-1]))[0][0] - 1 delta = np.arange(1, -ie, 1) * dt - epoch[(ie + 1):] = epoch[ie] + delta + epoch[(ie + 1) :] = epoch[ie] + delta return epoch diff --git a/mhkit/dolfyn/tools/fft.py b/mhkit/dolfyn/tools/fft.py index 8810c78b0..7d8c08503 100644 --- a/mhkit/dolfyn/tools/fft.py +++ b/mhkit/dolfyn/tools/fft.py @@ -1,5 +1,6 @@ import numpy as np from .misc import detrend_array + fft = np.fft.fft @@ -28,16 +29,27 @@ def fft_frequency(nfft, fs, full=False): if full: return f else: - return np.abs(f[1:int(nfft / 2. + 1)]) + return np.abs(f[1 : int(nfft / 2.0 + 1)]) def _getwindow(window, nfft): - if window == 'hann': - window = np.hanning(nfft) - elif window == 'hamm': - window = np.hamming(nfft) - elif window is None or window == 1: + if window is None: + window = np.ones(nfft) + elif isinstance(window, (int, float)) and window == 1: window = np.ones(nfft) + elif isinstance(window, str): + if "hann" in window: + window = np.hanning(nfft) + elif "hamm" in window: + window = np.hamming(nfft) + else: + raise ValueError("Unsupported window type: {}".format(window)) + elif isinstance(window, np.ndarray): + if len(window) != nfft: + raise ValueError("Custom window length must be equal to nfft") + else: + raise ValueError("Invalid window parameter") + return window @@ -68,7 +80,7 @@ def _stepsize(l, nfft, nens=None, step=None): if nens is None and step is None: if l == nfft: return 0, 1, int(nfft) - nens = int(2. 
* l / nfft) + nens = int(2.0 * l / nfft) return int((l - nfft) / (nens - 1)), nens, int(nfft) elif nens is None: return int(step), int((l - nfft) / step + 1), int(nfft) @@ -78,7 +90,7 @@ def _stepsize(l, nfft, nens=None, step=None): return int((l - nfft) / (nens - 1)), int(nens), int(nfft) -def cpsd_quasisync_1D(a, b, nfft, fs, window='hann'): +def cpsd_quasisync_1D(a, b, nfft, fs, window="hann"): """ Compute the cross power spectral density (CPSD) of the signals `a` and `b`. @@ -148,21 +160,24 @@ def cpsd_quasisync_1D(a, b, nfft, fs, window='hann'): step[1], nens, nfft = _stepsize(l[1], nfft, nens=nens) fs = np.float64(fs) window = _getwindow(window, nfft) - fft_inds = slice(1, int(nfft / 2. + 1)) - wght = 2. / (window ** 2).sum() - pwr = fft(detrend_array(a[0:nfft]) * window)[fft_inds] * \ - np.conj(fft(detrend_array(b[0:nfft]) * window)[fft_inds]) + fft_inds = slice(1, int(nfft / 2.0 + 1)) + wght = 2.0 / (window**2).sum() + pwr = fft(detrend_array(a[0:nfft]) * window)[fft_inds] * np.conj( + fft(detrend_array(b[0:nfft]) * window)[fft_inds] + ) if nens - 1: - for i1, i2 in zip(range(step[0], l[0] - nfft + 1, step[0]), - range(step[1], l[1] - nfft + 1, step[1])): - pwr += fft(detrend_array(a[i1:(i1 + nfft)]) * window)[fft_inds] * \ - np.conj( - fft(detrend_array(b[i2:(i2 + nfft)]) * window)[fft_inds]) + for i1, i2 in zip( + range(step[0], l[0] - nfft + 1, step[0]), + range(step[1], l[1] - nfft + 1, step[1]), + ): + pwr += fft(detrend_array(a[i1 : (i1 + nfft)]) * window)[fft_inds] * np.conj( + fft(detrend_array(b[i2 : (i2 + nfft)]) * window)[fft_inds] + ) pwr *= wght / nens / fs return pwr -def cpsd_1D(a, b, nfft, fs, window='hann', step=None): +def cpsd_1D(a, b, nfft, fs, window="hann", step=None): """ Compute the cross power spectral density (CPSD) of the signals `a` and `b`. 
@@ -229,8 +244,8 @@ def cpsd_1D(a, b, nfft, fs, window='hann', step=None): step, nens, nfft = _stepsize(l, nfft, step=step) fs = np.float64(fs) window = _getwindow(window, nfft) - fft_inds = slice(1, int(nfft / 2. + 1)) - wght = 2. / (window ** 2).sum() + fft_inds = slice(1, int(nfft / 2.0 + 1)) + wght = 2.0 / (window**2).sum() s1 = fft(detrend_array(a[0:nfft]) * window)[fft_inds] if auto_psd: pwr = np.abs(s1) ** 2 @@ -238,18 +253,18 @@ def cpsd_1D(a, b, nfft, fs, window='hann', step=None): pwr = s1 * np.conj(fft(detrend_array(b[0:nfft]) * window)[fft_inds]) if nens - 1: for i in range(step, l - nfft + 1, step): - s1 = fft(detrend_array(a[i:(i + nfft)]) * window)[fft_inds] + s1 = fft(detrend_array(a[i : (i + nfft)]) * window)[fft_inds] if auto_psd: pwr += np.abs(s1) ** 2 else: - pwr += s1 * \ - np.conj( - fft(detrend_array(b[i:(i + nfft)]) * window)[fft_inds]) + pwr += s1 * np.conj( + fft(detrend_array(b[i : (i + nfft)]) * window)[fft_inds] + ) pwr *= wght / nens / fs return pwr -def psd_1D(a, nfft, fs, window='hann', step=None): +def psd_1D(a, nfft, fs, window="hann", step=None): """ Compute the power spectral density (PSD). @@ -286,7 +301,7 @@ def psd_1D(a, nfft, fs, window='hann', step=None): Notes ----- - Credit: This function's line of code was copied from JN's fast_psd.m + Credit: This function's line of code was copied from JN's fast_psd.m routine. 
See Also diff --git a/mhkit/dolfyn/tools/misc.py b/mhkit/dolfyn/tools/misc.py index de0400772..f97485151 100644 --- a/mhkit/dolfyn/tools/misc.py +++ b/mhkit/dolfyn/tools/misc.py @@ -50,8 +50,9 @@ def detrend_array(arr, axis=-1, in_place=False): x = np.arange(sz[axis], dtype=np.float_).reshape(sz) x -= np.nanmean(x, axis=axis, keepdims=True) arr -= np.nanmean(arr, axis=axis, keepdims=True) - b = np.nanmean((x * arr), axis=axis, keepdims=True) / \ - np.nanmean((x ** 2), axis=axis, keepdims=True) + b = np.nanmean((x * arr), axis=axis, keepdims=True) / np.nanmean( + (x**2), axis=axis, keepdims=True + ) arr -= b * x return arr @@ -82,7 +83,7 @@ def group(bl, min_length=0): if not any(bl): return np.empty(0) - vl = np.diff(bl.astype('int')) + vl = np.diff(bl.astype("int")) ups = np.nonzero(vl == 1)[0] + 1 dns = np.nonzero(vl == -1)[0] + 1 if bl[0]: @@ -95,7 +96,7 @@ def group(bl, min_length=0): dns = np.array([len(bl)]) else: dns = np.concatenate((dns, [len(bl)])) - out = np.empty(len(dns), dtype='O') + out = np.empty(len(dns), dtype="O") idx = 0 for u, d in zip(ups, dns): if d - u < min_length: @@ -134,12 +135,12 @@ def slice1d_along_axis(arr_shape, axis=0): if axis < 0: axis += nd ind = [0] * (nd - 1) - i = np.zeros(nd, 'O') + i = np.zeros(nd, "O") indlist = list(range(nd)) indlist.remove(axis) i[axis] = slice(None) itr_dims = np.asarray(arr_shape).take(indlist) - Ntot = np.product(itr_dims) + Ntot = np.prod(itr_dims) i.put(indlist, ind) k = 0 while k < Ntot: @@ -165,18 +166,18 @@ def convert_degrees(deg, tidal_mode=True): deg: float or array-like Number or array in 'degrees CCW from East' or 'degrees CW from North' tidal_mode : bool - If true, range is set from 0 to +/-180 degrees. If false, range is 0 to + If true, range is set from 0 to +/-180 degrees. If false, range is 0 to 360 degrees. 
Default = True Returns ------- out : float or array-like - Input data transformed to 'degrees CW from North' or + Input data transformed to 'degrees CW from North' or 'degrees CCW from East', respectively (based on `deg`) Notes ----- - The same algorithm is used to convert back and forth between 'CCW from E' + The same algorithm is used to convert back and forth between 'CCW from E' and 'CW from N' """ @@ -223,11 +224,10 @@ def fillgaps(a, maxgap=np.inf, dim=0, extrapFlg=False): nd = a.ndim if dim < 0: dim += nd - if (dim >= nd): - raise ValueError("dim must be less than a.ndim; dim=%d, rank=%d." - % (dim, nd)) + if dim >= nd: + raise ValueError("dim must be less than a.ndim; dim=%d, rank=%d." % (dim, nd)) ind = [0] * (nd - 1) - i = np.zeros(nd, 'O') + i = np.zeros(nd, "O") indlist = list(range(nd)) indlist.remove(dim) i[dim] = slice(None, None) @@ -238,18 +238,21 @@ def fillgaps(a, maxgap=np.inf, dim=0, extrapFlg=False): # Here we extrapolate the ends, if necessary: if extrapFlg and gd.__len__() > 0: if gd[0] != 0 and gd[0] <= maxgap: - a[:gd[0]] = a[gd[0]] + a[: gd[0]] = a[gd[0]] if gd[-1] != a.__len__() and (a.__len__() - (gd[-1] + 1)) <= maxgap: - a[gd[-1]:] = a[gd[-1]] + a[gd[-1] :] = a[gd[-1]] # Here is the main loop if gd.__len__() > 1: inds = np.nonzero((1 < np.diff(gd)) & (np.diff(gd) <= maxgap + 1))[0] for i2 in range(0, inds.__len__()): ii = list(range(gd[inds[i2]] + 1, gd[inds[i2] + 1])) - a[ii] = (np.diff(a[gd[[inds[i2], inds[i2] + 1]]]) * - (np.arange(0, ii.__len__()) + 1) / - (ii.__len__() + 1) + a[gd[inds[i2]]]).astype(a.dtype) + a[ii] = ( + np.diff(a[gd[[inds[i2], inds[i2] + 1]]]) + * (np.arange(0, ii.__len__()) + 1) + / (ii.__len__() + 1) + + a[gd[inds[i2]]] + ).astype(a.dtype) return a @@ -289,27 +292,28 @@ def interpgaps(a, t, maxgap=np.inf, dim=0, extrapFlg=False): # Here we extrapolate the ends, if necessary: if extrapFlg and gd.__len__() > 0: if gd[0] != 0 and gd[0] <= maxgap: - a[:gd[0]] = a[gd[0]] + a[: gd[0]] = a[gd[0]] if gd[-1] != 
a.__len__() and (a.__len__() - (gd[-1] + 1)) <= maxgap: - a[gd[-1]:] = a[gd[-1]] + a[gd[-1] :] = a[gd[-1]] # Here is the main loop if gd.__len__() > 1: - inds = _find((1 < np.diff(gd)) & - (np.diff(gd) <= maxgap + 1)) + inds = _find((1 < np.diff(gd)) & (np.diff(gd) <= maxgap + 1)) for i2 in range(0, inds.__len__()): ii = np.arange(gd[inds[i2]] + 1, gd[inds[i2] + 1]) - ti = (t[ii] - t[gd[inds[i2]]]) / np.diff(t[[gd[inds[i2]], - gd[inds[i2] + 1]]]) - a[ii] = (np.diff(a[gd[[inds[i2], inds[i2] + 1]]]) * ti + - a[gd[inds[i2]]]).astype(a.dtype) + ti = (t[ii] - t[gd[inds[i2]]]) / np.diff( + t[[gd[inds[i2]], gd[inds[i2] + 1]]] + ) + a[ii] = ( + np.diff(a[gd[[inds[i2], inds[i2] + 1]]]) * ti + a[gd[inds[i2]]] + ).astype(a.dtype) return a def medfiltnan(a, kernel, thresh=0): """ - Do a running median filter of the data. Regions where more than + Do a running median filter of the data. Regions where more than ``thresh`` fraction of the points are NaN are set to NaN. Parameters @@ -317,9 +321,9 @@ def medfiltnan(a, kernel, thresh=0): a : numpy.ndarray 2D array containing data to be filtered. kernel_size : numpy.ndarray or list, optional - A scalar or a list of length 2, giving the size of the median - filter window in each dimension. Elements of kernel_size should - be odd. If kernel_size is a scalar, then this scalar is used as + A scalar or a list of length 2, giving the size of the median + filter window in each dimension. Elements of kernel_size should + be odd. If kernel_size is a scalar, then this scalar is used as the size in each dimension. 
thresh : int Maximum gap in *a* to filter over @@ -344,9 +348,9 @@ def medfiltnan(a, kernel, thresh=0): kernel = [1, kernel] out = medfilt2d(a, kernel) if thresh > 0: - out[convolve2d(np.isnan(a), - np.ones(kernel) / np.prod(kernel), - 'same') > thresh] = np.NaN + out[ + convolve2d(np.isnan(a), np.ones(kernel) / np.prod(kernel), "same") > thresh + ] = np.NaN if flag_1D: return out[0] return out diff --git a/mhkit/dolfyn/velocity.py b/mhkit/dolfyn/velocity.py index 47d3a6528..24b14d375 100644 --- a/mhkit/dolfyn/velocity.py +++ b/mhkit/dolfyn/velocity.py @@ -7,13 +7,13 @@ from .tools.misc import slice1d_along_axis, convert_degrees -@xr.register_dataset_accessor('velds') # 'vel dataset' -class Velocity(): +@xr.register_dataset_accessor("velds") # 'vel dataset' +class Velocity: """ All ADCP and ADV xarray datasets wrap this base class. - The turbulence-related attributes defined within this class - assume that the ``'tke_vec'`` and ``'stress_vec'`` data entries are + The turbulence-related attributes defined within this class + assume that the ``'tke_vec'`` and ``'stress_vec'`` data entries are included in the dataset. These are typically calculated using a :class:`VelBinner` tool, but the method for calculating these variables can depend on the details of the measurement @@ -27,7 +27,7 @@ class Velocity(): ######## # Major components of the dolfyn-API - def rotate2(self, out_frame='earth', inplace=True): + def rotate2(self, out_frame="earth", inplace=True): """ Rotate the dataset to a new coordinate system. 
@@ -173,100 +173,128 @@ def __getitem__(self, key): def __contains__(self, val): return val in self.ds - def __repr__(self, ): - time_string = '{:.2f} {} (started: {})' - if ('time' not in self or dt642epoch(self['time'][0]) < 1): - time_string = '-->No Time Information!<--' + def __repr__( + self, + ): + time_string = "{:.2f} {} (started: {})" + if "time" not in self or dt642epoch(self["time"][0]) < 1: + time_string = "-->No Time Information!<--" else: - tm = self['time'][[0, -1]].values + tm = self["time"][[0, -1]].values dt = dt642date(tm[0])[0] - delta = (dt642epoch(tm[-1]) - - dt642epoch(tm[0])) / (3600 * 24) # days + delta = (dt642epoch(tm[-1]) - dt642epoch(tm[0])) / (3600 * 24) # days if delta > 1: - units = 'days' + units = "days" elif delta * 24 > 1: - units = 'hours' + units = "hours" delta *= 24 elif delta * 24 * 60 > 1: delta *= 24 * 60 - units = 'minutes' + units = "minutes" else: delta *= 24 * 3600 - units = 'seconds' + units = "seconds" try: - time_string = time_string.format(delta, units, - dt.strftime('%b %d, %Y %H:%M')) + time_string = time_string.format( + delta, units, dt.strftime("%b %d, %Y %H:%M") + ) except AttributeError: - time_string = '-->Error in time info<--' + time_string = "-->Error in time info<--" p = self.ds.attrs - t_shape = self['time'].shape + t_shape = self["time"].shape if len(t_shape) > 1: - shape_string = '({} bins, {} pings @ {}Hz)'.format( - t_shape[0], t_shape, p.get('fs')) + shape_string = "({} bins, {} pings @ {}Hz)".format( + t_shape[0], t_shape, p.get("fs") + ) else: - shape_string = '({} pings @ {}Hz)'.format( - t_shape[0], p.get('fs', '??')) - _header = ("<%s data object>: " - " %s %s\n" - " . %s\n" - " . %s-frame\n" - " . 
%s\n" % - (p.get('inst_type'), - self.ds.attrs['inst_make'], self.ds.attrs['inst_model'], - time_string, - p.get('coord_sys'), - shape_string)) - _vars = ' Variables:\n' + shape_string = "({} pings @ {}Hz)".format(t_shape[0], p.get("fs", "??")) + _header = ( + "<%s data object>: " + " %s %s\n" + " . %s\n" + " . %s-frame\n" + " . %s\n" + % ( + p.get("inst_type"), + self.ds.attrs["inst_make"], + self.ds.attrs["inst_model"], + time_string, + p.get("coord_sys"), + shape_string, + ) + ) + _vars = " Variables:\n" # Specify which variable show up in this view here. # * indicates a wildcard # This list also sets the display order. # Only the first 12 matches are displayed. - show_vars = ['time*', 'vel*', 'range', 'range_echo', - 'orientmat', 'heading', 'pitch', 'roll', - 'temp', 'press*', 'amp*', 'corr*', - 'accel', 'angrt', 'mag', 'echo', - ] + show_vars = [ + "time*", + "vel*", + "range", + "range_echo", + "orientmat", + "heading", + "pitch", + "roll", + "temp", + "press*", + "amp*", + "corr*", + "accel", + "angrt", + "mag", + "echo", + ] n = 0 for v in show_vars: if n > 12: break - if v.endswith('*'): + if v.endswith("*"): v = v[:-1] # Drop the '*' for nm in self.variables: if n > 12: break if nm.startswith(v): n += 1 - _vars += ' - {} {}\n'.format(nm, self.ds[nm].dims) + _vars += " - {} {}\n".format(nm, self.ds[nm].dims) elif v in self.ds: - _vars += ' - {} {}\n'.format(v, self.ds[v].dims) + _vars += " - {} {}\n".format(v, self.ds[v].dims) if n < len(self.variables): - _vars += ' ... and others (see `.variables`)\n' + _vars += " ... and others (see `.variables`)\n" return _header + _vars ###### # Duplicate valuable xarray properties here. 
@property - def variables(self, ): + def variables( + self, + ): """A sorted list of the variable names in the dataset.""" return sorted(self.ds.variables) @property - def attrs(self, ): + def attrs( + self, + ): """The attributes in the dataset.""" return self.ds.attrs @property - def coords(self, ): + def coords( + self, + ): """The coordinates in the dataset.""" return self.ds.coords ###### # A bunch of DOLfYN specific properties @property - def u(self,): + def u( + self, + ): """ The first velocity component. @@ -279,10 +307,12 @@ def u(self,): - earth: east - principal: streamwise """ - return self.ds['vel'][0].drop('dir') + return self.ds["vel"][0].drop("dir") @property - def v(self,): + def v( + self, + ): """ The second velocity component. @@ -295,10 +325,12 @@ def v(self,): - earth: north - principal: cross-stream """ - return self.ds['vel'][1].drop('dir') + return self.ds["vel"][1].drop("dir") @property - def w(self,): + def w( + self, + ): """ The third velocity component. @@ -311,37 +343,47 @@ def w(self,): - earth: up - principal: up """ - return self.ds['vel'][2].drop('dir') + return self.ds["vel"][2].drop("dir") @property - def U(self,): + def U( + self, + ): """Horizontal velocity as a complex quantity""" return xr.DataArray( - (self.u + self.v * 1j).astype('complex64'), - attrs={'units': 'm s-1', - 'long_name': 'Horizontal Water Velocity'}) - + (self.u + self.v * 1j).astype("complex64"), + attrs={"units": "m s-1", "long_name": "Horizontal Water Velocity"}, + ) + @property - def U_mag(self,): + def U_mag( + self, + ): """Horizontal velocity magnitude""" return xr.DataArray( - np.abs(self.U).astype('float32'), - attrs={'units': 'm s-1', - 'long_name': 'Water Speed', - 'standard_name': 'sea_water_speed'}) + np.abs(self.U).astype("float32"), + attrs={ + "units": "m s-1", + "long_name": "Water Speed", + "standard_name": "sea_water_speed", + }, + ) @property - def U_dir(self,): + def U_dir( + self, + ): """ - Angle of horizontal velocity vector. 
Direction is 'to', - as opposed to 'from'. This function calculates angle as - "degrees CCW from X/East/streamwise" and then converts it to + Angle of horizontal velocity vector. Direction is 'to', + as opposed to 'from'. This function calculates angle as + "degrees CCW from X/East/streamwise" and then converts it to "degrees CW from X/North/streamwise". """ + def convert_to_CW(angle): - if self.ds.coord_sys == 'earth': + if self.ds.coord_sys == "earth": # Convert "deg CCW from East" to "deg CW from North" [0, 360] angle = convert_degrees(angle, tidal_mode=False) relative_to = self.ds.dir[1].values @@ -353,18 +395,23 @@ def convert_to_CW(angle): return angle, relative_to # Convert from radians to degrees - angle, rel = convert_to_CW(np.angle(self.U)*(180/np.pi)) + angle, rel = convert_to_CW(np.angle(self.U) * (180 / np.pi)) return xr.DataArray( - angle.astype('float32'), + angle.astype("float32"), dims=self.U.dims, coords=self.U.coords, - attrs={'units': 'degrees_CW_from_' + str(rel), - 'long_name': 'Water Direction', - 'standard_name': 'sea_water_to_direction'}) + attrs={ + "units": "degrees_CW_from_" + str(rel), + "long_name": "Water Direction", + "standard_name": "sea_water_to_direction", + }, + ) @property - def E_coh(self,): + def E_coh( + self, + ): """ Coherent turbulent energy @@ -376,11 +423,14 @@ def E_coh(self,): E_coh = (self.upwp_**2 + self.upvp_**2 + self.vpwp_**2) ** (0.5) return xr.DataArray( - E_coh.astype('float32'), - coords={'time': self.ds['stress_vec'].time}, - dims=['time'], - attrs={'units': self.ds['stress_vec'].units, - 'long_name': 'Coherent Turbulence Energy'}) + E_coh.astype("float32"), + coords={"time": self.ds["stress_vec"].time}, + dims=["time"], + attrs={ + "units": self.ds["stress_vec"].units, + "long_name": "Coherent Turbulence Energy", + }, + ) @property def I_tke(self, thresh=0): @@ -389,14 +439,15 @@ def I_tke(self, thresh=0): Ratio of sqrt(tke) to horizontal velocity magnitude. 
""" - I_tke = np.ma.masked_where(self.U_mag < thresh, - np.sqrt(2 * self.tke) / self.U_mag) + I_tke = np.ma.masked_where( + self.U_mag < thresh, np.sqrt(2 * self.tke) / self.U_mag + ) return xr.DataArray( - I_tke.data.astype('float32'), + I_tke.data.astype("float32"), coords=self.U_mag.coords, dims=self.U_mag.dims, - attrs={'units': '% [0,1]', - 'long_name': 'TKE Intensity'}) + attrs={"units": "% [0,1]", "long_name": "TKE Intensity"}, + ) @property def I(self, thresh=0): @@ -406,61 +457,73 @@ def I(self, thresh=0): Ratio of standard deviation of horizontal velocity to horizontal velocity magnitude. """ - I = np.ma.masked_where(self.U_mag < thresh, - self.ds['U_std'] / self.U_mag) + I = np.ma.masked_where(self.U_mag < thresh, self.ds["U_std"] / self.U_mag) return xr.DataArray( - I.data.astype('float32'), + I.data.astype("float32"), coords=self.U_mag.coords, dims=self.U_mag.dims, - attrs={'units': '% [0,1]', - 'long_name': 'Turbulence Intensity'}) + attrs={"units": "% [0,1]", "long_name": "Turbulence Intensity"}, + ) @property - def tke(self,): - """Turbulent kinetic energy (sum of the three components) - """ - tke = self.ds['tke_vec'].sum('tke') / 2 - tke.name = 'TKE' - tke.attrs['units'] = self.ds['tke_vec'].units - tke.attrs['long_name'] = 'TKE' - tke.attrs['standard_name'] = 'specific_turbulent_kinetic_energy_of_sea_water' + def tke( + self, + ): + """Turbulent kinetic energy (sum of the three components)""" + tke = self.ds["tke_vec"].sum("tke") / 2 + tke.name = "TKE" + tke.attrs["units"] = self.ds["tke_vec"].units + tke.attrs["long_name"] = "TKE" + tke.attrs["standard_name"] = "specific_turbulent_kinetic_energy_of_sea_water" return tke @property - def upvp_(self,): + def upvp_( + self, + ): """u'v'bar Reynolds stress""" - return self.ds['stress_vec'].sel(tau="upvp_").drop('tau') + return self.ds["stress_vec"].sel(tau="upvp_").drop("tau") @property - def upwp_(self,): + def upwp_( + self, + ): """u'w'bar Reynolds stress""" - return 
self.ds['stress_vec'].sel(tau="upwp_").drop('tau') + return self.ds["stress_vec"].sel(tau="upwp_").drop("tau") @property - def vpwp_(self,): + def vpwp_( + self, + ): """v'w'bar Reynolds stress""" - return self.ds['stress_vec'].sel(tau="vpwp_").drop('tau') + return self.ds["stress_vec"].sel(tau="vpwp_").drop("tau") @property - def upup_(self,): + def upup_( + self, + ): """u'u'bar component of the tke""" - return self.ds['tke_vec'].sel(tke="upup_").drop('tke') + return self.ds["tke_vec"].sel(tke="upup_").drop("tke") @property - def vpvp_(self,): + def vpvp_( + self, + ): """v'v'bar component of the tke""" - return self.ds['tke_vec'].sel(tke="vpvp_").drop('tke') + return self.ds["tke_vec"].sel(tke="vpvp_").drop("tke") @property - def wpwp_(self,): + def wpwp_( + self, + ): """w'w'bar component of the tke""" - return self.ds['tke_vec'].sel(tke="wpwp_").drop('tke') + return self.ds["tke_vec"].sel(tke="wpwp_").drop("tke") class VelBinner(TimeBinner): @@ -487,38 +550,53 @@ class VelBinner(TimeBinner): # This defines how cross-spectra and stresses are computed. 
_cross_pairs = [(0, 1), (0, 2), (1, 2)] - tke = xr.DataArray(["upup_", "vpvp_", "wpwp_"], - dims=['tke'], - name='tke', - attrs={'units': '1', - 'long_name': 'Turbulent Kinetic Energy Vector Components', - 'coverage_content_type': 'coordinate'}) - - tau = xr.DataArray(["upvp_", "upwp_", "vpwp_"], - dims=['tau'], - name='tau', - attrs={'units': '1', - 'long_name': 'Reynolds Stress Vector Components', - 'coverage_content_type': 'coordinate'}) - - S = xr.DataArray(['Sxx', 'Syy', 'Szz'], - dims=['S'], - name='S', - attrs={'units': '1', - 'long_name': 'Power Spectral Density Vector Components', - 'coverage_content_type': 'coordinate'}) - - C = xr.DataArray(['Cxy', 'Cxz', 'Cyz'], - dims=['C'], - name='C', - attrs={'units': '1', - 'long_name': 'Cross-Spectral Density Vector Components', - 'coverage_content_type': 'coordinate'}) - + tke = xr.DataArray( + ["upup_", "vpvp_", "wpwp_"], + dims=["tke"], + name="tke", + attrs={ + "units": "1", + "long_name": "Turbulent Kinetic Energy Vector Components", + "coverage_content_type": "coordinate", + }, + ) + + tau = xr.DataArray( + ["upvp_", "upwp_", "vpwp_"], + dims=["tau"], + name="tau", + attrs={ + "units": "1", + "long_name": "Reynolds Stress Vector Components", + "coverage_content_type": "coordinate", + }, + ) + + S = xr.DataArray( + ["Sxx", "Syy", "Szz"], + dims=["S"], + name="S", + attrs={ + "units": "1", + "long_name": "Power Spectral Density Vector Components", + "coverage_content_type": "coordinate", + }, + ) + + C = xr.DataArray( + ["Cxy", "Cxz", "Cyz"], + dims=["C"], + name="C", + attrs={ + "units": "1", + "long_name": "Cross-Spectral Density Vector Components", + "coverage_content_type": "coordinate", + }, + ) def bin_average(self, raw_ds, out_ds=None, names=None): """ - Bin the dataset and calculate the ensemble averages of each + Bin the dataset and calculate the ensemble averages of each variable. 
Parameters @@ -559,36 +637,42 @@ def bin_average(self, raw_ds, out_ds=None, names=None): for ky in names: # set up dimensions and coordinates for Dataset dims_list = raw_ds[ky].dims + if any([ar for ar in dims_list if "altraw" in ar]): + continue coords_dict = {} for nm in dims_list: - if 'time' in nm: + if "time" in nm: coords_dict[nm] = self.mean(raw_ds[ky][nm].values) else: coords_dict[nm] = raw_ds[ky][nm].values # create Dataset - if 'ensemble' not in ky: + if "ensemble" not in ky: try: # variables with time coordinate - out_ds[ky] = xr.DataArray(self.mean(raw_ds[ky].values), - coords=coords_dict, - dims=dims_list, - attrs=raw_ds[ky].attrs - ).astype('float32') + out_ds[ky] = xr.DataArray( + self.mean(raw_ds[ky].values), + coords=coords_dict, + dims=dims_list, + attrs=raw_ds[ky].attrs, + ).astype("float32") except: # variables not needing averaging pass # Add standard deviation std = self.standard_deviation(raw_ds.velds.U_mag.values) - out_ds['U_std'] = xr.DataArray( - std.astype('float32'), + out_ds["U_std"] = xr.DataArray( + std.astype("float32"), dims=raw_ds.vel.dims[1:], - attrs={'units': 'm s-1', - 'long_name': 'Water Velocity Standard Deviation'}) + attrs={ + "units": "m s-1", + "long_name": "Water Velocity Standard Deviation", + }, + ) return out_ds - def bin_variance(self, raw_ds, out_ds=None, names=None, suffix='_var'): + def bin_variance(self, raw_ds, out_ds=None, names=None, suffix="_var"): """ - Bin the dataset and calculate the ensemble variances of each + Bin the dataset and calculate the ensemble variances of each variable. Complementary to `bin_average()`. 
Parameters @@ -630,21 +714,24 @@ def bin_variance(self, raw_ds, out_ds=None, names=None, suffix='_var'): for ky in names: # set up dimensions and coordinates for dataarray dims_list = raw_ds[ky].dims + if any([ar for ar in dims_list if "altraw" in ar]): + continue coords_dict = {} for nm in dims_list: - if 'time' in nm: + if "time" in nm: coords_dict[nm] = self.mean(raw_ds[ky][nm].values) else: coords_dict[nm] = raw_ds[ky][nm].values # create Dataset - if 'ensemble' not in ky: + if "ensemble" not in ky: try: # variables with time coordinate - out_ds[ky+suffix] = xr.DataArray(self.variance(raw_ds[ky].values), - coords=coords_dict, - dims=dims_list, - attrs=raw_ds[ky].attrs - ).astype('float32') + out_ds[ky + suffix] = xr.DataArray( + self.variance(raw_ds[ky].values), + coords=coords_dict, + dims=dims_list, + attrs=raw_ds[ky].attrs, + ).astype("float32") except: # variables not needing averaging pass @@ -680,17 +767,18 @@ def autocovariance(self, veldat, n_bin=None): indat = veldat.values n_bin = self._parse_nbin(n_bin) - out = np.empty(self._outshape(indat.shape, n_bin=n_bin)[:-1] + - [int(n_bin // 4)], dtype=indat.dtype) + out = np.empty( + self._outshape(indat.shape, n_bin=n_bin)[:-1] + [int(n_bin // 4)], + dtype=indat.dtype, + ) dt1 = self.reshape(indat, n_pad=n_bin / 2 - 2) # Here we de-mean only on the 'valid' range: - dt1 = dt1 - dt1[..., :, int(n_bin // 4): - int(-n_bin // 4)].mean(-1)[..., None] + dt1 = dt1 - dt1[..., :, int(n_bin // 4) : int(-n_bin // 4)].mean(-1)[..., None] dt2 = self.demean(indat) se = slice(int(n_bin // 4) - 1, None, 1) sb = slice(int(n_bin // 4) - 1, None, -1) for slc in slice1d_along_axis(dt1.shape, -1): - tmp = np.correlate(dt1[slc], dt2[slc], 'valid') + tmp = np.correlate(dt1[slc], dt2[slc], "valid") # The zero-padding in reshape means we compute coherence # from one-sided time-series for first and last points. 
if slc[-2] == 0: @@ -703,100 +791,168 @@ def autocovariance(self, veldat, n_bin=None): dims_list, coords_dict = self._new_coords(veldat) # tack on new coordinate - dims_list.append('lag') - coords_dict['lag'] = np.arange(n_bin//4) + dims_list.append("lag") + coords_dict["lag"] = np.arange(n_bin // 4) - da = xr.DataArray(out.astype('float32'), - coords=coords_dict, - dims=dims_list,) - da['lag'].attrs['units'] = 'timestep' + da = xr.DataArray( + out.astype("float32"), + coords=coords_dict, + dims=dims_list, + ) + da["lag"].attrs["units"] = "timestep" return da + def turbulence_intensity(self, U_mag, noise=0, thresh=0, detrend=False): + """ + Calculate noise-corrected turbulence intensity. + + Parameters + ---------- + U_mag : xarray.DataArray + Raw horizontal velocity magnitude + noise : numeric + Instrument noise level in same units as velocity. Typically + found from `.turbulence.doppler_noise_level`. + Default: None. + thresh : numeric + Theshold below which TI will not be calculated + detrend : bool (default: False) + Detrend the velocity data (True), or simply de-mean it + (False), prior to computing TI. 
+ """ + + if "xarray" in type(U_mag).__module__: + U = U_mag.values + if "xarray" in type(noise).__module__: + noise = noise.values + + if detrend: + up = self.detrend(U) + else: + up = self.demean(U) + + # Take RMS and subtract noise + u_rms = np.sqrt(np.nanmean(up**2, axis=-1) - noise**2) + u_mag = self.mean(U) + + ti = np.ma.masked_where(u_mag < thresh, u_rms / u_mag) + + dims = U_mag.dims + coords = {} + for nm in U_mag.dims: + if "time" in nm: + coords[nm] = self.mean(U_mag[nm].values) + else: + coords[nm] = U_mag[nm].values + + return xr.DataArray( + ti.data.astype("float32"), + coords=coords, + dims=dims, + attrs={ + "units": "% [0,1]", + "long_name": "Turbulence Intensity", + "comment": f"TI was corrected from a noise level of {noise} m/s", + }, + ) + def turbulent_kinetic_energy(self, veldat, noise=None, detrend=True): """ - Calculate the turbulent kinetic energy (TKE) (variances + Calculate the turbulent kinetic energy (TKE) (variances of u,v,w). Parameters ---------- veldat : xarray.DataArray - Velocity data array from ADV or single beam from ADCP. + Velocity data array from ADV or single beam from ADCP. The last dimension is assumed to be time. noise : float or array-like - A vector of the noise levels of the velocity data with - the same first dimension as the velocity vector. + Instrument noise level in same units as velocity. Typically + found from `.turbulence.doppler_noise_level`. + Default: None. detrend : bool (default: False) Detrend the velocity data (True), or simply de-mean it - (False), prior to computing tke. Note: the psd routines + (False), prior to computing TKE. Note: the PSD routines use detrend, so if you want to have the same amount of variance here as there use ``detrend=True``. 
- + Returns ------- tke_vec : xarray.DataArray dataArray containing u'u'_, v'v'_ and w'w'_ """ - if 'xarray' in type(veldat).__module__: + if "xarray" in type(veldat).__module__: vel = veldat.values - if 'xarray' in type(noise).__module__: + if "xarray" in type(noise).__module__: noise = noise.values if len(np.shape(vel)) > 2: - raise ValueError("This function is only valid for calculating TKE using " - "velocity from an ADV or a single ADCP beam.") + raise ValueError( + "This function is only valid for calculating TKE using " + "velocity from an ADV or a single ADCP beam." + ) # Calc TKE if detrend: - out = np.nanmean(self.detrend(vel)**2, axis=-1) + out = np.nanmean(self.detrend(vel) ** 2, axis=-1) else: - out = np.nanmean(self.demean(vel)**2, axis=-1) + out = np.nanmean(self.demean(vel) ** 2, axis=-1) - if 'dir' in veldat.dims: + if "dir" in veldat.dims: # Subtract noise if noise is not None: if np.shape(noise)[0] != 3: raise Exception( - 'Noise should have same first dimension as velocity') + "Noise should have same first dimension as velocity" + ) out[0] -= noise[0] ** 2 out[1] -= noise[1] ** 2 out[2] -= noise[2] ** 2 # Set coords - dims = ['tke', 'time'] - coords = {'tke': self.tke, - 'time': self.mean(veldat.time.values)} + dims = ["tke", "time"] + coords = {"tke": self.tke, "time": self.mean(veldat.time.values)} else: # Subtract noise if noise is not None: if np.shape(noise) > np.shape(vel): raise Exception( - 'Noise should have same or fewer dimensions as velocity') - out -= noise ** 2 + "Noise should have same or fewer dimensions as velocity" + ) + out -= noise**2 # Set coords dims = veldat.dims coords = {} for nm in veldat.dims: - if 'time' in nm: + if "time" in nm: coords[nm] = self.mean(veldat[nm].values) else: coords[nm] = veldat[nm].values return xr.DataArray( - out.astype('float32'), + out.astype("float32"), dims=dims, coords=coords, - attrs={'units': 'm2 s-2', - 'long_name': 'TKE Vector', - 'standard_name': 
'specific_turbulent_kinetic_energy_of_sea_water'}) - - def power_spectral_density(self, veldat, - freq_units='rad/s', - fs=None, - window='hann', - noise=None, - n_bin=None, n_fft=None, n_pad=None, - step=None): + attrs={ + "units": "m2 s-2", + "long_name": "TKE Vector", + "standard_name": "specific_turbulent_kinetic_energy_of_sea_water", + }, + ) + + def power_spectral_density( + self, + veldat, + freq_units="rad/s", + fs=None, + window="hann", + noise=0, + n_bin=None, + n_fft=None, + n_pad=None, + step=None, + ): """ Calculate the power spectral density of velocity. @@ -805,17 +961,16 @@ def power_spectral_density(self, veldat, veldat : xr.DataArray The raw velocity data (of dims 'dir' and 'time'). freq_units : string - Frequency units of the returned spectra in either Hz or rad/s + Frequency units of the returned spectra in either Hz or rad/s (`f` or :math:`\\omega`) fs : float (optional) The sample rate. Default is `binner.fs` window : string or array Specify the window function. Options: 1, None, 'hann', 'hamm' - noise : float or array-like - A vector of the noise levels of the velocity data with - the same first dimension as the velocity vector. - Default = 0. + noise : numeric or array + Instrument noise level in same units as velocity. + Default: 0 (ADCP) or [0, 0, 0] (ADV). n_bin : int (optional) The bin-size. Default: from the binner. 
n_fft : int (optional) @@ -835,76 +990,93 @@ def power_spectral_density(self, veldat, fs_in = self._parse_fs(fs) n_fft = self._parse_nfft(n_fft) - if 'xarray' in type(veldat).__module__: + if "xarray" in type(veldat).__module__: vel = veldat.values - if 'xarray' in type(noise).__module__: - noise = noise.values - if ('rad' not in freq_units) and ('Hz' not in freq_units): + if ("rad" not in freq_units) and ("Hz" not in freq_units): raise ValueError("`freq_units` should be one of 'Hz' or 'rad/s'") - + # Create frequency vector, also checks whether using f or omega - if 'rad' in freq_units: - fs = 2*np.pi*fs_in - freq_units = 'rad s-1' - units = 'm2 s-1 rad-1' + if "rad" in freq_units: + fs = 2 * np.pi * fs_in + freq_units = "rad s-1" + units = "m2 s-1 rad-1" else: fs = fs_in - freq_units = 'Hz' - units = 'm2 s-2 Hz-1' - freq = xr.DataArray(self._fft_freq(fs=fs_in, units=freq_units, n_fft=n_fft), - dims=['freq'], - name='freq', - attrs={'units': freq_units, - 'long_name': 'FFT Frequency Vector', - 'coverage_content_type': 'coordinate'} - ).astype('float32') + freq_units = "Hz" + units = "m2 s-2 Hz-1" + freq = xr.DataArray( + self._fft_freq(fs=fs_in, units=freq_units, n_fft=n_fft), + dims=["freq"], + name="freq", + attrs={ + "units": freq_units, + "long_name": "FFT Frequency Vector", + "coverage_content_type": "coordinate", + }, + ).astype("float32") # Spectra, if input is full velocity or a single array - if len(vel.shape) == 2: - assert vel.shape[0] == 3, "Function can only handle 1D or 3D arrays." \ - " If ADCP data, please select a specific depth bin." - if (noise is not None) and (np.shape(noise)[0] != 3): - raise Exception( - 'Noise should have same first dimension as velocity') + if len(vel.shape) >= 2: + if vel.shape[0] != 3: + raise ValueError( + "Function can only handle 1D or 3D arrays." + " If ADCP data, please select a specific depth bin." 
+ ) + if np.array(noise).any(): + if np.size(noise) != 3: + raise ValueError("Noise is expected to be an array of 3 scalars") else: + # Reset default to list of 3 zeros noise = np.array([0, 0, 0]) - out = np.empty(self._outshape_fft(vel[:3].shape, n_fft=n_fft, n_bin=n_bin), - dtype=np.float32) + + out = np.empty( + self._outshape_fft(vel[:3].shape, n_fft=n_fft, n_bin=n_bin), + dtype=np.float32, + ) for idx in range(3): - out[idx] = self._psd_base(vel[idx], - fs=fs, - noise=noise[idx], - window=window, - n_bin=n_bin, - n_pad=n_pad, - n_fft=n_fft, - step=step) - coords = {'S': self.S, - 'time': self.mean(veldat['time'].values), - 'freq': freq} - dims = ['S', 'time', 'freq'] + out[idx] = self._psd_base( + vel[idx], + fs=fs, + noise=noise[idx], + window=window, + n_bin=n_bin, + n_pad=n_pad, + n_fft=n_fft, + step=step, + ) + coords = { + "S": self.S, + "time": self.mean(veldat["time"].values), + "freq": freq, + } + dims = ["S", "time", "freq"] else: - if (noise is not None) and (len(np.shape(noise)) > 1): - raise Exception( - 'Noise should have same first dimension as velocity') - else: - noise = np.array(0) - out = self._psd_base(vel, - fs=fs, - noise=noise, - window=window, - n_bin=n_bin, - n_pad=n_pad, - n_fft=n_fft, - step=step) - coords = {veldat.dims[-1]: self.mean(veldat[veldat.dims[-1]].values), - 'freq': freq} - dims = [veldat.dims[-1], 'freq'] + if np.array(noise).any() and np.size(noise) > 1: + raise ValueError("Noise is expected to be a scalar") + + out = self._psd_base( + vel, + fs=fs, + noise=noise, + window=window, + n_bin=n_bin, + n_pad=n_pad, + n_fft=n_fft, + step=step, + ) + coords = { + veldat.dims[-1]: self.mean(veldat[veldat.dims[-1]].values), + "freq": freq, + } + dims = [veldat.dims[-1], "freq"] return xr.DataArray( - out.astype('float32'), + out.astype("float32"), coords=coords, dims=dims, - attrs={'units': units, - 'n_fft': n_fft, - 'long_name': 'Power Spectral Density'}) + attrs={ + "units": units, + "n_fft": n_fft, + "long_name": "Power 
Spectral Density", + }, + ) diff --git a/mhkit/loads/__init__.py b/mhkit/loads/__init__.py index cd0ea3c22..4c21c7391 100644 --- a/mhkit/loads/__init__.py +++ b/mhkit/loads/__init__.py @@ -1,3 +1,12 @@ +""" +The `loads` package of the MHKiT (Marine and Hydrokinetic Toolkit) library +provides tools and functionalities for analyzing and visualizing loads data +from marine and hydrokinetic (MHK) devices. This package is designed to +assist engineers, researchers, and analysts in understanding the forces and +stresses applied to MHK devices under various operational and environmental +conditions. +""" + from mhkit.loads import general from mhkit.loads import graphics -from mhkit.loads import extreme \ No newline at end of file +from mhkit.loads import extreme diff --git a/mhkit/loads/extreme.py b/mhkit/loads/extreme.py deleted file mode 100644 index b282c0826..000000000 --- a/mhkit/loads/extreme.py +++ /dev/null @@ -1,757 +0,0 @@ -import numpy as np -import pandas as pd -from scipy import stats -from scipy import optimize -from mhkit.wave.resource import frequency_moment - - -def global_peaks(t, data): - """ - Find the global peaks of a zero-centered response time-series. - - The global peaks are the maxima between consecutive zero - up-crossings. - - Parameters - ---------- - t: np.array - Time array. - data: np.array - Response time-series. 
- - Returns - ------- - t_peaks: np.array - Time array for peaks - peaks: np.array - Peak values of the response time-series - """ - assert isinstance(t, np.ndarray), 't must be of type np.ndarray' - assert isinstance(data, np.ndarray), 'data must be of type np.ndarray' - - # eliminate zeros - zeroMask = (data == 0) - data[zeroMask] = 0.5 * np.min(np.abs(data)) - # zero up-crossings - diff = np.diff(np.sign(data)) - zeroUpCrossings_mask = (diff == 2) | (diff == 1) - zeroUpCrossings_index = np.where(zeroUpCrossings_mask)[0] - zeroUpCrossings_index = np.append(zeroUpCrossings_index, len(data) - 1) - # global peaks - npeaks = len(zeroUpCrossings_index) - peaks = np.array([]) - t_peaks = np.array([]) - for i in range(npeaks - 1): - peak_index = np.argmax( - data[zeroUpCrossings_index[i]:zeroUpCrossings_index[i + 1]]) - t_peaks = np.append(t_peaks, t[zeroUpCrossings_index[i] + peak_index]) - peaks = np.append(peaks, data[zeroUpCrossings_index[i] + peak_index]) - return t_peaks, peaks - - -def number_of_short_term_peaks(n, t, t_st): - """ - Estimate the number of peaks in a specified period. - - Parameters - ---------- - n : int - Number of peaks in analyzed timeseries. - t : float - Length of time of analyzed timeseries. - t_st: float - Short-term period for which to estimate the number of peaks. - - Returns - ------- - n_st : float - Number of peaks in short term period. - """ - assert isinstance(n, int), 'n must be of type int' - assert isinstance(t, float), 't must be of type float' - assert isinstance(t_st, float), 't_st must be of type float' - - return n * t_st / t - - -def peaks_distribution_weibull(x): - """ - Estimate the peaks distribution by fitting a Weibull - distribution to the peaks of the response. - - The fitted parameters can be accessed through the `params` field of - the returned distribution. - - Parameters - ---------- - x : np.array - Global peaks. - - Returns - ------- - peaks: scipy.stats.rv_frozen - Probability distribution of the peaks. 
- """ - assert isinstance(x, np.ndarray), 'x must be of type np.ndarray' - - # peaks distribution - peaks_params = stats.exponweib.fit(x, f0=1, floc=0) - param_names = ['a', 'c', 'loc', 'scale'] - peaks_params = {k: v for k, v in zip(param_names, peaks_params)} - peaks = stats.exponweib(**peaks_params) - # save the parameter info - peaks.params = peaks_params - return peaks - - -def peaks_distribution_weibull_tail_fit(x): - """ - Estimate the peaks distribution using the Weibull tail fit - method. - - The fitted parameters can be accessed through the `params` field of - the returned distribution. - - Parameters - ---------- - x : np.array - Global peaks. - - Returns - ------- - peaks: scipy.stats.rv_frozen - Probability distribution of the peaks. - """ - assert isinstance(x, np.ndarray), 'x must be of type np.ndarray' - - # Initial guess for Weibull parameters - p0 = stats.exponweib.fit(x, f0=1, floc=0) - p0 = np.array([p0[1], p0[3]]) - # Approximate CDF - x = np.sort(x) - npeaks = len(x) - F = np.zeros(npeaks) - for i in range(npeaks): - F[i] = i / (npeaks + 1.0) - # Divide into seven sets & fit Weibull - subset_shape_params = np.zeros(7) - subset_scale_params = np.zeros(7) - setLim = np.arange(0.60, 0.90, 0.05) - func = lambda x, c, s: stats.exponweib(a=1, c=c, loc=0, scale=s).cdf(x) - for set in range(7): - xset = x[(F > setLim[set])] - Fset = F[(F > setLim[set])] - popt, _ = optimize.curve_fit(func, xset, Fset, p0=p0) - subset_shape_params[set] = popt[0] - subset_scale_params[set] = popt[1] - # peaks distribution - peaks_params = [1, np.mean(subset_shape_params), 0, - np.mean(subset_scale_params)] - param_names = ['a', 'c', 'loc', 'scale'] - peaks_params = {k: v for k, v in zip(param_names, peaks_params)} - peaks = stats.exponweib(**peaks_params) - # save the parameter info - peaks.params = peaks_params - peaks.subset_shape_params = subset_shape_params - peaks.subset_scale_params = subset_scale_params - return peaks - - -def 
peaks_distribution_peaks_over_threshold(x, threshold=None): - """ - Estimate the peaks distribution using the peaks over threshold - method. - - This fits a generalized Pareto distribution to all the peaks above - the specified threshold. The distribution is only defined for values - above the threshold and therefore cannot be used to obtain integral - metrics such as the expected value. A typical choice of threshold is - 1.4 standard deviations above the mean. The peaks over threshold - distribution can be accessed through the `pot` field of the returned - peaks distribution. - - Parameters - ---------- - x : np.array - Global peaks. - threshold : float - Threshold value. Only peaks above this value will be used. - Default value calculated as: `np.mean(x) + 1.4 * np.std(x)` - - Returns - ------- - peaks: scipy.stats.rv_frozen - Probability distribution of the peaks. - """ - assert isinstance(x, np.ndarray), 'x must be of type np.ndarray' - if threshold is None: - threshold = np.mean(x) + 1.4 * np.std(x) - assert isinstance(threshold, float - ), 'threshold must be of type float' - - # peaks over threshold - x = np.sort(x) - pot = x[(x > threshold)] - threshold - npeaks = len(x) - npot = len(pot) - # Fit a generalized Pareto - pot_params = stats.genpareto.fit(pot, floc=0.) - param_names = ['c', 'loc', 'scale'] - pot_params = {k: v for k, v in zip(param_names, pot_params)} - pot = stats.genpareto(**pot_params) - # save the parameter info - pot.params = pot_params - - # peaks - class _Peaks(stats.rv_continuous): - - def __init__(self, *args, **kwargs): - self.pot = kwargs.pop('pot_distribution') - self.threshold = kwargs.pop('threshold') - super().__init__(*args, **kwargs) - - def _cdf(self, x): - x = np.atleast_1d(np.array(x)) - out = np.zeros(x.shape) - out[x < self.threshold] = np.NaN - xt = x[x >= self.threshold] - if xt.size != 0: - pot_ccdf = 1. - self.pot.cdf(xt-self.threshold) - prop_pot = npot/npeaks - out[x >= self.threshold] = 1. 
- (prop_pot * pot_ccdf) - return out - - peaks = _Peaks(name="peaks", pot_distribution=pot, threshold=threshold) - # save the peaks over threshold distribution - peaks.pot = pot - return peaks - - -def ste_peaks(peaks_distribution, npeaks): - """ - Estimate the short-term extreme distribution from the peaks - distribution. - - Parameters - ---------- - peaks_distribution: scipy.stats.rv_frozen - Probability distribution of the peaks. - npeaks : float - Number of peaks in short term period. - - Returns - ------- - ste: scipy.stats.rv_frozen - Short-term extreme distribution. - """ - assert callable(peaks_distribution.cdf - ), 'peaks_distribution must be a scipy.stat distribution.' - assert isinstance(npeaks, float), 'npeaks must be of type float' - - class _ShortTermExtreme(stats.rv_continuous): - - def __init__(self, *args, **kwargs): - self.peaks = kwargs.pop('peaks_distribution') - self.npeaks = kwargs.pop('npeaks') - super().__init__(*args, **kwargs) - - def _cdf(self, x): - peaks_cdf = np.array(self.peaks.cdf(x)) - peaks_cdf[np.isnan(peaks_cdf)] = 0.0 - if len(peaks_cdf) == 1: - peaks_cdf = peaks_cdf[0] - return peaks_cdf ** self.npeaks - - ste = _ShortTermExtreme(name="short_term_extreme", - peaks_distribution=peaks_distribution, - npeaks=npeaks) - return ste - - -def block_maxima(t, x, t_st): - """ - Find the block maxima of a time-series. - - The timeseries (t,x) is divided into blocks of length t_st, and the - maxima of each bloock is returned. - - Parameters - ---------- - t : np.array - Time array. - x : np.array - global peaks timeseries. - t_st : float - Short-term period. - - Returns - ------- - block_maxima: np.array - Block maxima (i.e. largest peak in each block). 
- """ - assert isinstance(t, np.ndarray), 't must be of type np.ndarray' - assert isinstance(x, np.ndarray), 'x must be of type np.ndarray' - assert isinstance(t_st, float), 't_st must be of type float' - - nblock = int(t[-1] / t_st) - block_maxima = np.zeros(int(nblock)) - for iblock in range(nblock): - ix = x[(t >= iblock * t_st) & (t < (iblock+1)*t_st)] - block_maxima[iblock] = np.max(ix) - return block_maxima - - -def ste_block_maxima_gev(block_maxima): - """ - Approximate the short-term extreme distribution using the block - maxima method and the Generalized Extreme Value distribution. - - Parameters - ---------- - block_maxima: np.array - Block maxima (i.e. largest peak in each block). - - Returns - ------- - ste: scipy.stats.rv_frozen - Short-term extreme distribution. - """ - assert isinstance( - block_maxima, np.ndarray), 'block_maxima must be of type np.ndarray' - - ste_params = stats.genextreme.fit(block_maxima) - param_names = ['c', 'loc', 'scale'] - ste_params = {k: v for k, v in zip(param_names, ste_params)} - ste = stats.genextreme(**ste_params) - ste.params = ste_params - return ste - - -def ste_block_maxima_gumbel(block_maxima): - """ - Approximate the short-term extreme distribution using the block - maxima method and the Gumbel (right) distribution. - - Parameters - ---------- - block_maxima: np.array - Block maxima (i.e. largest peak in each block). - - Returns - ------- - ste: scipy.stats.rv_frozen - Short-term extreme distribution. - """ - assert isinstance( - block_maxima, np.ndarray), 'block_maxima must be of type np.ndarray' - - ste_params = stats.gumbel_r.fit(block_maxima) - param_names = ['loc', 'scale'] - ste_params = {k: v for k, v in zip(param_names, ste_params)} - ste = stats.gumbel_r(**ste_params) - ste.params = ste_params - return ste - - -def ste(t, data, t_st, method): - """ - Alias for `short_term_extreme`. 
- """ - ste = short_term_extreme(t, data, t_st, method) - return ste - - -def short_term_extreme(t, data, t_st, method): - """ - Approximate the short-term extreme distribution from a - timeseries of the response using chosen method. - - The availabe methods are: 'peaks_weibull', 'peaks_weibull_tail_fit', - 'peaks_over_threshold', 'block_maxima_gev', and 'block_maxima_gumbel'. - For the block maxima methods the timeseries needs to be many times - longer than the short-term period. For the peak-fitting methods the - timeseries can be of arbitrary length. - - Parameters - ---------- - t: np.array - Time array. - data: np.array - Response timeseries. - t_st: float - Short-term period. - method : string - Method for estimating the short-term extreme distribution. - - Returns - ------- - ste: scipy.stats.rv_frozen - Short-term extreme distribution. - """ - assert isinstance(t, np.ndarray), 't must be of type np.ndarray' - assert isinstance(data, np.ndarray), 'x must be of type np.ndarray' - assert isinstance(t_st, float), 't_st must be of type float' - assert isinstance(method, str), 'method must be of type string' - - peaks_methods = { - 'peaks_weibull': peaks_distribution_weibull, - 'peaks_weibull_tail_fit': peaks_distribution_weibull_tail_fit, - 'peaks_over_threshold': peaks_distribution_peaks_over_threshold} - blockmaxima_methods = { - 'block_maxima_gev': ste_block_maxima_gev, - 'block_maxima_gumbel': ste_block_maxima_gumbel, - } - - if method in peaks_methods.keys(): - fit_peaks = peaks_methods[method] - _, peaks = global_peaks(t, data) - npeaks = len(peaks) - time = t[-1]-t[0] - nst = number_of_short_term_peaks(npeaks, time, t_st) - peaks_dist = fit_peaks(peaks) - ste = ste_peaks(peaks_dist, nst) - elif method in blockmaxima_methods.keys(): - fit_maxima = blockmaxima_methods[method] - maxima = block_maxima(t, data, t_st) - ste = fit_maxima(maxima) - else: - print("Passed `method` not found.") - return ste - - -def full_seastate_long_term_extreme(ste, weights): - 
""" - Return the long-term extreme distribution of a response of - interest using the full sea state approach. - - Parameters - ---------- - ste: list[scipy.stats.rv_frozen] - Short-term extreme distribution of the quantity of interest for - each sample sea state. - weights: list[floats] - The weights from the full sea state sampling - - Returns - ------- - ste: scipy.stats.rv_frozen - Short-term extreme distribution. - """ - assert isinstance( - ste, list), 'ste must be of type list[scipy.stats.rv_frozen]' - assert isinstance(weights, (list, np.ndarray) - ), 'weights must be of type list[floats]' - - class _LongTermExtreme(stats.rv_continuous): - - def __init__(self, *args, **kwargs): - weights = kwargs.pop('weights') - # make sure weights add to 1.0 - self.weights = weights / np.sum(weights) - self.ste = kwargs.pop('ste') - self.n = len(self.weights) - super().__init__(*args, **kwargs) - - def _cdf(self, x): - f = 0.0 - for w_i, ste_i in zip(self.weights, self.ste): - f += w_i * ste_i.cdf(x) - return f - - return _LongTermExtreme(name="long_term_extreme", weights=weights, ste=ste) - - -def mler_coefficients(rao, wave_spectrum, response_desired): - """ - Calculate MLER (most likely extreme response) coefficients from a - sea state spectrum and a response RAO. - - Parameters - ---------- - rao: numpy ndarray - Response amplitude operator. - wave_spectrum: pd.DataFrame - Wave spectral density [m^2/Hz] indexed by frequency [Hz]. - response_desired: int or float - Desired response, units should correspond to a motion RAO or - units of force for a force RAO. - - Returns - ------- - mler: pd.DataFrame - DataFrame containing conditioned wave spectral amplitude - coefficient [m^2-s], and Phase [rad] indexed by freq [Hz]. 
- """ - try: - rao = np.array(rao) - except: - pass - assert isinstance(rao, np.ndarray), 'rao must be of type np.ndarray' - assert isinstance(wave_spectrum, pd.DataFrame - ), 'wave_spectrum must be of type pd.DataFrame' - assert isinstance(response_desired, (int, float) - ), 'response_desired must be of type int or float' - - freq_hz = wave_spectrum.index.values - # convert from Hz to rad/s - freq = freq_hz * (2*np.pi) - # change from Hz to rad/s - wave_spectrum = wave_spectrum.iloc[:, 0].values / (2*np.pi) - # get delta - dw = (2*np.pi - 0.) / (len(freq)-1) - - spectrum_r = np.zeros(len(freq)) # [(response units)^2-s/rad] - _s = np.zeros(len(freq)) # [m^2-s/rad] - _a = np.zeros(len(freq)) # [m^2-s/rad] - _coeff_a_rn = np.zeros(len(freq)) # [1/(response units)] - _phase = np.zeros(len(freq)) - - # Note: waves.A is "S" in Quon2016; 'waves' naming convention - # matches WEC-Sim conventions (EWQ) - # Response spectrum [(response units)^2-s/rad] -- Quon2016 Eqn. 3 - spectrum_r[:] = np.abs(rao)**2 * (2*wave_spectrum) - - # calculate spectral moments and other important spectral values. - m0 = (frequency_moment(pd.Series(spectrum_r, index=freq), 0)).iloc[0, 0] - m1 = (frequency_moment(pd.Series(spectrum_r, index=freq), 1)).iloc[0, 0] - m2 = (frequency_moment(pd.Series(spectrum_r, index=freq), 2)).iloc[0, 0] - wBar = m1 / m0 - - # calculate coefficient A_{R,n} [(response units)^-1] -- Quon2016 Eqn. 8 - # Drummen version. Dietz has negative of this. 
- _coeff_a_rn[:] = np.abs(rao) * np.sqrt(2*wave_spectrum*dw) * \ - ((m2 - freq*m1) + wBar*(freq*m0 - m1)) / (m0*m2 - m1**2) - - # save the new spectral info to pass out - # Phase delay should be a positive number in this convention (AP) - _phase[:] = -np.unwrap(np.angle(rao)) - - # for negative values of Amp, shift phase by pi and flip sign - # for negative amplitudes, add a pi phase shift, then flip sign on - # negative Amplitudes - _phase[_coeff_a_rn < 0] -= np.pi - _coeff_a_rn[_coeff_a_rn < 0] *= -1 - - # calculate the conditioned spectrum [m^2-s/rad] - _s[:] = wave_spectrum * _coeff_a_rn[:]**2 * response_desired**2 - _a[:] = 2*wave_spectrum * _coeff_a_rn[:]**2 * \ - response_desired**2 - - # if the response amplitude we ask for is negative, we will add - # a pi phase shift to the phase information. This is because - # the sign of self.desiredRespAmp is lost in the squaring above. - # Ordinarily this would be put into the final equation, but we - # are shaping the wave information so that it is buried in the - # new spectral information, S. (AP) - if response_desired < 0: - _phase += np.pi - - mler = pd.DataFrame( - data={'WaveSpectrum': _s, 'Phase': _phase}, index=freq_hz) - mler = mler.fillna(0) - return mler - - -def mler_simulation(parameters=None): - """ - Define the simulation parameters that are used in various MLER - functionalities. - - See `extreme_response_contour_example.ipynb` example for how this is - useful. If no input is given, then default values are returned. - - Parameters - ---------- - parameters: dict (optional) - Simulation parameters. - Keys: - ----- - 'startTime': starting time [s] - 'endTime': ending time [s] - 'dT': time-step size [s] - 'T0': time of maximum event [s] - 'startx': start of simulation space [m] - 'endX': end of simulation space [m] - 'dX': horizontal spacing [m] - 'X': position of maximum event [m] - - Returns - ------- - sim: dict - Simulation parameters including spatial and time calculated - arrays. 
- """ - if not parameters == None: - assert isinstance(parameters, dict), 'parameters must be of type dict' - - sim = {} - - if parameters == None: - sim['startTime'] = -150.0 # [s] Starting time - sim['endTime'] = 150.0 # [s] Ending time - sim['dT'] = 1.0 # [s] Time-step size - sim['T0'] = 0.0 # [s] Time of maximum event - - sim['startX'] = -300.0 # [m] Start of simulation space - sim['endX'] = 300.0 # [m] End of simulation space - sim['dX'] = 1.0 # [m] Horiontal spacing - sim['X0'] = 0.0 # [m] Position of maximum event - else: - sim = parameters - - # maximum timestep index - sim['maxIT'] = int( - np.ceil((sim['endTime'] - sim['startTime'])/sim['dT'] + 1)) - sim['T'] = np.linspace(sim['startTime'], sim['endTime'], sim['maxIT']) - - sim['maxIX'] = int(np.ceil((sim['endX'] - sim['startX'])/sim['dX'] + 1)) - sim['X'] = np.linspace(sim['startX'], sim['endX'], sim['maxIX']) - - return sim - - -def mler_wave_amp_normalize(wave_amp, mler, sim, k): - """ - Function that renormalizes the incoming amplitude of the MLER wave - to the desired peak height (peak to MSL). - - Parameters - ---------- - wave_amp: float - Desired wave amplitude (peak to MSL). - mler: pd.DataFrame - MLER coefficients generated by 'mler_coefficients' function. - sim: dict - Simulation parameters formatted by output from - 'mler_simulation'. - k: numpy ndarray - Wave number. 
- - Returns - ------- - mler_norm : pd.DataFrame - MLER coefficients - """ - try: - k = np.array(k) - except: - pass - assert isinstance(mler, pd.DataFrame), 'mler must be of type pd.DataFrame' - assert isinstance(wave_amp, (int, float) - ), 'wave_amp must be of type int or float' - assert isinstance(sim, dict), 'sim must be of type dict' - assert isinstance(k, np.ndarray), 'k must be of type ndarray' - - freq = mler.index.values * 2*np.pi - dw = (max(freq) - min(freq)) / (len(freq)-1) # get delta - - wave_amp_time = np.zeros((sim['maxIX'], sim['maxIT'])) - for ix, x in enumerate(sim['X']): - for it, t in enumerate(sim['T']): - # conditioned wave - wave_amp_time[ix, it] = np.sum( - np.sqrt(2*mler['WaveSpectrum']*dw) * - np.cos(freq*(t-sim['T0']) - k*(x-sim['X0']) + mler['Phase']) - ) - - tmp_max_amp = np.max(np.abs(wave_amp_time)) - - # renormalization of wave amplitudes - rescale_fact = np.abs(wave_amp) / np.abs(tmp_max_amp) - # rescale the wave spectral amplitude coefficients - spectrum = mler['WaveSpectrum'] * rescale_fact**2 - - mler_norm = pd.DataFrame(index=mler.index) - mler_norm['WaveSpectrum'] = spectrum - mler_norm['Phase'] = mler['Phase'] - - return mler_norm - - -def mler_export_time_series(rao, mler, sim, k): - """ - Generate the wave amplitude time series at X0 from the calculated - MLER coefficients - - Parameters - ---------- - rao: numpy ndarray - Response amplitude operator. - mler: pd.DataFrame - MLER coefficients dataframe generated from an MLER function. - sim: dict - Simulation parameters formatted by output from - 'mler_simulation'. - k: numpy ndarray - Wave number. - - Returns - ------- - mler_ts: pd.DataFrame - Time series of wave height [m] and linear response [*] indexed - by time [s]. 
- - """ - try: - rao = np.array(rao) - except: - pass - try: - k = np.array(k) - except: - pass - assert isinstance(rao, np.ndarray), 'rao must be of type ndarray' - assert isinstance(mler, pd.DataFrame), 'mler must be of type pd.DataFrame' - assert isinstance(sim, dict), 'sim must be of type dict' - assert isinstance(k, np.ndarray), 'k must be of type ndarray' - - freq = mler.index.values * 2*np.pi # convert Hz to rad/s - dw = (max(freq) - min(freq)) / (len(freq)-1) # get delta - - # calculate the series - wave_amp_time = np.zeros((sim['maxIT'], 2)) - xi = sim['X0'] - for i, ti in enumerate(sim['T']): - # conditioned wave - wave_amp_time[i, 0] = np.sum( - np.sqrt(2*mler['WaveSpectrum']*dw) * - np.cos(freq*(ti-sim['T0']) + mler['Phase'] - k*(xi-sim['X0'])) - ) - # Response calculation - wave_amp_time[i, 1] = np.sum( - np.sqrt(2*mler['WaveSpectrum']*dw) * np.abs(rao) * - np.cos(freq*(ti-sim['T0']) - k*(xi-sim['X0'])) - ) - - mler_ts = pd.DataFrame(wave_amp_time, index=sim['T']) - mler_ts = mler_ts.rename(columns={0: 'WaveHeight', 1: 'LinearResponse'}) - - return mler_ts - - -def return_year_value(ppf, return_year, short_term_period_hr): - """ - Calculate the value from a given distribution corresponding to a particular - return year. - - Parameters - ---------- - ppf: callable function of 1 argument - Percentage Point Function (inverse CDF) of short term distribution. - return_year: int, float - Return period in years. - short_term_period_hr: int, float - Short term period the distribution is created from in hours. - - Returns - ------- - value: float - The value corresponding to the return period from the distribution. 
- """ - assert callable(ppf) - assert isinstance(return_year, (float, int)) - assert isinstance(short_term_period_hr, (float, int)) - - p = 1 / (return_year * 365.25 * 24 / short_term_period_hr) - - return ppf(1 - p) diff --git a/mhkit/loads/extreme/__init__.py b/mhkit/loads/extreme/__init__.py new file mode 100644 index 000000000..318a2cdc8 --- /dev/null +++ b/mhkit/loads/extreme/__init__.py @@ -0,0 +1,39 @@ +""" +This package provides tools and functions for extreme value analysis +and wave data statistics. + +It includes methods for calculating peaks over threshold, estimating +short-term extreme distributions,and performing wave amplitude +normalization for most likely extreme response analysis. +""" + +from mhkit.loads.extreme.extremes import ( + ste_peaks, + block_maxima, + ste_block_maxima_gev, + ste_block_maxima_gumbel, + ste, + short_term_extreme, + full_seastate_long_term_extreme, +) + +from mhkit.loads.extreme.mler import ( + mler_coefficients, + mler_simulation, + mler_wave_amp_normalize, + mler_export_time_series, +) + +from mhkit.loads.extreme.peaks import ( + _peaks_over_threshold, + global_peaks, + number_of_short_term_peaks, + peaks_distribution_weibull, + peaks_distribution_weibull_tail_fit, + automatic_hs_threshold, + peaks_distribution_peaks_over_threshold, +) + +from mhkit.loads.extreme.sample import ( + return_year_value, +) diff --git a/mhkit/loads/extreme/extremes.py b/mhkit/loads/extreme/extremes.py new file mode 100644 index 000000000..d89545c9d --- /dev/null +++ b/mhkit/loads/extreme/extremes.py @@ -0,0 +1,293 @@ +""" +This module provides functionality for estimating the short-term and +long-term extreme distributions of responses in a time series. It +includes methods for analyzing peaks, block maxima, and applying +statistical distributions to model extreme events. 
def ste_peaks(peaks_distribution: rv_continuous, npeaks: float) -> rv_continuous:
    """
    Estimate the short-term extreme distribution from the peaks
    distribution.

    The CDF of the returned distribution is the CDF of
    `peaks_distribution` raised to the power `npeaks`.

    Parameters
    ----------
    peaks_distribution: scipy.stats.rv_frozen
        Probability distribution of the peaks.
    npeaks : float
        Number of peaks in short term period.

    Returns
    -------
    short_term_extreme: scipy.stats.rv_continuous
        Short-term extreme distribution.

    Raises
    ------
    TypeError
        If `peaks_distribution` does not expose a callable `cdf`, or if
        `npeaks` is not of type float.
    """
    # getattr with a default: an object without `cdf` must raise the
    # documented TypeError instead of leaking an AttributeError.
    if not callable(getattr(peaks_distribution, "cdf", None)):
        raise TypeError("peaks_distribution must be a scipy.stats distribution.")
    if not isinstance(npeaks, float):
        raise TypeError(f"npeaks must be of type float. Got: {type(npeaks)}")

    class _ShortTermExtreme(stats.rv_continuous):
        """Continuous distribution whose CDF is `peaks.cdf(x) ** npeaks`."""

        def __init__(self, *args, **kwargs):
            # Pop the custom keywords before delegating to rv_continuous,
            # which does not accept them.
            self.peaks = kwargs.pop("peaks_distribution")
            self.npeaks = kwargs.pop("npeaks")
            super().__init__(*args, **kwargs)

        def _cdf(self, x, *args, **kwargs):
            # np.array makes a private copy; atleast_1d keeps the masking and
            # len() below valid even when a scalar is passed in directly.
            peaks_cdf = np.atleast_1d(np.array(self.peaks.cdf(x, *args, **kwargs)))
            # NaN values of the peaks CDF are treated as zero probability.
            peaks_cdf[np.isnan(peaks_cdf)] = 0.0
            if len(peaks_cdf) == 1:
                peaks_cdf = peaks_cdf[0]
            return peaks_cdf**self.npeaks

    short_term_extreme_peaks = _ShortTermExtreme(
        name="short_term_extreme", peaks_distribution=peaks_distribution, npeaks=npeaks
    )
    return short_term_extreme_peaks
def _fit_block_maxima(block_max, distribution, param_names):
    """Fit `distribution` to the block maxima and return it frozen at the fitted parameters."""
    if not isinstance(block_max, np.ndarray):
        raise TypeError(f"block_max must be of type np.ndarray. Got: {type(block_max)}")

    # `fit` returns the parameters positionally; name them so they can be
    # passed as keywords and exposed on the frozen distribution.
    ste_params = dict(zip(param_names, distribution.fit(block_max)))
    short_term_extreme_rv = distribution(**ste_params)
    short_term_extreme_rv.params = ste_params
    return short_term_extreme_rv


def ste_block_maxima_gev(block_max: np.ndarray) -> rv_continuous:
    """
    Approximate the short-term extreme distribution using the block
    maxima method and the Generalized Extreme Value distribution.

    Parameters
    ----------
    block_max: np.array
        Block maxima (i.e. largest peak in each block).

    Returns
    -------
    short_term_extreme_rv: scipy.stats.rv_frozen
        Short-term extreme distribution. The fitted parameters are
        attached as the dict attribute `params` with keys 'c', 'loc'
        and 'scale'.

    Raises
    ------
    TypeError
        If `block_max` is not a np.ndarray.
    """
    return _fit_block_maxima(block_max, stats.genextreme, ["c", "loc", "scale"])


def ste_block_maxima_gumbel(block_max: np.ndarray) -> rv_continuous:
    """
    Approximate the short-term extreme distribution using the block
    maxima method and the Gumbel (right) distribution.

    Parameters
    ----------
    block_max: np.array
        Block maxima (i.e. largest peak in each block).

    Returns
    -------
    short_term_extreme_rv: scipy.stats.rv_frozen
        Short-term extreme distribution. The fitted parameters are
        attached as the dict attribute `params` with keys 'loc' and
        'scale'.

    Raises
    ------
    TypeError
        If `block_max` is not a np.ndarray.
    """
    return _fit_block_maxima(block_max, stats.gumbel_r, ["loc", "scale"])
def short_term_extreme(
    time: np.ndarray, data: np.ndarray, t_st: float, method: str
) -> Union[rv_continuous, None]:
    """
    Approximate the short-term extreme distribution from a
    timeseries of the response using chosen method.

    The available methods are: 'peaks_weibull', 'peaks_weibull_tail_fit',
    'peaks_over_threshold', 'block_maxima_gev', and 'block_maxima_gumbel'.
    For the block maxima methods the timeseries needs to be many times
    longer than the short-term period. For the peak-fitting methods the
    timeseries can be of arbitrary length.

    Parameters
    ----------
    time: np.array
        Time array.
    data: np.array
        Response timeseries.
    t_st: float
        Short-term period.
    method : string
        Method for estimating the short-term extreme distribution.

    Returns
    -------
    short_term_extreme_dist: scipy.stats.rv_frozen
        Short-term extreme distribution.

    Raises
    ------
    TypeError
        If any argument is not of the documented type.
    ValueError
        If `method` is not one of the available methods.
    """
    if not isinstance(time, np.ndarray):
        raise TypeError(f"time must be of type np.ndarray. Got: {type(time)}")
    if not isinstance(data, np.ndarray):
        raise TypeError(f"data must be of type np.ndarray. Got: {type(data)}")
    if not isinstance(t_st, float):
        raise TypeError(f"t_st must be of type float. Got: {type(t_st)}")
    if not isinstance(method, str):
        raise TypeError(f"method must be of type string. Got: {type(method)}")

    peaks_methods = {
        "peaks_weibull": peaks_distributions.peaks_distribution_weibull,
        "peaks_weibull_tail_fit": peaks_distributions.peaks_distribution_weibull_tail_fit,
        "peaks_over_threshold": peaks_distributions.peaks_distribution_peaks_over_threshold,
    }
    blockmaxima_methods = {
        "block_maxima_gev": ste_block_maxima_gev,
        "block_maxima_gumbel": ste_block_maxima_gumbel,
    }

    if method in peaks_methods:
        fit_peaks = peaks_methods[method]
        _, peaks = peaks_distributions.global_peaks(time, data)
        npeaks = len(peaks)
        # Keep the `time` array intact; the record length gets its own name.
        duration = time[-1] - time[0]
        nst = peaks_distributions.number_of_short_term_peaks(npeaks, duration, t_st)
        peaks_dist = fit_peaks(peaks)
        return ste_peaks(peaks_dist, nst)

    if method in blockmaxima_methods:
        fit_maxima = blockmaxima_methods[method]
        maxima = block_maxima(time, data, t_st)
        return fit_maxima(maxima)

    # Previously this path printed a message and then failed with an
    # UnboundLocalError on the return statement; fail explicitly instead.
    valid_methods = sorted(list(peaks_methods) + list(blockmaxima_methods))
    raise ValueError(
        f"Passed `method` not found. Got: {method!r}. "
        f"Valid methods are: {valid_methods}"
    )
Got: {type(weights)}" + ) + + class _LongTermExtreme(stats.rv_continuous): + def __init__(self, *args, **kwargs): + weights = kwargs.pop("weights") + # make sure weights add to 1.0 + self.weights = weights / np.sum(weights) + self.ste = kwargs.pop("ste") + # Disabled bc not sure where/ how n is applied + self.n = len(self.weights) # pylint: disable=invalid-name + super().__init__(*args, **kwargs) + + def _cdf(self, x, *args, **kwargs): + weighted_cdf = 0.0 + for w_i, ste_i in zip(self.weights, self.ste): + weighted_cdf += w_i * ste_i.cdf(x, *args, **kwargs) + return weighted_cdf + + return _LongTermExtreme( + name="long_term_extreme", weights=weights, ste=short_term_extreme_dist + ) diff --git a/mhkit/loads/extreme/mler.py b/mhkit/loads/extreme/mler.py new file mode 100644 index 000000000..2922fc3b9 --- /dev/null +++ b/mhkit/loads/extreme/mler.py @@ -0,0 +1,458 @@ +""" +This module provides functionalities to calculate and analyze Most +Likely Extreme Response (MLER) coefficients for wave energy converter +design and risk assessment. It includes functions to: + + - Calculate MLER coefficients (`mler_coefficients`) from a sea state + spectrum and a response Amplitude Response Operator (ARO). + - Define and manipulate simulation parameters (`mler_simulation`) used + across various MLER analyses. + - Renormalize the incoming amplitude of the MLER wave + (`mler_wave_amp_normalize`) to match the desired peak height for more + accurate modeling and analysis. + - Export the wave amplitude time series (`mler_export_time_series`) + based on the calculated MLER coefficients for further analysis or + visualization. 
+""" + +from typing import Union, List, Optional, Dict, Any + +import pandas as pd +import xarray as xr +import numpy as np +from numpy.typing import NDArray + +from mhkit.wave.resource import frequency_moment + +SimulationParameters = Dict[str, Union[float, int, np.ndarray]] + + +def _calculate_spectral_values( + freq_hz: Union[np.ndarray, pd.Series], + rao_array: np.ndarray, + wave_spectrum: Union[pd.Series, pd.DataFrame, np.ndarray], + d_w: float, +) -> Dict[str, Union[float, np.ndarray]]: + """ + Calculates spectral moments and the coefficient A_{R,n} from a given sea state spectrum + and a response RAO. + + Parameters + ---------- + spectrum_r : Union[np.ndarray, pd.Series] + Real part of the spectrum. + freq_hz : Union[np.ndarray, pd.Series] + Frequencies in Hz corresponding to spectrum_r. + rao : numpy ndarray + Response Amplitude Operator (RAO) of the system. + wave_spectrum : Union[pd.Series, pd.DataFrame, np.ndarray] + Wave spectrum values corresponding to freq_hz. + d_w : float + Delta omega, the frequency interval. + + Returns + ------- + Dict[str, Union[float, np.ndarray]] + A dictionary containing spectral moments (m_0, m_1, m_2) and the coefficient A_{R,n}. + """ + # Note: waves.A is "S" in Quon2016; 'waves' naming convention + # matches WEC-Sim conventions (EWQ) + # Response spectrum [(response units)^2-s/rad] -- Quon2016 Eqn. 
def mler_coefficients(
    rao: Union[NDArray[np.float64], pd.Series, List[float], List[int], xr.DataArray],
    wave_spectrum: Union[pd.Series, pd.DataFrame, xr.DataArray, xr.Dataset],
    response_desired: Union[int, float],
    frequency_dimension: str = "",
    to_pandas: bool = True,
) -> Union[pd.DataFrame, xr.Dataset]:
    """
    Calculate MLER (most likely extreme response) coefficients from a
    sea state spectrum and a response RAO.

    Parameters
    ----------
    rao: numpy ndarray, list, pandas Series, or xarray DataArray
        Response amplitude operator.
    wave_spectrum: pandas Series, pandas DataFrame, xarray DataArray, or xarray Dataset
        Wave spectral density [m^2/Hz] indexed by frequency [Hz].
        DataFrame and Dataset inputs should only have one data variable
    response_desired: int or float
        Desired response, units should correspond to a motion RAO or
        units of force for a force RAO.
    frequency_dimension: string (optional)
        Name of the xarray dimension corresponding to frequency. If not supplied,
        defaults to the first dimension. Does not affect pandas input.
    to_pandas: bool (optional)
        Flag to output pandas instead of xarray. Default = True.

    Returns
    -------
    mler: pandas DataFrame or xarray Dataset
        DataFrame containing conditioned wave spectral amplitude
        coefficient [m^2-s], and Phase [rad] indexed by freq [Hz].

    Raises
    ------
    TypeError
        If an argument is not of a supported type.
    ValueError
        If a DataFrame/Dataset `wave_spectrum` does not hold exactly one
        data variable.
    """
    if isinstance(rao, np.ndarray):
        rao_array = rao
    elif isinstance(rao, (list, pd.Series, xr.DataArray)):
        rao_array = np.array(rao)
    else:
        raise TypeError(
            "Unsupported type for 'rao'. Must be one of: list, pd.Series, "
            f"np.ndarray, xr.DataArray. Got: {type(rao)}"
        )

    if not isinstance(
        wave_spectrum, (pd.Series, pd.DataFrame, xr.DataArray, xr.Dataset)
    ):
        raise TypeError(
            f"wave_spectrum must be of type pd.Series, pd.DataFrame, "
            f"xr.DataArray, or xr.Dataset. Got: {type(wave_spectrum)}"
        )
    if not isinstance(response_desired, (int, float)):
        raise TypeError(
            f"response_desired must be of type int or float. Got: {type(response_desired)}"
        )
    if not isinstance(frequency_dimension, str):
        raise TypeError(
            f"frequency_dimension must be of type str. Got: {type(frequency_dimension)}"
        )
    if not isinstance(to_pandas, bool):
        raise TypeError(f"to_pandas must be of type bool. Got: {type(to_pandas)}")

    # Convert pandas input to xarray. A single-column DataFrame squeezes to a
    # Series (-> DataArray); a multi-column one becomes a Dataset and is
    # rejected below.
    if isinstance(wave_spectrum, (pd.Series, pd.DataFrame)):
        wave_spectrum = wave_spectrum.squeeze().to_xarray()

    if isinstance(wave_spectrum, xr.Dataset):
        data_vars = list(wave_spectrum.data_vars)
        if len(data_vars) != 1:
            raise ValueError(
                f"wave_spectrum can only contain one variable. Got {data_vars}."
            )
        # Select the variable itself: Dataset.to_array() would prepend a
        # "variable" dimension and make every array below two-dimensional.
        wave_spectrum = wave_spectrum[data_vars[0]]

    if frequency_dimension == "":
        frequency_dimension = wave_spectrum.dims[0]

    # Keep the Hz values for the output coordinate; the math is in rad/s.
    freq_hz = wave_spectrum.coords[frequency_dimension].values
    freq = freq_hz * (2 * np.pi)
    # change spectral density from per-Hz to per-rad/s
    spectrum = wave_spectrum.to_numpy() / (2 * np.pi)

    # get frequency step
    # NOTE(review): the step is 2*pi/(N-1) regardless of the actual frequency
    # range of the input; kept as in the original implementation -- confirm.
    d_w = 2.0 * np.pi / (len(freq) - 1)

    spectral_values = _calculate_spectral_values(freq, rao_array, spectrum, d_w)
    coeff_a_rn = spectral_values["coeff_a_rn"]

    # save the new spectral info to pass out
    # Phase delay should be a positive number in this convention (AP)
    phase = -np.unwrap(np.angle(rao_array))

    # for negative amplitudes, add a pi phase shift, then flip the sign of
    # the amplitude
    negative = coeff_a_rn < 0
    phase[negative] -= np.pi
    coeff_a_rn[negative] *= -1

    # calculate the conditioned spectrum [m^2-s/rad]
    conditioned_spectrum = spectrum * coeff_a_rn**2 * response_desired**2

    # if the response amplitude we ask for is negative, we will add
    # a pi phase shift to the phase information. This is because
    # the sign of the desired response is lost in the squaring above.
    # The shift is applied exactly once: applying it twice would add 2*pi
    # and discard the sign again.
    if response_desired < 0:
        phase += np.pi

    mler = xr.Dataset(
        {
            "WaveSpectrum": (["frequency"], np.array(conditioned_spectrum)),
            "Phase": (["frequency"], phase),
        },
        coords={"frequency": freq_hz},
    )
    # fillna returns a new object; the result must be kept.
    mler = mler.fillna(0)

    return mler.to_pandas() if to_pandas else mler
def mler_wave_amp_normalize(
    wave_amp: float,
    mler: Union[pd.DataFrame, xr.Dataset],
    sim: SimulationParameters,
    k: Union[NDArray[np.float64], List[float], pd.Series],
    **kwargs: Any,
) -> Union[pd.DataFrame, xr.Dataset]:
    """
    Renormalize the MLER wave so that its largest absolute elevation over
    the simulated space/time grid equals the desired peak height
    (peak to MSL).

    Parameters
    ----------
    wave_amp: float
        Desired wave amplitude (peak to MSL). Only its absolute value is used.
    mler: pandas DataFrame or xarray Dataset
        MLER coefficients generated by 'mler_coefficients' function. Must
        provide the variables 'WaveSpectrum' and 'Phase'.
    sim: dict
        Simulation parameters formatted by output from
        'mler_simulation'. The keys 'startX', 'endX', 'maxIX', 'X0',
        'startTime', 'endTime', 'maxIT' and 'T0' are read.
    k: numpy ndarray
        Wave number, one value per frequency.
    frequency_dimension: string (optional)
        Name of the xarray dimension corresponding to frequency. If not supplied,
        defaults to the first dimension. Does not affect pandas input.
    to_pandas: bool (optional)
        Flag to output pandas instead of xarray. Default = True.

    Returns
    -------
    mler_norm : pandas DataFrame or xarray Dataset
        MLER coefficients with the rescaled 'WaveSpectrum' and the
        unchanged 'Phase', indexed by 'frequency'.

    Raises
    ------
    TypeError
        If mler, wave_amp, sim, frequency_dimension or to_pandas have an
        unsupported type.
    """
    frequency_dimension = kwargs.get("frequency_dimension", "")
    to_pandas = kwargs.get("to_pandas", True)

    k_array = np.array(k, dtype=float) if not isinstance(k, np.ndarray) else k

    if not isinstance(mler, (pd.DataFrame, xr.Dataset)):
        raise TypeError(
            f"mler must be of type pd.DataFrame or xr.Dataset. Got: {type(mler)}"
        )
    if not isinstance(wave_amp, (int, float)):
        raise TypeError(f"wave_amp must be of type int or float. Got: {type(wave_amp)}")
    if not isinstance(sim, dict):
        raise TypeError(f"sim must be of type dict. Got: {type(sim)}")
    if not isinstance(frequency_dimension, str):
        raise TypeError(
            "frequency_dimension must be of type str. "
            + f"Got: {type(frequency_dimension)}"
        )
    if not isinstance(to_pandas, bool):
        raise TypeError(f"to_pandas must be of type bool. Got: {type(to_pandas)}")

    # If input is pandas, convert to xarray. A Dataset is used as-is
    # (it is not callable).
    mler_xr = mler.to_xarray() if isinstance(mler, pd.DataFrame) else mler

    # Determine frequency dimension
    freq_dim = frequency_dimension or list(mler_xr.coords)[0]

    # Quantities that do not depend on (x, t) are computed once.
    freq = mler_xr.coords[freq_dim].values * 2 * np.pi  # [rad/s]
    d_w = np.diff(freq).mean()
    component_amplitude = np.sqrt(2 * mler_xr["WaveSpectrum"].values * d_w)
    phase = mler_xr["Phase"].values

    x_positions = np.linspace(sim["startX"], sim["endX"], sim["maxIX"])
    times = np.linspace(sim["startTime"], sim["endTime"], sim["maxIT"])

    # Wave elevation on the full (space, time) grid
    wave_amp_time = np.zeros((sim["maxIX"], sim["maxIT"]))
    for i_x, x_i in enumerate(x_positions):
        spatial_phase = k_array * (x_i - sim["X0"])
        for i_t, t_i in enumerate(times):
            wave_amp_time[i_x, i_t] = np.sum(
                component_amplitude
                * np.cos(freq * (t_i - sim["T0"]) - spatial_phase + phase)
            )

    rescale_fact = np.abs(wave_amp) / np.max(np.abs(wave_amp_time))

    # Rescale the wave spectral amplitude coefficients and assign phase.
    # The spectrum scales with the square of the amplitude factor.
    mler_norm = xr.Dataset(
        {
            "WaveSpectrum": (
                ["frequency"],
                mler_xr["WaveSpectrum"].data * rescale_fact**2,
            ),
            "Phase": (["frequency"], mler_xr["Phase"].data),
        },
        coords={"frequency": (["frequency"], mler_xr.coords[freq_dim].data)},
    )
    return mler_norm.to_pandas() if to_pandas else mler_norm
+ frequency_dimension: string (optional) + Name of the xarray dimension corresponding to frequency. If not supplied, + defaults to the first dimension. Does not affect pandas input. + to_pandas: bool (optional) + Flag to output pandas instead of xarray. Default = True. + + Returns + ------- + mler_ts: pandas DataFrame or xarray Dataset + Time series of wave height [m] and linear response [*] indexed + by time [s]. + + """ + frequency_dimension = kwargs.get("frequency_dimension", "") + to_pandas = kwargs.get("to_pandas", True) + + if not isinstance(rao, np.ndarray): + raise TypeError(f"rao must be of type ndarray. Got: {type(rao)}") + if not isinstance(mler, (pd.DataFrame, xr.Dataset)): + raise TypeError( + f"mler must be of type pd.DataFrame or xr.Dataset. Got: {type(mler)}" + ) + if not isinstance(sim, dict): + raise TypeError(f"sim must be of type dict. Got: {type(sim)}") + if not isinstance(k, (np.ndarray, list, pd.Series)): + raise TypeError(f"k must be of type ndarray. Got: {type(k)}") + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. Got: {type(to_pandas)}") + if not isinstance(frequency_dimension, str): + raise TypeError( + f"frequency_dimension must be of type str. 
Got: {type(frequency_dimension)}" + ) + + rao = np.array(rao, dtype=float) if not isinstance(rao, np.ndarray) else rao + k = np.array(k, dtype=float) if not isinstance(k, np.ndarray) else k + # If input is pandas, convert to xarray + mler = mler if isinstance(mler, xr.Dataset) else mler.to_xarray() + + # Handle optional frequency dimension + frequency_dimension = ( + frequency_dimension if frequency_dimension else list(mler.coords)[0] + ) + freq = mler.coords[frequency_dimension].values * 2 * np.pi + d_w = np.diff(freq).mean() + + wave_height = np.zeros(len(sim["T"])) + linear_response = np.zeros(len(sim["T"])) + for i, t_i in enumerate(sim["T"]): + cos_terms = np.cos( + freq * (t_i - sim["T0"]) + - k * (sim["X0"] - sim["X0"]) + + mler["Phase"].values + ) + wave_height[i] = np.sum(np.sqrt(2 * mler["WaveSpectrum"] * d_w) * cos_terms) + + linear_response[i] = np.sum( + np.sqrt(2 * mler["WaveSpectrum"] * d_w) + * np.abs(rao) + * np.cos(freq * (t_i - sim["T0"]) - k * (sim["X0"] - sim["X0"])) + ) + + # Construct the output dataset + mler_ts = xr.Dataset( + { + "WaveHeight": (["time"], wave_height), + "LinearResponse": (["time"], linear_response), + }, + coords={"time": sim["T"]}, + ) + + # Convert to pandas DataFrame if requested + return mler_ts.to_dataframe() if to_pandas else mler_ts diff --git a/mhkit/loads/extreme/peaks.py b/mhkit/loads/extreme/peaks.py new file mode 100644 index 000000000..3f588237a --- /dev/null +++ b/mhkit/loads/extreme/peaks.py @@ -0,0 +1,481 @@ +""" +This module provides utilities for analyzing wave data, specifically +for identifying significant wave heights and estimating wave peak +distributions using statistical methods. + +Functions: +- _calculate_window_size: Calculates the window size for peak + independence using the auto-correlation function of wave peaks. +- _peaks_over_threshold: Identifies peaks over a specified + threshold and returns independent storm peak values adjusted by + the threshold. 
+- global_peaks: Identifies global peaks in a zero-centered + response time-series based on consecutive zero up-crossings. +- number_of_short_term_peaks: Estimates the number of peaks within a + specified short-term period. +- peaks_distribution_weibull: Estimates the peaks distribution by + fitting a Weibull distribution to the peaks of the response. +- peaks_distribution_weibull_tail_fit: Estimates the peaks distribution + using the Weibull tail fit method. +- automatic_hs_threshold: Determines the best significant wave height + threshold for the peaks-over-threshold method. +- peaks_distribution_peaks_over_threshold: Estimates the peaks + distribution using the peaks over threshold method by fitting a + generalized Pareto distribution. + +References: +- Neary, V. S., S. Ahn, B. E. Seng, M. N. Allahdadi, T. Wang, Z. Yang, + and R. He (2020). "Characterization of Extreme Wave Conditions for + Wave Energy Converter Design and Project Risk Assessment.” J. Mar. + Sci. Eng. 2020, 8(4), 289; https://doi.org/10.3390/jmse8040289. + +""" + +from typing import List, Tuple, Optional + +import numpy as np +from numpy.typing import NDArray +from scipy import stats, optimize, signal +from scipy.stats import rv_continuous + +from mhkit.utils import upcrossing + + +def _calculate_window_size(peaks: NDArray[np.float64], sampling_rate: float) -> float: + """ + Calculate the window size for independence based on the auto-correlation function. + + Parameters + ---------- + peaks : np.ndarray + A NumPy array of peak values from a time series. + sampling_rate : float + The sampling rate of the time series in Hz (samples per second). + + Returns + ------- + float + The window size determined by the auto-correlation function. 
def _peaks_over_threshold(
    peaks: NDArray[np.float64], threshold: float, sampling_rate: float
) -> List[float]:
    """
    Identify independent storm peaks that exceed a percentile threshold.

    The percentile threshold is converted to a value in the units of
    `peaks`, the global peaks of the threshold-shifted series are found,
    and peaks closer together than the auto-correlation window are merged
    by keeping only the largest one.

    Parameters
    ----------
    peaks : np.ndarray
        A NumPy array of peak values from a time series.
    threshold : float
        The percentile threshold (0-1) to identify significant peaks.
        For example, 0.95 for the 95th percentile.
    sampling_rate : float
        Passed unchanged to `_calculate_window_size`.
        NOTE(review): `automatic_hs_threshold` documents this value as the
        sampling interval in hours, not a rate in Hz - confirm.

    Returns
    -------
    List[float]
        Independent storm peak values with the threshold value subtracted
        (i.e. exceedances over the threshold). Empty if no storm peak is
        found.

    Notes
    -----
    Relies on `global_peaks` to locate maxima between consecutive zero
    up-crossings and on `_calculate_window_size` for the independence
    window.
    """
    threshold_unit = np.percentile(peaks, 100 * threshold, method="hazen")
    idx_peaks = np.arange(len(peaks))
    idx_storm_peaks, storm_peaks = global_peaks(idx_peaks, peaks - threshold_unit)
    idx_storm_peaks = idx_storm_peaks.astype(int)

    # Nothing to separate when no storm peak was detected.
    if len(storm_peaks) == 0:
        return []

    independent_storm_peaks = [storm_peaks[0]]
    idx_independent_storm_peaks = [idx_storm_peaks[0]]

    window = _calculate_window_size(peaks, sampling_rate)

    for idx in idx_storm_peaks[1:]:
        # Stored values are exceedances, so compare exceedance with
        # exceedance (not the raw peak with an exceedance).
        exceedance = peaks[idx] - threshold_unit
        if (idx - idx_independent_storm_peaks[-1]) > window:
            # Far enough from the previous storm: start a new one.
            idx_independent_storm_peaks.append(idx)
            independent_storm_peaks.append(exceedance)
        elif exceedance > independent_storm_peaks[-1]:
            # Same storm, larger peak: keep the larger one.
            idx_independent_storm_peaks[-1] = idx
            independent_storm_peaks[-1] = exceedance

    return independent_storm_peaks
def number_of_short_term_peaks(n_peaks: int, time: float, time_st: float) -> float:
    """
    Estimate the number of peaks in a specified period.

    The peak count is scaled linearly by the ratio of the short-term
    period to the analyzed duration.

    Parameters
    ----------
    n_peaks : int
        Number of peaks in analyzed timeseries.
    time : float or int
        Length of time of analyzed timeseries.
    time_st: float or int
        Short-term period for which to estimate the number of peaks.
        Must be in the same units as `time`.

    Returns
    -------
    n_st : float
        Number of peaks in short term period.

    Raises
    ------
    TypeError
        If n_peaks is not an int, or time / time_st are not float or int.
    """
    if not isinstance(n_peaks, int):
        raise TypeError(f"n_peaks must be of type int. Got: {type(n_peaks)}")
    # Whole-number durations (e.g. 3600) are valid; accept int as the
    # other validators in this package do.
    if not isinstance(time, (float, int)):
        raise TypeError(f"time must be of type float or int. Got: {type(time)}")
    if not isinstance(time_st, (float, int)):
        raise TypeError(f"time_st must be of type float or int. Got: {type(time_st)}")

    return n_peaks * time_st / time
# pylint: disable=R0914
def peaks_distribution_weibull_tail_fit(
    peaks_data: NDArray[np.float64],
) -> rv_continuous:
    """
    Estimate the peaks distribution using the Weibull tail fit
    method.

    A two-parameter Weibull CDF is fitted to seven upper-tail subsets of
    the empirical CDF (lower limits 0.60, 0.65, ..., 0.90) and the
    resulting shape and scale parameters are averaged.

    The fitted parameters can be accessed through the `params` field of
    the returned distribution. The per-subset parameters are available
    as `subset_shape_params` and `subset_scale_params`.

    Parameters
    ----------
    peaks_data : np.array
        Global peaks.

    Returns
    -------
    peaks: scipy.stats.rv_frozen
        Probability distribution of the peaks.

    Raises
    ------
    TypeError
        If peaks_data is not a numpy array.
    """
    if not isinstance(peaks_data, np.ndarray):
        raise TypeError(
            f"peaks_data must be of type np.ndarray. Got: {type(peaks_data)}"
        )

    # Initial guess for Weibull parameters (shape c, scale) from a full fit
    p_0 = stats.exponweib.fit(peaks_data, f0=1, floc=0)
    p_0 = np.array([p_0[1], p_0[3]])

    # Approximate (empirical) CDF of the sorted peaks: i / (n + 1)
    peaks_data = np.sort(peaks_data)
    n_peaks = len(peaks_data)
    cdf_positions = np.arange(n_peaks) / (n_peaks + 1.0)

    # Lower CDF limits of the seven tail subsets. linspace fixes the
    # number of limits; a float-step arange only includes 0.90 through
    # rounding.
    set_lim = np.linspace(0.60, 0.90, 7)
    subset_shape_params = np.zeros(len(set_lim))
    subset_scale_params = np.zeros(len(set_lim))

    def weibull_cdf(data_points, shape, scale):
        return stats.exponweib(a=1, c=shape, loc=0, scale=scale).cdf(data_points)

    for local_set, lower_limit in enumerate(set_lim):
        in_tail = cdf_positions > lower_limit
        # pylint: disable=W0632
        p_opt, _ = optimize.curve_fit(
            weibull_cdf, peaks_data[in_tail], cdf_positions[in_tail], p0=p_0
        )
        subset_shape_params[local_set] = p_opt[0]
        subset_scale_params[local_set] = p_opt[1]

    # peaks distribution: average of the subset fits
    peaks_params = [1, np.mean(subset_shape_params), 0, np.mean(subset_scale_params)]
    param_names = ["a", "c", "loc", "scale"]
    peaks_params = dict(zip(param_names, peaks_params))
    peaks = stats.exponweib(**peaks_params)
    # save the parameter info
    peaks.params = peaks_params
    peaks.subset_shape_params = subset_shape_params
    peaks.subset_scale_params = subset_scale_params
    return peaks
def peaks_distribution_peaks_over_threshold(
    peaks_data: NDArray[np.float64], threshold: Optional[float] = None
) -> rv_continuous:
    """
    Estimate the peaks distribution using the peaks over threshold
    method.

    This fits a generalized Pareto distribution to all the peaks above
    the specified threshold. The distribution is only defined for values
    above the threshold and therefore cannot be used to obtain integral
    metrics such as the expected value. A typical choice of threshold is
    1.4 standard deviations above the mean. The peaks over threshold
    distribution can be accessed through the `pot` field of the returned
    peaks distribution.

    Parameters
    ----------
    peaks_data : NDArray[np.float64]
        Global peaks.
    threshold : Optional[float]
        Threshold value. Only peaks above this value will be used.
        Default value calculated as: `np.mean(x) + 1.4 * np.std(x)`

    Returns
    -------
    peaks: rv_continuous
        Probability distribution of the peaks. Its CDF is NaN below the
        threshold.

    Raises
    ------
    TypeError
        If peaks_data is not a numpy array or a supplied threshold is not
        a float.
    """
    if not isinstance(peaks_data, np.ndarray):
        raise TypeError(
            f"peaks_data must be of type np.ndarray. Got: {type(peaks_data)}"
        )
    if threshold is None:
        threshold = np.mean(peaks_data) + 1.4 * np.std(peaks_data)
    elif not isinstance(threshold, float):
        raise TypeError(
            f"If specified, threshold must be of type float. Got: {type(threshold)}"
        )

    # peaks over threshold (exceedances)
    peaks_data = np.sort(peaks_data)
    pot = peaks_data[peaks_data > threshold] - threshold
    npeaks = len(peaks_data)
    npot = len(pot)
    # Fraction of all peaks that exceed the threshold
    prop_pot = npot / npeaks

    # Fit a generalized Pareto
    pot_params = stats.genpareto.fit(pot, floc=0.0)
    param_names = ["c", "loc", "scale"]
    pot_params = dict(zip(param_names, pot_params))
    pot = stats.genpareto(**pot_params)
    # save the parameter info
    pot.params = pot_params

    # peaks
    class _Peaks(rv_continuous):
        def __init__(
            self, pot_distribution: rv_continuous, threshold: float, *args, **kwargs
        ):
            self.pot = pot_distribution
            self.threshold = threshold
            super().__init__(*args, **kwargs)

        # pylint: disable=arguments-differ
        def _cdf(self, data_points, *args, **kwds) -> NDArray[np.float64]:
            # Always work on a float array so NaN can be stored.
            data_points = np.atleast_1d(data_points)
            out = np.zeros_like(data_points, dtype=float)

            # The distribution is undefined below the threshold.
            below_threshold = data_points < self.threshold
            out[below_threshold] = np.nan

            above_threshold_indices = ~below_threshold
            if np.any(above_threshold_indices):
                points_above_threshold = data_points[above_threshold_indices]
                pot_ccdf = 1.0 - self.pot.cdf(
                    points_above_threshold - self.threshold, *args, **kwds
                )
                # Scale the exceedance probability by the fraction of
                # peaks that are over the threshold.
                out[above_threshold_indices] = 1.0 - (prop_pot * pot_ccdf)
            return out

    peaks = _Peaks(name="peaks", pot_distribution=pot, threshold=threshold)
    peaks.pot = pot
    return peaks
def return_year_value(
    ppf: Callable[[float], float], return_year: float, short_term_period_hr: float
) -> float:
    """
    Evaluate a short-term distribution at the probability level that
    corresponds to a given return period.

    Parameters
    ----------
    ppf: callable function of 1 argument
        Percentage Point Function (inverse CDF) of short term distribution.
    return_year: int, float
        Return period in years.
    short_term_period_hr: int, float
        Short term period the distribution is created from in hours.

    Returns
    -------
    value: float
        The value corresponding to the return period from the distribution.
    """
    if not callable(ppf):
        raise TypeError("ppf must be a callable Percentage Point Function")

    numeric_arguments = (
        ("return_year", return_year),
        ("short_term_period_hr", short_term_period_hr),
    )
    for label, value in numeric_arguments:
        if not isinstance(value, (float, int)):
            raise TypeError(
                f"{label} must be of type float or int. Got: {type(value)}"
            )

    # Number of short-term periods contained in the return period
    # (365.25 days per year, 24 hours per day).
    periods_in_return = return_year * 365.25 * 24 / short_term_period_hr

    return ppf(1 - 1 / periods_in_return)
It implements +methodologies based on standards such as IEC TS 62600-3:2020 ED1, +incorporating statistical binning, moment calculations, and fatigue +damage estimation using the rainflow counting algorithm. Key +functionalities include: + + - `bin_statistics`: Bins time-series data against a specified signal, + such as wind speed, to calculate mean and standard deviation statistics + for each bin, following IEC TS 62600-3:2020 ED1 guidelines. It supports + output in both pandas DataFrame and xarray Dataset formats. + + - `blade_moments`: Calculates the flapwise and edgewise moments of turbine + blades using derived calibration coefficients and raw strain signals. + This function is crucial for understanding the loading and performance + characteristics of turbine blades. + + - `damage_equivalent_load`: Estimates the damage equivalent load (DEL) + of a single data signal using a 4-point rainflow counting algorithm. + This method is vital for assessing fatigue life and durability of + materials under variable amplitude loading. + +References: +- C. Amzallag et. al., International Journal of Fatigue, 16 (1994) 287-293. +- ISO 12110-2, Metallic materials - Fatigue testing - Variable amplitude fatigue testing. +- G. Marsh et. al., International Journal of Fatigue, 82 (2016) 757-765. 
+""" + +from typing import Union, List, Tuple, Optional from scipy.stats import binned_statistic -import pandas as pd +import pandas as pd +import xarray as xr import numpy as np import fatpack +from mhkit.utils.type_handling import to_numeric_array -def bin_statistics(data,bin_against,bin_edges,data_signal=[]): + +def bin_statistics( + data: Union[pd.DataFrame, xr.Dataset], + bin_against: np.ndarray, + bin_edges: np.ndarray, + data_signal: Optional[List[str]] = None, + to_pandas: bool = True, +) -> Tuple[Union[pd.DataFrame, xr.Dataset], Union[pd.DataFrame, xr.Dataset]]: """ - Bins calculated statistics against data signal (or channel) + Bins calculated statistics against data signal (or channel) according to IEC TS 62600-3:2020 ED1. - + Parameters ----------- - data : pandas DataFrame - Time-series statistics of data signal(s) + data : pandas DataFrame or xarray Dataset + Time-series statistics of data signal(s) bin_against : array Data signal to bin data against (e.g. wind speed) bin_edges : array Bin edges with consistent step size - data_signal : list, optional + data_signal : list, optional List of data signal(s) to bin, default = all data signals - + to_pandas: bool (optional) + Flag to output pandas instead of xarray. Default = True. + Returns -------- - bin_mean : pandas DataFrame + bin_mean : pandas DataFrame or xarray Dataset Mean of each bin - bin_std : pandas DataFrame + bin_std : pandas DataFrame or xarray Dataset Standard deviation of each bim """ - assert isinstance(data, pd.DataFrame), 'data must be of type pd.DataFram' - try: bin_against = np.asarray(bin_against) - except: 'bin_against must be of type np.ndarray' - try: bin_edges = np.asarray(bin_edges) - except: 'bin_edges must be of type np.ndarray' + if not isinstance(data, (pd.DataFrame, xr.Dataset)): + raise TypeError( + f"data must be of type pd.DataFrame or xr.Dataset. 
Got: {type(data)}" + ) + + # Use _to_numeric_array to process bin_against and bin_edges + bin_against = to_numeric_array(bin_against, "bin_against") + bin_edges = to_numeric_array(bin_edges, "bin_edges") + + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. Got: {type(to_pandas)}") + # If input is pandas, convert to xarray + if isinstance(data, pd.DataFrame): + data = data.to_xarray() + + if data_signal is None: + data_signal = [] # Determine variables to analyze - if len(data_signal)==0: # if not specified, bin all variables - data_signal=data.columns.values + if len(data_signal) == 0: # if not specified, bin all variables + data_signal = list(data.keys()) else: - assert isinstance(data_signal, list), 'must be of type list' + if not isinstance(data_signal, list): + raise TypeError( + f"data_signal must be of type list. Got: {type(data_signal)}" + ) - # Pre-allocate list variables - bin_stat_list = [] - bin_std_list = [] + # Pre-allocate variable dictionaries + bin_stat_list = {} + bin_std_list = {} # loop through data_signal and get binned means for signal_name in data_signal: # Bin data - bin_stat = binned_statistic(bin_against,data[signal_name], - statistic='mean',bins=bin_edges) - # Calculate std of bins - std = [] - stdev = pd.DataFrame(data[signal_name]) - stdev.set_index(bin_stat.binnumber,inplace=True) - for i in range(1,len(bin_stat.bin_edges)): - try: - temp = stdev.loc[i].std(ddof=0) - std.append(temp[0]) - except: - std.append(np.nan) - bin_stat_list.append(bin_stat.statistic) - bin_std_list.append(std) - - # Convert to DataFrames - bin_mean = pd.DataFrame(np.transpose(bin_stat_list),columns=data_signal) - bin_std = pd.DataFrame(np.transpose(bin_std_list),columns=data_signal) - - # Check for nans - if bin_mean.isna().any().any(): - print('Warning: some bins may be empty!') + bin_stat_mean = binned_statistic( + bin_against, data[signal_name], statistic="mean", bins=bin_edges + ) + bin_stat_std = binned_statistic( + 
bin_against, data[signal_name], statistic="std", bins=bin_edges + ) + + bin_stat_list[signal_name] = ("index", bin_stat_mean.statistic) + bin_std_list[signal_name] = ("index", bin_stat_std.statistic) + + # Convert to Datasets + bin_mean = xr.Dataset( + data_vars=bin_stat_list, + coords={"index": np.arange(0, len(bin_stat_mean.statistic))}, + ) + bin_std = xr.Dataset( + data_vars=bin_std_list, + coords={"index": np.arange(0, len(bin_stat_std.statistic))}, + ) + + # Check for nans + for variable in list(bin_mean.variables): + if bin_mean[variable].isnull().any(): + print("Warning: bins for some variables may be empty!") + break + + if to_pandas: + bin_mean = bin_mean.to_pandas() + bin_std = bin_std.to_pandas() return bin_mean, bin_std -def blade_moments(blade_coefficients,flap_offset,flap_raw,edge_offset,edge_raw): - ''' +def blade_moments( + blade_coefficients: np.ndarray, + flap_offset: float, + flap_raw: np.ndarray, + edge_offset: float, + edge_raw: np.ndarray, +) -> Tuple[np.ndarray, np.ndarray]: + """ Transfer function for deriving blade flap and edge moments using blade matrix. 
Parameters @@ -88,42 +157,51 @@ def blade_moments(blade_coefficients,flap_offset,flap_raw,edge_offset,edge_raw): Derived offset of raw edge signal obtained during calibration process edge_raw : numpy array Raw strain signal of blade in the edgewise direction - + Returns -------- M_flap : numpy array Blade flapwise moment in SI units M_edge : numpy array Blade edgewise moment in SI units - ''' - - try: blade_coefficients = np.asarray(blade_coefficients) - except: 'blade_coefficients must be of type np.ndarray' - try: flap_raw = np.asarray(flap_raw) - except: 'flap_raw must be of type np.ndarray' - try: edge_raw = np.asarray(edge_raw) - except: 'edge_raw must be of type np.ndarray' - - assert isinstance(flap_offset, (float,int)), 'flap_offset must be of type int or float' - assert isinstance(edge_offset, (float,int)), 'edge_offset must be of type int or float' - + """ + + # Convert and validate blade_coefficients, flap_raw, and edge_raw + blade_coefficients = to_numeric_array(blade_coefficients, "blade_coefficients") + flap_raw = to_numeric_array(flap_raw, "flap_raw") + edge_raw = to_numeric_array(edge_raw, "edge_raw") + + if not isinstance(flap_offset, (float, int)): + raise TypeError( + f"flap_offset must be of type int or float. Got: {type(flap_offset)}" + ) + if not isinstance(edge_offset, (float, int)): + raise TypeError( + f"edge_offset must be of type int or float. 
Got: {type(edge_offset)}" + ) + # remove offset from raw signal flap_signal = flap_raw - flap_offset edge_signal = edge_raw - edge_offset # apply matrix to get load signals - M_flap = blade_coefficients[0]*flap_signal + blade_coefficients[1]*edge_signal - M_edge = blade_coefficients[2]*flap_signal + blade_coefficients[3]*edge_signal + m_flap = blade_coefficients[0] * flap_signal + blade_coefficients[1] * edge_signal + m_edge = blade_coefficients[2] * flap_signal + blade_coefficients[3] * edge_signal - return M_flap, M_edge + return m_flap, m_edge -def damage_equivalent_load(data_signal, m, bin_num=100, data_length=600): - ''' - Calculates the damage equivalent load of a single data signal (or channel) - based on IEC TS 62600-3:2020 ED1. 4-point rainflow counting algorithm from +def damage_equivalent_load( + data_signal: np.ndarray, + m: Union[float, int], + bin_num: int = 100, + data_length: Union[float, int] = 600, +) -> float: + """ + Calculates the damage equivalent load of a single data signal (or channel) + based on IEC TS 62600-3:2020 ED1. 4-point rainflow counting algorithm from fatpack module is based on the following resources: - + - `C. Amzallag et. al. Standardization of the rainflow counting method for fatigue analysis. International Journal of Fatigue, 16 (1994) 287-293` - `ISO 12110-2, Metallic materials - Fatigue testing - Variable amplitude @@ -131,7 +209,7 @@ def damage_equivalent_load(data_signal, m, bin_num=100, data_length=600): - `G. Marsh et. al. Review and application of Rainflow residue processing techniques for accurate fatigue damage estimation. 
International Journal of Fatigue, 82 (2016) 757-765` - + Parameters: ----------- @@ -143,25 +221,29 @@ def damage_equivalent_load(data_signal, m, bin_num=100, data_length=600): Number of bins for rainflow counting method (minimum=100) data_length : float/int Length of measured data (seconds) - + Returns -------- DEL : float Damage equivalent load (DEL) of single data signal - ''' - - try: data_signal = np.array(data_signal) - except: 'data_signal must be of type np.ndarray' - assert isinstance(m, (float,int)), 'm must be of type float or int' - assert isinstance(bin_num, (float,int)), 'bin_num must be of type float or int' - assert isinstance(data_length, (float,int)), 'data_length must be of type float or int' + """ + + to_numeric_array(data_signal, "data_signal") + if not isinstance(m, (float, int)): + raise TypeError(f"m must be of type float or int. Got: {type(m)}") + if not isinstance(bin_num, (float, int)): + raise TypeError(f"bin_num must be of type float or int. Got: {type(bin_num)}") + if not isinstance(data_length, (float, int)): + raise TypeError( + f"data_length must be of type float or int. Got: {type(data_length)}" + ) - rainflow_ranges = fatpack.find_rainflow_ranges(data_signal,k=256) + rainflow_ranges = fatpack.find_rainflow_ranges(data_signal, k=256) # Range count and bin - Nrf, Srf = fatpack.find_range_count(rainflow_ranges, bin_num) + n_rf, s_rf = fatpack.find_range_count(rainflow_ranges, bin_num) - DELs = Srf**m * Nrf / data_length - DEL = DELs.sum() ** (1/m) + del_s = s_rf**m * n_rf / data_length + del_value = del_s.sum() ** (1 / m) - return DEL + return del_value diff --git a/mhkit/loads/graphics.py b/mhkit/loads/graphics.py index 291e028af..26847f5ef 100644 --- a/mhkit/loads/graphics.py +++ b/mhkit/loads/graphics.py @@ -1,8 +1,36 @@ -import matplotlib.pyplot as plt +""" +This module provides functionalities for plotting statistical data +related to a given variable or dataset. 
+ + - `plot_statistics` is designed to plot raw statistical measures + (mean, maximum, minimum, and optional standard deviation) of a + variable across a series of x-axis values. It allows for + customization of plot labels, title, and saving the plot to a file. + + - `plot_bin_statistics` extends these capabilities to binned data, + offering a way to visualize binned statistics (mean, maximum, minimum) + along with their respective standard deviations. This function also + supports label and title customization, as well as saving the plot to + a specified path. +""" + +from typing import Optional, Dict, Any import numpy as np +import matplotlib.pyplot as plt + +from mhkit.utils.type_handling import to_numeric_array + -def plot_statistics(x,y_mean,y_max,y_min,y_stdev=[],**kwargs): - ''' +# pylint: disable=R0914 +def plot_statistics( + x: np.ndarray, + y_mean: np.ndarray, + y_max: np.ndarray, + y_min: np.ndarray, + y_stdev: Optional[np.ndarray] = None, + **kwargs: Dict[str, Any], +) -> plt.Axes: + """ Plot showing standard raw statistics of variable Parameters @@ -17,7 +45,7 @@ def plot_statistics(x,y_mean,y_max,y_min,y_stdev=[],**kwargs): Array of min statistical values of variable y_stdev : numpy array, optional Array of standard deviation statistical values of variable - **kwargs : optional + **kwargs : optional x_label : string x axis label for plot y_label : string @@ -30,53 +58,72 @@ def plot_statistics(x,y_mean,y_max,y_min,y_stdev=[],**kwargs): Returns -------- ax : matplotlib pyplot axes - ''' - - try: x = np.array(x) - except: 'x must be of type np.ndarray' - try: y_mean = np.array(y_mean) - except: 'y_mean must be of type np.ndarray' - try:y_max = np.array(y_max) - except: 'y_max must be of type np.ndarray' - try: y_min = np.array(y_min) - except: 'y_min must be of type np.ndarray' - - x_label = kwargs.get("x_label", None) - y_label = kwargs.get("y_label", None) - title = kwargs.get("title", None) + """ + if y_stdev is None: + y_stdev = [] + + 
input_variables = [x, y_mean, y_max, y_min, y_stdev] + + variable_names = ["x", "y_mean", "y_max", "y_min", "y_stdev"] + # Convert each input variable to a numeric array, ensuring all are numeric + for i, variable in enumerate(input_variables): + input_variables[i] = to_numeric_array(variable, variable_names[i]) + + x, y_mean, y_max, y_min, y_stdev = input_variables + + x_label = kwargs.get("x_label", None) + y_label = kwargs.get("y_label", None) + title = kwargs.get("title", None) save_path = kwargs.get("save_path", None) - - assert isinstance(x_label, (str, type(None))), 'x_label must be of type str' - assert isinstance(y_label, (str, type(None))), 'y_label must be of type str' - assert isinstance(title, (str, type(None))), 'title must be of type str' - assert isinstance(save_path, (str, type(None))), 'save_path must be of type str' - - fig, ax = plt.subplots(figsize=(6,4)) - ax.plot(x,y_max,'^',label='max',mfc='none') - ax.plot(x,y_mean,'o',label='mean',mfc='none') - ax.plot(x,y_min,'v',label='min',mfc='none') - - if len(y_stdev)>0: ax.plot(x,y_stdev,'+',label='stdev',c='m') + + if not isinstance(x_label, (str, type(None))): + raise TypeError(f"x_label must be of type str. Got: {type(x_label)}") + if not isinstance(y_label, (str, type(None))): + raise TypeError(f"y_label must be of type str. Got: {type(y_label)}") + if not isinstance(title, (str, type(None))): + raise TypeError(f"title must be of type str. Got: {type(title)}") + if not isinstance(save_path, (str, type(None))): + raise TypeError(f"save_path must be of type str. 
Got: {type(save_path)}") + + fig, ax = plt.subplots(figsize=(6, 4)) + ax.plot(x, y_max, "^", label="max", mfc="none") + ax.plot(x, y_mean, "o", label="mean", mfc="none") + ax.plot(x, y_min, "v", label="min", mfc="none") + + if len(y_stdev) > 0: + ax.plot(x, y_stdev, "+", label="stdev", c="m") ax.grid(alpha=0.4) - ax.legend(loc='best') - - if x_label!=None: ax.set_xlabel(x_label) - if y_label!=None: ax.set_ylabel(y_label) - if title!=None: ax.set_title(title) - + ax.legend(loc="best") + + if x_label: + ax.set_xlabel(x_label) + if y_label: + ax.set_ylabel(y_label) + if title: + ax.set_title(title) + fig.tight_layout() - - if save_path==None: plt.show() - else: + + if save_path is None: + plt.show() + else: fig.savefig(save_path) plt.close() return ax -def plot_bin_statistics(bin_centers, bin_mean,bin_max, bin_min, - bin_mean_std, bin_max_std, bin_min_std, - **kwargs): - ''' +# pylint: disable=R0913 +def plot_bin_statistics( + bin_centers: np.ndarray, + bin_mean: np.ndarray, + bin_max: np.ndarray, + bin_min: np.ndarray, + bin_mean_std: np.ndarray, + bin_max_std: np.ndarray, + bin_min_std: np.ndarray, + **kwargs: Dict[str, Any], +) -> plt.Axes: + """ Plot showing standard binned statistics of single variable Parameters @@ -95,7 +142,7 @@ def plot_bin_statistics(bin_centers, bin_mean,bin_max, bin_min, Standard deviations of max binned statistics bin_min_std : numpy array Standard deviations of min binned statistics - **kwargs : optional + **kwargs : optional x_label : string x axis label for plot y_label : string @@ -108,55 +155,99 @@ def plot_bin_statistics(bin_centers, bin_mean,bin_max, bin_min, Returns -------- ax : matplotlib pyplot axes - ''' - - try: bin_centers = np.asarray(bin_centers) - except: 'bin_centers must be of type np.ndarray' - - try: bin_mean = np.asarray(bin_mean) - except: 'bin_mean must be of type np.ndarray' - try: bin_max = np.asarray(bin_max) - except:'bin_max must be of type np.ndarray' - try: bin_min = np.asarray(bin_min) - except: 'bin_min 
must be of type type np.ndarray' - - try: bin_mean_std = np.asarray(bin_mean_std) - except: 'bin_mean_std must be of type np.ndarray' - try: bin_max_std = np.asarray(bin_max_std) - except: 'bin_max_std must be of type np.ndarray' - try: bin_min_std = np.asarray(bin_min_std) - except: 'bin_min_std must be of type np.ndarray' - - x_label = kwargs.get("x_label", None) - y_label = kwargs.get("y_label", None) - title = kwargs.get("title", None) + """ + + input_variables = [ + bin_centers, + bin_mean, + bin_max, + bin_min, + bin_mean_std, + bin_max_std, + bin_min_std, + ] + variable_names = [ + "bin_centers", + "bin_mean", + "bin_max", + "bin_min", + "bin_mean_std", + "bin_max_std", + "bin_min_std", + ] + + # Convert each input variable to a numeric array, ensuring all are numeric + for i, variable in enumerate(input_variables): + input_variables[i] = to_numeric_array(variable, variable_names[i]) + + ( + bin_centers, + bin_mean, + bin_max, + bin_min, + bin_mean_std, + bin_max_std, + bin_min_std, + ) = input_variables + + x_label = kwargs.get("x_label", None) + y_label = kwargs.get("y_label", None) + title = kwargs.get("title", None) save_path = kwargs.get("save_path", None) - - assert isinstance(x_label, (str, type(None))), 'x_label must be of type str' - assert isinstance(y_label, (str, type(None))), 'y_label must be of type str' - assert isinstance(title, (str, type(None))), 'title must be of type str' - assert isinstance(save_path, (str, type(None))), 'save_path must be of type str' - - fig, ax = plt.subplots(figsize=(7,5)) - ax.errorbar(bin_centers,bin_max,marker='^',mfc='none', - yerr=bin_max_std,capsize=4,label='max') - ax.errorbar(bin_centers,bin_mean,marker='o',mfc='none', - yerr=bin_mean_std,capsize=4,label='mean') - ax.errorbar(bin_centers,bin_min,marker='v',mfc='none', - yerr=bin_min_std,capsize=4,label='min') - + + if not isinstance(x_label, (str, type(None))): + raise TypeError(f"x_label must be of type str. 
Got: {type(x_label)}") + if not isinstance(y_label, (str, type(None))): + raise TypeError(f"y_label must be of type str. Got: {type(y_label)}") + if not isinstance(title, (str, type(None))): + raise TypeError(f"title must be of type str. Got: {type(title)}") + if not isinstance(save_path, (str, type(None))): + raise TypeError(f"save_path must be of type str. Got: {type(save_path)}") + + fig, ax = plt.subplots(figsize=(7, 5)) + ax.errorbar( + bin_centers, + bin_max, + marker="^", + mfc="none", + yerr=bin_max_std, + capsize=4, + label="max", + ) + ax.errorbar( + bin_centers, + bin_mean, + marker="o", + mfc="none", + yerr=bin_mean_std, + capsize=4, + label="mean", + ) + ax.errorbar( + bin_centers, + bin_min, + marker="v", + mfc="none", + yerr=bin_min_std, + capsize=4, + label="min", + ) + ax.grid(alpha=0.5) - ax.legend(loc='best') - - if x_label!=None: ax.set_xlabel(x_label) - if y_label!=None: ax.set_ylabel(y_label) - if title!=None: ax.set_title(title) - + ax.legend(loc="best") + + if x_label: + ax.set_xlabel(x_label) + if y_label: + ax.set_ylabel(y_label) + if title: + ax.set_title(title) + fig.tight_layout() - - if save_path==None: plt.show() - else: + + if save_path is None: + plt.show() + else: fig.savefig(save_path) plt.close() return ax - diff --git a/mhkit/mooring/graphics.py b/mhkit/mooring/graphics.py index a8dc678df..389953c45 100644 --- a/mhkit/mooring/graphics.py +++ b/mhkit/mooring/graphics.py @@ -29,8 +29,22 @@ from matplotlib.animation import FuncAnimation -def animate(dsani, dimension='2d', xaxis='x', yaxis='z', zaxis='y', xlim=None, ylim=None, zlim=None, - interval=10, repeat=False, xlabel=None, ylabel=None, zlabel=None, title=None): +def animate( + dsani, + dimension="2d", + xaxis="x", + yaxis="z", + zaxis="y", + xlim=None, + ylim=None, + zlim=None, + interval=10, + repeat=False, + xlabel=None, + ylabel=None, + zlabel=None, + title=None, +): """ Graphics function that creates a 2D or 3D animation of the node positions of a mooring line over time. 
@@ -73,25 +87,26 @@ def animate(dsani, dimension='2d', xaxis='x', yaxis='z', zaxis='y', xlim=None, y Raises ------ TypeError - Checks for correct input types for dsani, dimension, xaxis, yaxis, zaxis, xlim, ylim, + Checks for correct input types for dsani, dimension, xaxis, yaxis, zaxis, xlim, ylim, zlim, interval, repeat, xlabel, ylabel, zlabel, and title """ - _validate_input(dsani, xlim, ylim, interval, repeat, - xlabel, ylabel, title, dimension) - if dimension == '3d': + _validate_input( + dsani, xlim, ylim, interval, repeat, xlabel, ylabel, title, dimension + ) + if dimension == "3d": if not isinstance(zlim, (list, type(None))): - raise TypeError('zlim must be of type list') + raise TypeError("zlim must be of type list") if not isinstance(zlabel, (str, type(None))): - raise TypeError('zlabel must be of type str') + raise TypeError("zlabel must be of type str") if not isinstance(xaxis, str): - raise TypeError('xaxis must be of type str') + raise TypeError("xaxis must be of type str") if not isinstance(yaxis, str): - raise TypeError('yaxis must be of type str') + raise TypeError("yaxis must be of type str") if not isinstance(zaxis, str): - raise TypeError('zaxis must be of type str') + raise TypeError("zaxis must be of type str") current_idx = list(dsani.dims.mapping.keys())[0] - dsani = dsani.rename({current_idx: 'time'}) + dsani = dsani.rename({current_idx: "time"}) nodes_x, nodes_y, nodes_z = _get_axis_nodes(dsani, xaxis, yaxis, zaxis) @@ -99,18 +114,18 @@ def animate(dsani, dimension='2d', xaxis='x', yaxis='z', zaxis='y', xlim=None, y xlim = _find_limits(dsani[nodes_x]) if not ylim: ylim = _find_limits(dsani[nodes_y]) - if dimension == '3d' and not zlim: + if dimension == "3d" and not zlim: zlim = _find_limits(dsani[nodes_z]) fig = plt.figure() - if dimension == '3d': - ax = fig.add_subplot(projection='3d') + if dimension == "3d": + ax = fig.add_subplot(projection="3d") else: ax = fig.add_subplot() ax.grid() - if dimension == '2d': - ln, = ax.plot([], [], 
'-o') + if dimension == "2d": + (ln,) = ax.plot([], [], "-o") def init(): ax.set(xlim=xlim, ylim=ylim) @@ -122,8 +137,8 @@ def update(frame): y = dsani[nodes_y].isel(time=frame).to_array().values ln.set_data(x, y) - elif dimension == '3d': - ln, = ax.plot([], [], [], '-o') + elif dimension == "3d": + (ln,) = ax.plot([], [], [], "-o") def init(): ax.set(xlim3d=xlim, ylim3d=ylim, zlim3d=zlim) @@ -137,33 +152,41 @@ def update(frame): ln.set_data(x, y) ln.set_3d_properties(z) - ani = FuncAnimation(fig, update, frames=len(dsani.time), - init_func=init, interval=interval, repeat=repeat) + ani = FuncAnimation( + fig, + update, + frames=len(dsani.time), + init_func=init, + interval=interval, + repeat=repeat, + ) return ani -def _validate_input(dsani, xlim, ylim, interval, repeat, xlabel, ylabel, title, dimension): +def _validate_input( + dsani, xlim, ylim, interval, repeat, xlabel, ylabel, title, dimension +): """ Validate common input parameters for animate function. """ if not isinstance(dsani, xr.Dataset): - raise TypeError('dsani must be of type xr.Dataset') + raise TypeError("dsani must be of type xr.Dataset") if not isinstance(xlim, (list, type(None))): - raise TypeError('xlim must be of type list') + raise TypeError("xlim must be of type list") if not isinstance(ylim, (list, type(None))): - raise TypeError('ylim must be of type list') + raise TypeError("ylim must be of type list") if not isinstance(interval, int): - raise TypeError('interval must be of type int') + raise TypeError("interval must be of type int") if not isinstance(repeat, bool): - raise TypeError('repeat must be of type bool') + raise TypeError("repeat must be of type bool") if not isinstance(xlabel, (str, type(None))): - raise TypeError('xlabel must be of type str') + raise TypeError("xlabel must be of type str") if not isinstance(ylabel, (str, type(None))): - raise TypeError('ylabel must be of type str') + raise TypeError("ylabel must be of type str") if not isinstance(title, (str, type(None))): - 
raise TypeError('title must be of type str') - if dimension not in ['2d', '3d']: + raise TypeError("title must be of type str") + if dimension not in ["2d", "3d"]: raise ValueError('dimension must be either "2d" or "3d"') @@ -191,10 +214,10 @@ def _get_axis_nodes(dsani, xaxis, yaxis, zaxis): nodesZ : list List of nodes along the z-axis """ - nodes = [s for s in list(dsani.data_vars) if 'Node' in s] - nodes_x = [s for s in nodes if f'p{xaxis}' in s] - nodes_y = [s for s in nodes if f'p{yaxis}' in s] - nodes_z = [s for s in nodes if f'p{zaxis}' in s] + nodes = [s for s in list(dsani.data_vars) if "Node" in s] + nodes_x = [s for s in nodes if f"p{xaxis}" in s] + nodes_y = [s for s in nodes if f"p{yaxis}" in s] + nodes_z = [s for s in nodes if f"p{zaxis}" in s] return nodes_x, nodes_y, nodes_z @@ -213,9 +236,9 @@ def _find_limits(dataset): Min and max plot limits for axis """ x_1 = dataset.min().to_array().min().values - x_1 = x_1 - abs(x_1*0.1) + x_1 = x_1 - abs(x_1 * 0.1) x_2 = dataset.max().to_array().max().values - x_2 = x_2 + abs(x_2*0.1) + x_2 = x_2 + abs(x_2 * 0.1) return [x_1, x_2] diff --git a/mhkit/mooring/io.py b/mhkit/mooring/io.py index bb5715193..a85c92358 100644 --- a/mhkit/mooring/io.py +++ b/mhkit/mooring/io.py @@ -16,15 +16,16 @@ dataset = read_moordyn(filepath="FAST.MD.out", input_file="FAST.MD.input") """ + import os import pandas as pd def read_moordyn(filepath, input_file=None): """ - Reads in MoorDyn OUT files such as "FAST.MD.out" and - "FAST.MD.Line1.out" and stores inside xarray. Also allows for - parsing and storage of MoorDyn input file as attributes inside + Reads in MoorDyn OUT files such as "FAST.MD.out" and + "FAST.MD.Line1.out" and stores inside xarray. Also allows for + parsing and storage of MoorDyn input file as attributes inside the xarray. 
Parameters @@ -45,15 +46,16 @@ def read_moordyn(filepath, input_file=None): Checks for correct input types for filepath and input_file """ if not isinstance(filepath, str): - raise TypeError('filepath must be of type str') + raise TypeError("filepath must be of type str") if input_file: if not isinstance(input_file, str): - raise TypeError('input_file must be of type str') + raise TypeError("input_file must be of type str") if not os.path.isfile(filepath): raise FileNotFoundError(f"No file found at provided path: {filepath}") - data = pd.read_csv(filepath, header=0, skiprows=[ - 1], sep=' ', skipinitialspace=True, index_col=0) + data = pd.read_csv( + filepath, header=0, skiprows=[1], sep=" ", skipinitialspace=True, index_col=0 + ) data = data.dropna(axis=1) dataset = data.to_xarray() @@ -80,11 +82,13 @@ def _moordyn_input(input_file, dataset): return Dataset that includes input file parameters as attributes """ - with open(input_file, 'r', encoding='utf-8') as moordyn_file: - for line in moordyn_file: # loop through each line in the file + with open(input_file, "r", encoding="utf-8") as moordyn_file: + for line in moordyn_file: # loop through each line in the file # get line type property sets - if line.count('---') > 0 and (line.upper().count('LINE DICTIONARY') > 0 or - line.upper().count('LINE TYPES') > 0): + if line.count("---") > 0 and ( + line.upper().count("LINE DICTIONARY") > 0 + or line.upper().count("LINE TYPES") > 0 + ): linetypes = dict() # skip this header line, plus channel names and units lines line = next(moordyn_file) @@ -92,19 +96,21 @@ def _moordyn_input(input_file, dataset): line = next(moordyn_file) units = line.split() line = next(moordyn_file) - while line.count('---') == 0: + while line.count("---") == 0: entries = line.split() linetypes[entries[0]] = dict() for x in range(1, len(entries)): linetypes[entries[0]][variables[x]] = entries[x] line = next(moordyn_file) - linetypes['units'] = units[1:] - dataset.attrs['LINE_TYPES'] = linetypes + 
linetypes["units"] = units[1:] + dataset.attrs["LINE_TYPES"] = linetypes # get properties of each Point - if line.count('---') > 0 and (line.upper().count('POINTS') > 0 - or line.upper().count('POINT LIST') > 0 - or line.upper().count('POINT PROPERTIES') > 0): + if line.count("---") > 0 and ( + line.upper().count("POINTS") > 0 + or line.upper().count("POINT LIST") > 0 + or line.upper().count("POINT PROPERTIES") > 0 + ): # skip this header line, plus channel names and units lines line = next(moordyn_file) variables = line.split() @@ -112,19 +118,21 @@ def _moordyn_input(input_file, dataset): units = line.split() line = next(moordyn_file) points = dict() - while line.count('---') == 0: + while line.count("---") == 0: entries = line.split() points[entries[0]] = dict() for x in range(1, len(entries)): points[entries[0]][variables[x]] = entries[x] line = next(moordyn_file) - points['units'] = units[1:] - dataset.attrs['POINTS'] = points + points["units"] = units[1:] + dataset.attrs["POINTS"] = points # get properties of each line - if line.count('---') > 0 and (line.upper().count('LINES') > 0 - or line.upper().count('LINE LIST') > 0 - or line.upper().count('LINE PROPERTIES') > 0): + if line.count("---") > 0 and ( + line.upper().count("LINES") > 0 + or line.upper().count("LINE LIST") > 0 + or line.upper().count("LINE PROPERTIES") > 0 + ): # skip this header line, plus channel names and units lines line = next(moordyn_file) variables = line.split() @@ -132,24 +140,24 @@ def _moordyn_input(input_file, dataset): units = line.split() line = next(moordyn_file) lines = {} - while line.count('---') == 0: + while line.count("---") == 0: entries = line.split() lines[entries[0]] = dict() for x in range(1, len(entries)): lines[entries[0]][variables[x]] = entries[x] line = next(moordyn_file) - lines['units'] = units[1:] - dataset.attrs['LINES'] = lines + lines["units"] = units[1:] + dataset.attrs["LINES"] = lines # get options entries - if line.count('---') > 0 and "options" in 
line.lower(): + if line.count("---") > 0 and "options" in line.lower(): line = next(moordyn_file) # skip this header line options = {} - while line.count('---') == 0: + while line.count("---") == 0: entries = line.split() options[entries[1]] = entries[0] line = next(moordyn_file) - dataset.attrs['OPTIONS'] = options + dataset.attrs["OPTIONS"] = options moordyn_file.close() diff --git a/mhkit/mooring/main.py b/mhkit/mooring/main.py index c4221a850..a5ebeafa4 100644 --- a/mhkit/mooring/main.py +++ b/mhkit/mooring/main.py @@ -27,40 +27,41 @@ def lay_length(dataset, depth, tolerance=0.25): Checks for correct input types for ds, depth, and tolerance """ if not isinstance(dataset, xr.Dataset): - raise TypeError('dataset must be of type xr.Dataset') + raise TypeError("dataset must be of type xr.Dataset") if not isinstance(depth, (float, int)): - raise TypeError('depth must be of type float or int') + raise TypeError("depth must be of type float or int") if not isinstance(tolerance, (float, int)): - raise TypeError('tolerance must be of type float or int') + raise TypeError("tolerance must be of type float or int") # get channel names chans = list(dataset.keys()) - nodes_x = [x for x in chans if 'x' in x] - nodes_y = [y for y in chans if 'y' in y] - nodes_z = [z for z in chans if 'z' in z] + nodes_x = [x for x in chans if "x" in x] + nodes_y = [y for y in chans if "y" in y] + nodes_z = [z for z in chans if "z" in z] # check if the dataset contains the necessary 'x', 'y', 'z' nodes if not nodes_x or not nodes_y or not nodes_z: - raise ValueError('The dataset must contain x, y, and z node data') + raise ValueError("The dataset must contain x, y, and z node data") if len(nodes_z) < 3: raise ValueError( - 'This function requires at least 3 nodes to calculate lay length') + "This function requires at least 3 nodes to calculate lay length" + ) # find name of first z point where tolerance is exceeded - laypoint = dataset[nodes_z].where(dataset[nodes_z] > depth+abs(tolerance)) + 
laypoint = dataset[nodes_z].where(dataset[nodes_z] > depth + abs(tolerance)) laypoint = laypoint.to_dataframe().dropna(axis=1).columns[0] # get previous z-point lay_indx = nodes_z.index(laypoint) - 1 lay_z = nodes_z[lay_indx] # get corresponding x-point and y-point node names - lay_x = lay_z[:-1] + 'x' - lay_y = lay_z[:-1] + 'y' + lay_x = lay_z[:-1] + "x" + lay_y = lay_z[:-1] + "y" lay_0x = nodes_x[0] lay_0y = nodes_y[0] # find distance between initial point and lay point laylength_x = dataset[lay_x] - dataset[lay_0x] laylength_y = dataset[lay_y] - dataset[lay_0y] - line_lay_length = (laylength_x**2 + laylength_y**2) ** (1/2) + line_lay_length = (laylength_x**2 + laylength_y**2) ** (1 / 2) return line_lay_length diff --git a/mhkit/power/__init__.py b/mhkit/power/__init__.py index 0056a8f31..5cae03212 100644 --- a/mhkit/power/__init__.py +++ b/mhkit/power/__init__.py @@ -1,3 +1,6 @@ +""" +Power Module +""" + from mhkit.power import quality from mhkit.power import characteristics - diff --git a/mhkit/power/characteristics.py b/mhkit/power/characteristics.py index 08578f984..0ae45a789 100644 --- a/mhkit/power/characteristics.py +++ b/mhkit/power/characteristics.py @@ -1,112 +1,252 @@ +""" +This module contains functions for calculating electrical power metrics from +measured voltage and current data. It supports both direct current (DC) and +alternating current (AC) calculations, including instantaneous frequency +analysis for AC signals and power calculations for three-phase AC systems. +The calculations can accommodate both line-to-neutral and line-to-line voltage +measurements and offer flexibility in output formats, allowing results to be +saved as either pandas DataFrames or xarray Datasets. + +Functions: + instantaneous_frequency: Calculates the instantaneous frequency of a measured + voltage signal over time. + + dc_power: Computes the DC power from voltage and current measurements, providing + both individual channel outputs and a gross power calculation. 
+ + ac_power_three_phase: Calculates the magnitude of active AC power for three-phase + systems, considering the power factor and voltage measurement configuration + (line-to-neutral or line-to-line). +""" + +from typing import Union import pandas as pd +import xarray as xr import numpy as np from scipy.signal import hilbert -import datetime +from mhkit.utils import convert_to_dataset -def instantaneous_frequency(um): +def instantaneous_frequency( + measured_voltage: Union[pd.Series, pd.DataFrame, xr.DataArray, xr.Dataset], + time_dimension: str = "", + to_pandas: bool = True, +) -> Union[pd.DataFrame, xr.Dataset]: """ Calculates instantaneous frequency of measured voltage - - + Parameters ----------- - um: pandas Series or DataFrame - Measured voltage (V) indexed by time + measured_voltage: pandas Series, pandas DataFrame, xarray DataArray, + or xarray Dataset Measured voltage (V) indexed by time + + time_dimension: string (optional) + Name of the xarray dimension corresponding to time. If not supplied, + defaults to the first dimension. Does not affect pandas input. + + to_pandas: bool (Optional) + Flag to save output to pandas instead of xarray. Default = True. - Returns --------- - frequency: pandas DataFrame - Frequency of the measured voltage (Hz) indexed by time + frequency: pandas DataFrame or xarray Dataset + Frequency of the measured voltage (Hz) indexed by time with signal name columns - """ - assert isinstance(um, (pd.Series, pd.DataFrame)), 'um must be of type pd.Series or pd.DataFrame' - - if isinstance(um.index[0], datetime.datetime): - t = (um.index - datetime.datetime(1970,1,1)).total_seconds() + """ + if not isinstance( + measured_voltage, (pd.Series, pd.DataFrame, xr.DataArray, xr.Dataset) + ): + raise TypeError( + "measured_voltage must be of type pd.Series, pd.DataFrame, " + + f"xr.DataArray, or xr.Dataset. Got {type(measured_voltage)}" + ) + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. 
Got: {type(to_pandas)}") + if not isinstance(time_dimension, str): + raise TypeError( + f"time_dimension must be of type bool. Got: {type(time_dimension)}" + ) + + # Convert input to xr.Dataset + measured_voltage = convert_to_dataset(measured_voltage, "data") + + if time_dimension != "" and time_dimension not in measured_voltage.coords: + raise ValueError( + "time_dimension was supplied but is not a dimension " + + f"of measured_voltage. Got {time_dimension}" + ) + + # Get the dimension of interest + if time_dimension == "": + time_dimension = list(measured_voltage.coords)[0] + + # Calculate time step + if isinstance(measured_voltage.coords[time_dimension].values[0], np.datetime64): + time = ( + measured_voltage[time_dimension] - np.datetime64("1970-01-01 00:00:00") + ) / np.timedelta64(1, "s") else: - t = um.index + time = measured_voltage[time_dimension] + d_t = np.diff(time) + + # Calculate frequency + frequency = xr.Dataset() + for var in measured_voltage.data_vars: + freq = hilbert(measured_voltage[var]) + instantaneous_phase = np.unwrap(np.angle(freq)) + f_instantaneous = np.diff(instantaneous_phase) / (2.0 * np.pi) * (1 / d_t) - dt = pd.Series(t).diff()[1:] + frequency = frequency.assign({var: (time_dimension, f_instantaneous)}) + frequency = frequency.assign_coords( + {time_dimension: measured_voltage.coords[time_dimension].values[0:-1]} + ) - if isinstance(um,pd.Series): - um = um.to_frame() + if to_pandas: + frequency = frequency.to_pandas() - columns = um.columns - frequency=pd.DataFrame(columns=columns) - for column in um.columns: - f = hilbert(um[column]) - instantaneous_phase = np.unwrap(np.angle(f)) - instantaneous_frequency = np.diff(instantaneous_phase) /(2.0*np.pi) * (1/dt) - frequency[column] = instantaneous_frequency - return frequency -def dc_power(voltage, current): + +def dc_power( + voltage: Union[pd.Series, pd.DataFrame, xr.DataArray, xr.Dataset], + current: Union[pd.Series, pd.DataFrame, xr.DataArray, xr.Dataset], + to_pandas: bool = True, 
+) -> Union[pd.DataFrame, xr.Dataset]: """ Calculates DC power from voltage and current Parameters ----------- - voltage: pandas Series or DataFrame + voltage: pandas Series, pandas DataFrame, xarray DataArray, or xarray Dataset Measured DC voltage [V] indexed by time - current: pandas Series or DataFrame + + current: pandas Series, pandas DataFrame, xarray DataArray, or xarray Dataset Measured three phase current [A] indexed by time - + + to_pandas: bool (Optional) + Flag to save output to pandas instead of xarray. Default = True. + Returns -------- - P: pandas DataFrame + power_dc: pandas DataFrame or xarray Dataset DC power [W] from each channel and gross power indexed by time """ - assert isinstance(voltage, (pd.Series, pd.DataFrame)), 'voltage must be of type pd.Series or pd.DataFrame' - assert isinstance(current, (pd.Series, pd.DataFrame)), 'current must be of type pd.Series or pd.DataFrame' - assert voltage.shape == current.shape, 'current and volatge must have the same shape' - - - P = current.values * voltage.values - P = pd.DataFrame(P) - P['Gross'] = P.sum(axis=1, skipna=True) + if not isinstance(voltage, (pd.Series, pd.DataFrame, xr.DataArray, xr.Dataset)): + raise TypeError( + "voltage must be of type pd.Series, pd.DataFrame, " + + f"xr.DataArray, or xr.Dataset. Got {type(voltage)}" + ) + if not isinstance(current, (pd.Series, pd.DataFrame, xr.DataArray, xr.Dataset)): + raise TypeError( + "current must be of type pd.Series, pd.DataFrame, " + + f"xr.DataArray, or xr.Dataset. Got {type(current)}" + ) + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. 
Got: {type(to_pandas)}") + + # Convert inputs to xr.Dataset + voltage = convert_to_dataset(voltage, "voltage") + current = convert_to_dataset(current, "current") - return P + # Check that sizes are the same + if not ( + voltage.sizes == current.sizes + and len(voltage.data_vars) == len(current.data_vars) + ): + raise ValueError("current and voltage must have the same shape") -def ac_power_three_phase(voltage, current, power_factor, line_to_line=False): + power_dc = xr.Dataset() + gross = None + + # Multiply current and voltage variables together, in order they're assigned + for i, (current_var, voltage_var) in enumerate( + zip(current.data_vars, voltage.data_vars) + ): + temp = current[current_var] * voltage[voltage_var] + power_dc = power_dc.assign({f"{i}": temp}) + if gross is None: + gross = temp + else: + gross = gross + temp + + power_dc = power_dc.assign({"Gross": gross}) + + if to_pandas: + power_dc = power_dc.to_dataframe() + + return power_dc + + +def ac_power_three_phase( + voltage: Union[pd.Series, pd.DataFrame, xr.DataArray, xr.Dataset], + current: Union[pd.Series, pd.DataFrame, xr.DataArray, xr.Dataset], + power_factor: float, + line_to_line: bool = False, + to_pandas: bool = True, +) -> Union[pd.DataFrame, xr.Dataset]: """ - Calculates magnitude of active AC power from line to neutral voltage and current + Calculates magnitude of active AC power from line to neutral voltage and current Parameters ----------- - voltage: pandas DataFrame - Time-series of three phase measured voltage [V] indexed by time - current: pandas DataFrame - Time-series of three phase measured current [A] indexed by time - power_factor: float + voltage: pandas Series, pandas DataFrame, xarray DataArray, or xarray Dataset + Measured DC voltage [V] indexed by time + + current: pandas Series, pandas DataFrame, xarray DataArray, or xarray Dataset + Measured three phase current [A] indexed by time + + power_factor: float Power factor for the efficiency of the system - line_to_line: 
bool + + line_to_line: bool (Optional) Set to true if the given voltage measurements are line_to_line - + + to_pandas: bool (Optional) + Flag to save output to pandas instead of xarray. Default = True. + Returns -------- - P: pandas DataFrame - Magnitude of active AC power [W] indexed by time with Power column + power_ac: pandas DataFrame or xarray Dataset + Magnitude of active AC power [W] indexed by time with Power column """ - assert isinstance(voltage, pd.DataFrame), 'voltage must be of type pd.DataFrame' - assert isinstance(current, pd.DataFrame), 'current must be of type pd.DataFrame' - assert len(voltage.columns) == 3, 'voltage must have three columns' - assert len(current.columns) == 3, 'current must have three columns' - assert current.shape == voltage.shape, 'current and voltage must be of the same size' - + if not isinstance(voltage, (pd.Series, pd.DataFrame, xr.DataArray, xr.Dataset)): + raise TypeError( + "voltage must be of type pd.Series, pd.DataFrame, " + + f"xr.DataArray, or xr.Dataset. Got {type(voltage)}" + ) + if not isinstance(current, (pd.Series, pd.DataFrame, xr.DataArray, xr.Dataset)): + raise TypeError( + "current must be of type pd.Series, pd.DataFrame, " + + f"xr.DataArray, or xr.Dataset. Got {type(current)}" + ) + if not isinstance(line_to_line, bool): + raise TypeError(f"line_to_line must be of type bool. Got: {type(line_to_line)}") + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. 
Got: {type(to_pandas)}") + + # Convert inputs to xr.Dataset + voltage = convert_to_dataset(voltage, "voltage") + current = convert_to_dataset(current, "current") - abs_current = np.abs(current.values) - abs_voltage = np.abs(voltage.values) + # Check that sizes are the same + if len(voltage.data_vars) != 3: + raise ValueError("voltage must have three columns") + if len(current.data_vars) != 3: + raise ValueError("current must have three columns") + if current.sizes != voltage.sizes: + raise ValueError("current and voltage must be of the same size") + + power = dc_power(voltage, current, to_pandas=False)["Gross"] + power.name = "Power" + power = ( + power.to_dataset() + ) # force xr.DataArray to be consistently in xr.Dataset format + power_ac = np.abs(power) * power_factor if line_to_line: - power = abs_current * (abs_voltage * np.sqrt(3)) - else: - power = abs_current * abs_voltage - - power = pd.DataFrame(power) - P = power.sum(axis=1) * power_factor - P = P.to_frame('Power') - - return P + power_ac = power_ac * np.sqrt(3) + + if to_pandas: + power_ac = power_ac.to_pandas() + + return power_ac diff --git a/mhkit/power/quality.py b/mhkit/power/quality.py index 27f89c20f..8f830348d 100644 --- a/mhkit/power/quality.py +++ b/mhkit/power/quality.py @@ -1,208 +1,378 @@ +""" +This module contains functions for calculating various aspects of power quality, +particularly focusing on the analysis of harmonics and interharmonics in electrical +power systems. These functions are designed to assist in power quality assessments +by providing tools to analyze voltage and current signals for their harmonic +and interharmonic components based on the guidelines and methodologies +outlined in IEC 61000-4-7. + +Functions in this module include: + +- harmonics: Calculates the harmonics from time series of voltage or current. 
+ This function returns the amplitude of the time-series data harmonics indexed by + the harmonic frequency, aiding in the identification of harmonic distortions + within the power system. + +- harmonic_subgroups: Computes the harmonic subgroups as per IEC 61000-4-7 standards. + Harmonic subgroups provide insights into the distribution of power across + different harmonic frequencies, which is crucial for understanding the behavior + of non-linear loads and their impact on the power quality. + +- total_harmonic_current_distortion (THCD): Determines the total harmonic current + distortion, offering a summary metric that quantifies the overall level of + harmonic distortion present in the current waveform. This metric is essential + for assessing compliance with power quality standards and guidelines. + +- interharmonics: Identifies and calculates the interharmonics present in the + power system. Interharmonics, which are frequencies that occur between the + fundamental and harmonic frequencies, can arise from various sources and + potentially lead to power quality issues. +""" + +from typing import Union import pandas as pd import numpy as np -import scipy.integrate as integrate -from scipy.optimize import fsolve -from scipy.signal import hilbert -from scipy import signal, fft, fftpack +from scipy import fftpack +import xarray as xr +from mhkit.utils import convert_to_dataset -#This group of functions are to be used for power quality assessments - -def harmonics(x,freq,grid_freq): +def harmonics( + signal_data: Union[pd.Series, pd.DataFrame, xr.DataArray, xr.Dataset], + freq: Union[float, int], + grid_freq: int, + to_pandas: bool = True, +) -> Union[pd.DataFrame, xr.Dataset]: """ - Calculates the harmonics from time series of voltage or current based on IEC 61000-4-7. + Calculates the harmonics from time series of voltage or current based on IEC 61000-4-7. 
Parameters ----------- - x: pandas Series or DataFrame + signal_data: pandas Series, pandas DataFrame, xarray DataArray, or xarray Dataset Time-series of voltage [V] or current [A] - + freq: float or Int Frequency of the time-series data [Hz] - + grid_freq: int Value indicating if the power supply is 50 or 60 Hz. Options = 50 or 60 - - + + to_pandas: bool (Optional) + Flag to save output to pandas instead of xarray. Default = True. + Returns -------- - harmonics: pandas DataFrame - Amplitude of the time-series data harmonics indexed by the harmonic + harmonic_amplitudes: pandas DataFrame or xarray Dataset + Amplitude of the time-series data harmonics indexed by the harmonic frequency with signal name columns """ - assert isinstance(x, (pd.Series, pd.DataFrame)), 'Provided voltage or current must be of type pd.DataFrame or pd.Series' - assert isinstance(freq, (float, int)), 'freq must be of type float or integer' - assert (grid_freq == 50 or grid_freq == 60), 'grid_freq must be either 50 or 60' + if not isinstance(signal_data, (pd.Series, pd.DataFrame, xr.DataArray, xr.Dataset)): + raise TypeError( + "signal_data must be of type pd.Series, pd.DataFrame, " + + f"xr.DataArray, or xr.Dataset. Got {type(signal_data)}" + ) + + if not isinstance(freq, (float, int)): + raise TypeError(f"freq must be of type float or integer. Got {type(freq)}") - # Check if x is a DataFrame - if isinstance(x, (pd.DataFrame)) == True: - cols = x.columns - - x = x.to_numpy() - sample_spacing = 1./freq - frequency_bin_centers = fftpack.fftfreq(len(x), d=sample_spacing) + if grid_freq not in [50, 60]: + raise ValueError(f"grid_freq must be either 50 or 60. Got {grid_freq}") - harmonics_amplitude = np.abs(np.fft.fft(x, axis=0)) + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. 
Got {type(to_pandas)}") - harmonics = pd.DataFrame(harmonics_amplitude, index=frequency_bin_centers) - harmonics = harmonics.sort_index() - - # Keep the signal name as the column name - if 'cols' in locals(): - harmonics.columns = cols + # Convert input to xr.Dataset + signal_data = convert_to_dataset(signal_data, "data") - if grid_freq == 60: - hz = np.arange(0,3060,5) - elif grid_freq == 50: - hz = np.arange(0,2570,5) + sample_spacing = 1.0 / freq + # Loop through all variables in signal_data + harmonic_amplitudes = xr.Dataset() + for var in signal_data.data_vars: + dataarray = signal_data[var] + dataarray = dataarray.to_numpy() - harmonics = harmonics.reindex(hz, method='nearest') - harmonics = harmonics/len(x)*2 + frequency_bin_centers = fftpack.fftfreq(len(dataarray), d=sample_spacing) + harmonics_amplitude = np.abs(np.fft.fft(dataarray, axis=0)) + + harmonic_amplitudes = harmonic_amplitudes.assign( + {var: (["frequency"], harmonics_amplitude)} + ) + harmonic_amplitudes = harmonic_amplitudes.assign_coords( + {"frequency": frequency_bin_centers} + ) + harmonic_amplitudes = harmonic_amplitudes.sortby("frequency") + + if grid_freq == 60: + hertz = np.arange(0, 3060, 5) + elif grid_freq == 50: + hertz = np.arange(0, 2570, 5) - - return harmonics + harmonic_amplitudes = harmonic_amplitudes.reindex( + {"frequency": hertz}, method="nearest" + ) + harmonic_amplitudes = ( + harmonic_amplitudes / len(signal_data[list(signal_data.dims)[0]]) * 2 + ) + if to_pandas: + harmonic_amplitudes = harmonic_amplitudes.to_pandas() -def harmonic_subgroups(harmonics, grid_freq): + return harmonic_amplitudes + + +def harmonic_subgroups( + harmonic_amplitudes: Union[pd.Series, pd.DataFrame, xr.DataArray, xr.Dataset], + grid_freq: int, + frequency_dimension: str = "", + to_pandas: bool = True, +) -> Union[pd.DataFrame, xr.Dataset]: """ Calculates the harmonic subgroups based on IEC 61000-4-7 Parameters ---------- - harmonics: pandas Series or DataFrame - Harmonic amplitude indexed by the 
harmonic frequency + harmonic_amplitudes: pandas Series, pandas DataFrame, xarray DataArray, or xarray Dataset + Harmonic amplitude indexed by the harmonic frequency + grid_freq: int Value indicating if the power supply is 50 or 60 Hz. Options = 50 or 60 + frequency_dimension: string (optional) + Name of the xarray dimension corresponding to frequency. If not supplied, + defaults to the first dimension. Does not affect pandas input. + + to_pandas: bool (Optional) + Flag to save output to pandas instead of xarray. Default = True. + Returns -------- - harmonic_subgroups: pandas DataFrame - Harmonic subgroups indexed by harmonic frequency + subgroup_results: pandas DataFrame or xarray Dataset + Harmonic subgroups indexed by harmonic frequency with signal name columns - """ - assert isinstance(harmonics, (pd.Series, pd.DataFrame)), 'harmonics must be of type pd.DataFrame or pd.Series' - assert (grid_freq == 50 or grid_freq == 60), 'grid_freq must be either 50 or 60' - - # Check if harmonics is a DataFrame - if isinstance(harmonics, (pd.DataFrame)) == True: - cols = harmonics.columns - - + """ + if not isinstance( + harmonic_amplitudes, (pd.Series, pd.DataFrame, xr.DataArray, xr.Dataset) + ): + raise TypeError( + "harmonic_amplitudes must be of type pd.Series, pd.DataFrame, " + + f"xr.DataArray, or xr.Dataset. Got {type(harmonic_amplitudes)}" + ) + + if grid_freq not in [50, 60]: + raise ValueError(f"grid_freq must be either 50 or 60. Got {grid_freq}") + + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. Got: {type(to_pandas)}") + + if not isinstance(frequency_dimension, str): + raise TypeError( + f"frequency_dimension must be of type str. 
Got: {type(frequency_dimension)}" + ) + + # Convert input to xr.Dataset + harmonic_amplitudes = convert_to_dataset(harmonic_amplitudes, "harmonic_amplitudes") + + if ( + frequency_dimension != "" + and frequency_dimension not in harmonic_amplitudes.coords + ): + raise ValueError( + "frequency_dimension was supplied but is not a dimension " + + f"of harmonic_amplitudes. Got {frequency_dimension}" + ) + if grid_freq == 60: - - hz = np.arange(0,3060,60) - elif grid_freq == 50: - - hz = np.arange(0,2550,50) - - j=0 - i=0 - cols=harmonics.columns - harmonic_subgroups=np.ones((np.size(hz),np.size(cols))) - for n in hz: - - harmonics=harmonics.sort_index(axis=0) - ind=pd.Index(harmonics.index) - - indn = ind.get_loc(n, method='nearest') - for col in cols: - harmonic_subgroups[i,j] = np.sqrt(np.sum([harmonics[col].iloc[indn-1]**2,harmonics[col].iloc[indn]**2,harmonics[col].iloc[indn+1]**2])) - j=j+1 - j=0 - i=i+1 - - harmonic_subgroups = pd.DataFrame(harmonic_subgroups,index=hz) - - # Keep the signal name as the column name - if 'cols' in locals(): - harmonic_subgroups.columns = cols - - return harmonic_subgroups - -def total_harmonic_current_distortion(harmonics_subgroup,rated_current): + hertz = np.arange(0, 3060, 60) + else: + hertz = np.arange(0, 2550, 50) + + # Sort input data index + if frequency_dimension == "": + frequency_dimension = list(harmonic_amplitudes.dims)[0] + harmonic_amplitudes = harmonic_amplitudes.sortby(frequency_dimension) + + # Loop through all variables in harmonics + subgroup_results = xr.Dataset() + for var in harmonic_amplitudes.data_vars: + dataarray = harmonic_amplitudes[var] + subgroup = np.zeros(np.size(hertz)) + for ihz in np.arange(0, len(hertz)): + current_frequency = hertz[ihz] + ind = dataarray.indexes[frequency_dimension].get_loc(current_frequency) + + data_subset = dataarray.isel({frequency_dimension: [ind - 1, ind, ind + 1]}) + subgroup[ihz] = (data_subset**2).sum() ** 0.5 + + subgroup_results = subgroup_results.assign({var: 
(["frequency"], subgroup)}) + subgroup_results = subgroup_results.assign_coords({"frequency": hertz}) + + if to_pandas: + subgroup_results = subgroup_results.to_pandas() + + return subgroup_results + + +def total_harmonic_current_distortion( + harmonics_subgroup: Union[pd.Series, pd.DataFrame, xr.DataArray, xr.Dataset], + frequency_dimension: str = "", + to_pandas: bool = True, +) -> Union[pd.DataFrame, xr.Dataset]: """ Calculates the total harmonic current distortion (THC) based on IEC/TS 62600-30 Parameters ---------- - harmonics_subgroup: pandas DataFrame or Series + harmonics_subgroup: pandas Series, pandas DataFrame, xarray DataArray, or xarray Dataset Subgrouped current harmonics indexed by harmonic frequency - - rated_current: float - Rated current of the energy device in Amps - + + frequency_dimension: string (optional) + Name of the xarray dimension corresponding to frequency. If not supplied, + defaults to the first dimension. Does not affect pandas input. + + to_pandas: bool (optional) + Flag to save output to pandas instead of xarray. Default = True. + Returns -------- - THCD: pd.DataFrame - Total harmonic current distortion indexed by signal name with THCD column + thcd_result: pd.DataFrame or xarray Dataset + Total harmonic current distortion indexed by signal name with THCD column """ - assert isinstance(harmonics_subgroup, (pd.Series, pd.DataFrame)), 'harmonic_subgroups must be of type pd.DataFrame or pd.Series' - assert isinstance(rated_current, float), 'rated_current must be a float' - - harmonics_sq = harmonics_subgroup.iloc[2:50]**2 + if not isinstance( + harmonics_subgroup, (pd.Series, pd.DataFrame, xr.DataArray, xr.Dataset) + ): + raise TypeError( + "harmonics_subgroup must be of type pd.Series, pd.DataFrame, " + + f"xr.DataArray, or xr.Dataset. Got {type(harmonics_subgroup)}" + ) + + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. 
Got: {type(to_pandas)}") + + if not isinstance(frequency_dimension, str): + raise TypeError( + f"frequency_dimension must be of type bool. Got: {type(frequency_dimension)}" + ) + + # Convert input to xr.Dataset + harmonics_subgroup = convert_to_dataset(harmonics_subgroup, "harmonics_subgroup") + + if ( + frequency_dimension != "" + and frequency_dimension not in harmonics_subgroup.coords + ): + raise ValueError( + "frequency_dimension was supplied but is not a dimension " + + f"of harmonics. Got {frequency_dimension}" + ) + + if frequency_dimension == "": + frequency_dimension = list(harmonics_subgroup.dims)[0] + harmonics_sq = harmonics_subgroup.isel({frequency_dimension: slice(2, 50)}) ** 2 + harmonics_sum = harmonics_sq.sum() + + thcd_result = ( + np.sqrt(harmonics_sum) / harmonics_subgroup.isel({frequency_dimension: 1}) + ) * 100 - harmonics_sum=harmonics_sq.sum() + if isinstance(thcd_result, xr.DataArray): + thcd_result.name = ["THCD"] - THCD = (np.sqrt(harmonics_sum)/harmonics_subgroup.iloc[1])*100 - THCD = pd.DataFrame(THCD) # converting to dataframe for Matlab - THCD.columns = ['THCD'] - THCD = THCD.T + if to_pandas: + thcd_result = thcd_result.to_pandas() - return THCD + return thcd_result -def interharmonics(harmonics,grid_freq): + +def interharmonics( + harmonic_amplitudes: Union[pd.Series, pd.DataFrame, xr.DataArray, xr.Dataset], + grid_freq: int, + frequency_dimension: str = "", + to_pandas: bool = True, +) -> Union[pd.DataFrame, xr.Dataset]: """ - Calculates the interharmonics from the harmonics of current + Calculates the interharmonics from the harmonic_amplitudes of current Parameters ----------- - harmonics: pandas Series or DataFrame - Harmonic amplitude indexed by the harmonic frequency + harmonic_amplitudes: pandas Series, pandas DataFrame, xarray DataArray, or xarray Dataset + Harmonic amplitude indexed by the harmonic frequency grid_freq: int Value indicating if the power supply is 50 or 60 Hz. 
Options = 50 or 60 + frequency_dimension: string (optional) + Name of the xarray dimension corresponding to frequency. If not supplied, + defaults to the first dimension. Does not affect pandas input. + + to_pandas: bool (Optional) + Flag to save output to pandas instead of xarray. Default = True. + Returns ------- - interharmonics: pandas DataFrame + interharmonic_groups: pandas DataFrame or xarray Dataset Interharmonics groups """ - assert isinstance(harmonics, (pd.Series, pd.DataFrame)), 'harmonics must be of type pd.DataFrame or pd.Series' - assert (grid_freq == 50 or grid_freq == 60), 'grid_freq must be either 50 or 60' - + if not isinstance( + harmonic_amplitudes, (pd.Series, pd.DataFrame, xr.DataArray, xr.Dataset) + ): + raise TypeError( + "harmonic_amplitudes must be of type pd.Series, pd.DataFrame, " + + f"xr.DataArray, or xr.Dataset. Got {type(harmonic_amplitudes)}" + ) + + if grid_freq not in [50, 60]: + raise ValueError(f"grid_freq must be either 50 or 60. Got {grid_freq}") + + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. Got: {type(to_pandas)}") + + # Convert input to xr.Dataset + harmonic_amplitudes = convert_to_dataset(harmonic_amplitudes, "harmonic_amplitudes") + + if ( + frequency_dimension != "" + and frequency_dimension not in harmonic_amplitudes.coords + ): + raise ValueError( + "frequency_dimension was supplied but is not a dimension " + + f"of harmonic_amplitudes. 
Got {frequency_dimension}" + ) if grid_freq == 60: - - hz = np.arange(0,3060,60) - elif grid_freq == 50: - - hz = np.arange(0,2550,50) - - j=0 - i=0 - cols=harmonics.columns - interharmonics=np.ones((np.size(hz),np.size(cols))) - for n in hz: - harmonics=harmonics.sort_index(axis=0) - ind=pd.Index(harmonics.index) - - indn = ind.get_loc(n, method='nearest') - for col in cols: + hertz = np.arange(0, 3060, 60) + elif grid_freq == 50: + hertz = np.arange(0, 2550, 50) + + # Sort input data index + if frequency_dimension == "": + frequency_dimension = list(harmonic_amplitudes.dims)[0] + harmonic_amplitudes = harmonic_amplitudes.sortby(frequency_dimension) + + # Loop through all variables in harmonic_amplitudes + interharmonic_groups = xr.Dataset() + for var in harmonic_amplitudes.data_vars: + dataarray = harmonic_amplitudes[var] + subset = np.zeros(np.size(hertz)) + + for ihz in np.arange(0, len(hertz)): + current_frequency = hertz[ihz] + ind = dataarray.indexes[frequency_dimension].get_loc(current_frequency) + if grid_freq == 60: - subset = harmonics[col].iloc[indn+1:indn+11]**2 - subset = subset.squeeze() - else: - subset = harmonics[col].iloc[indn+1:indn+7]**2 - subset = subset.squeeze() - - interharmonics[i,j] = np.sqrt(np.sum(subset)) - j=j+1 - j=0 - i=i+1 - - - interharmonics = pd.DataFrame(interharmonics,index=hz) - - return interharmonics + data = dataarray.isel({frequency_dimension: slice(ind + 1, ind + 11)}) + subset[ihz] = (data**2).sum() ** 0.5 + else: + data = dataarray.isel({frequency_dimension: slice(ind + 1, ind + 7)}) + subset[ihz] = (data**2).sum() ** 0.5 + + interharmonic_groups = interharmonic_groups.assign( + {var: (["frequency"], subset)} + ) + interharmonic_groups = interharmonic_groups.assign_coords({"frequency": hertz}) + + if to_pandas: + interharmonic_groups = interharmonic_groups.to_pandas() + + return interharmonic_groups diff --git a/mhkit/qc/__init__.py b/mhkit/qc/__init__.py index 841442eca..c325f37f2 100644 --- a/mhkit/qc/__init__.py +++ 
b/mhkit/qc/__init__.py @@ -1,2 +1,8 @@ -from pecos.monitoring import check_timestamp, check_missing, check_corrupt, \ - check_range, check_delta, check_outlier +from pecos.monitoring import ( + check_timestamp, + check_missing, + check_corrupt, + check_range, + check_delta, + check_outlier, +) diff --git a/mhkit/river/__init__.py b/mhkit/river/__init__.py index 452810833..8406b8cf1 100644 --- a/mhkit/river/__init__.py +++ b/mhkit/river/__init__.py @@ -1,5 +1,4 @@ -from mhkit.river import performance +from mhkit.river import performance from mhkit.river import graphics -from mhkit.river import resource -from mhkit.river import io - +from mhkit.river import resource +from mhkit.river import io diff --git a/mhkit/river/graphics.py b/mhkit/river/graphics.py index 46b621f88..396ce1271 100644 --- a/mhkit/river/graphics.py +++ b/mhkit/river/graphics.py @@ -1,10 +1,10 @@ import numpy as np -import pandas as pd -import matplotlib.pyplot as plt +import xarray as xr +import matplotlib.pyplot as plt +from mhkit.utils import convert_to_dataarray -def _xy_plot(x, y, fmt='.', label=None, xlabel=None, ylabel=None, title=None, - ax=None): +def _xy_plot(x, y, fmt=".", label=None, xlabel=None, ylabel=None, title=None, ax=None): """ Base function to plot any x vs y data @@ -14,241 +14,304 @@ def _xy_plot(x, y, fmt='.', label=None, xlabel=None, ylabel=None, title=None, Data for the x axis of plot y: array-like Data for y axis of plot - + Returns ------- ax : matplotlib.pyplot axes - + """ if ax is None: - plt.figure(figsize=(16,8)) - params = {'legend.fontsize': 'x-large', - 'axes.labelsize': 'x-large', - 'axes.titlesize':'x-large', - 'xtick.labelsize':'x-large', - 'ytick.labelsize':'x-large'} + plt.figure(figsize=(16, 8)) + params = { + "legend.fontsize": "x-large", + "axes.labelsize": "x-large", + "axes.titlesize": "x-large", + "xtick.labelsize": "x-large", + "ytick.labelsize": "x-large", + } plt.rcParams.update(params) ax = plt.gca() - + ax.plot(x, y, fmt, label=label, markersize=7) 
- + ax.grid() - - if label: ax.legend() - if xlabel: ax.set_xlabel(xlabel) - if ylabel: ax.set_ylabel(ylabel) - if title: ax.set_title(title) - + + if label: + ax.legend() + if xlabel: + ax.set_xlabel(xlabel) + if ylabel: + ax.set_ylabel(ylabel) + if title: + ax.set_title(title) + plt.tight_layout() - + return ax def plot_flow_duration_curve(D, F, label=None, ax=None): """ - Plots discharge vs exceedance probability as a Flow Duration Curve (FDC) - + Plots discharge vs exceedance probability as a Flow Duration Curve (FDC) + Parameters ------------ D: array-like Discharge [m/s] indexed by time - - F: array-like + + F: array-like Exceedance probability [unitless] indexed by time - + label: string Label to use in the legend - + ax : matplotlib axes object - Axes for plotting. If None, then a new figure with a single + Axes for plotting. If None, then a new figure with a single axes is used. - + Returns --------- ax : matplotlib pyplot axes - + """ # Sort by F - temp = pd.DataFrame({'D': D, 'F': F}) - temp.sort_values('F', ascending=False, kind='mergesort', inplace=True) - - ax = _xy_plot(temp['D'], temp['F'], fmt='-', label=label, xlabel='Discharge [$m^3/s$]', - ylabel='Exceedance Probability', ax=ax) - plt.xscale('log') + temp = xr.Dataset(data_vars={"D": D, "F": F}) + temp.sortby("F", ascending=False) + + ax = _xy_plot( + temp["D"], + temp["F"], + fmt="-", + label=label, + xlabel="Discharge [$m^3/s$]", + ylabel="Exceedance Probability", + ax=ax, + ) + plt.xscale("log") return ax def plot_velocity_duration_curve(V, F, label=None, ax=None): """ - Plots velocity vs exceedance probability as a Velocity Duration Curve (VDC) - + Plots velocity vs exceedance probability as a Velocity Duration Curve (VDC) + Parameters ------------ - V: array-like + V: array-like Velocity [m/s] indexed by time - - F: array-like + + F: array-like Exceedance probability [unitless] indexed by time - + label: string Label to use in the legend - + ax : matplotlib axes object - Axes for plotting. 
If None, then a new figure with a single + Axes for plotting. If None, then a new figure with a single axes is used. - + Returns --------- ax : matplotlib pyplot axes - + """ # Sort by F - temp = pd.DataFrame({'V': V, 'F': F}) - temp.sort_values('F', ascending=False, kind='mergesort', inplace=True) - - ax = _xy_plot(temp['V'], temp['F'], fmt='-', label=label, xlabel='Velocity [$m/s$]', - ylabel='Exceedance Probability', ax=ax) + temp = xr.Dataset(data_vars={"V": V, "F": F}) + temp.sortby("F", ascending=False) + + ax = _xy_plot( + temp["V"], + temp["F"], + fmt="-", + label=label, + xlabel="Velocity [$m/s$]", + ylabel="Exceedance Probability", + ax=ax, + ) return ax def plot_power_duration_curve(P, F, label=None, ax=None): """ - Plots power vs exceedance probability as a Power Duration Curve (PDC) + Plots power vs exceedance probability as a Power Duration Curve (PDC) Parameters ------------ - P: array-like + P: array-like Power [W] indexed by time - - F: array-like + + F: array-like Exceedance probability [unitless] indexed by time - + label: string Label to use in the legend - + ax : matplotlib axes object - Axes for plotting. If None, then a new figure with a single + Axes for plotting. If None, then a new figure with a single axes is used. 
- + Returns --------- ax : matplotlib pyplot axes - + """ # Sort by F - temp = pd.DataFrame({'P': P, 'F': F}) - temp.sort_values('F', ascending=False, kind='mergesort', inplace=True) - - ax = _xy_plot(temp['P'], temp['F'], fmt='-', label=label, xlabel='Power [W]', - ylabel='Exceedance Probability', ax=ax) + temp = xr.Dataset(data_vars={"P": P, "F": F}) + temp.sortby("F", ascending=False) + + ax = _xy_plot( + temp["P"], + temp["F"], + fmt="-", + label=label, + xlabel="Power [W]", + ylabel="Exceedance Probability", + ax=ax, + ) return ax - -def plot_discharge_timeseries(Q, label=None, ax=None): + +def plot_discharge_timeseries(Q, time_dimension="", label=None, ax=None): """ Plots discharge time-series - + Parameters ------------ Q: array-like Discharge [m3/s] indexed by time - + + time_dimension: string (optional) + Name of the xarray dimension corresponding to time. If not supplied, + defaults to the first dimension. + label: string Label to use in the legend - + ax : matplotlib axes object - Axes for plotting. If None, then a new figure with a single + Axes for plotting. If None, then a new figure with a single axes is used. 
- + Returns --------- - ax : matplotlib pyplot axes - + ax : matplotlib pyplot axes + """ + Q = convert_to_dataarray(Q) + + if time_dimension == "": + time_dimension = list(Q.coords)[0] + ax = _xy_plot( - Q.index, - Q, - fmt='-', - label=label, - xlabel='Time', - ylabel='Discharge [$m^3/s$]', - ax=ax + Q.coords[time_dimension].values, + Q, + fmt="-", + label=label, + xlabel="Time", + ylabel="Discharge [$m^3/s$]", + ax=ax, ) - + return ax def plot_discharge_vs_velocity(D, V, polynomial_coeff=None, label=None, ax=None): """ Plots discharge vs velocity data along with the polynomial fit - + Parameters ------------ - D : pandas Series + D : array-like Discharge [m/s] indexed by time - - V : pandas Series + + V : array-like Velocity [m/s] indexed by time - + polynomial_coeff: numpy polynomial - Polynomial coefficients, which can be computed using - `river.resource.polynomial_fit`. If None, then the polynomial fit is - not included int the plot. - + Polynomial coefficients, which can be computed using + `river.resource.polynomial_fit`. If None, then the polynomial fit is + not included in the plot. + ax : matplotlib axes object - Axes for plotting. If None, then a new figure with a single + Axes for plotting. If None, then a new figure with a single axes is used. 
- + Returns --------- ax : matplotlib pyplot axes - + """ - ax = _xy_plot(D, V, fmt='.', label=label, xlabel='Discharge [$m^3/s$]', - ylabel='Velocity [$m/s$]', ax=ax) + ax = _xy_plot( + D, + V, + fmt=".", + label=label, + xlabel="Discharge [$m^3/s$]", + ylabel="Velocity [$m/s$]", + ax=ax, + ) if polynomial_coeff: x = np.linspace(D.min(), D.max()) - ax = _xy_plot(x, polynomial_coeff(x), fmt='--', label='Polynomial fit', - xlabel='Discharge [$m^3/s$]', ylabel='Velocity [$m/s$]', - ax=ax) + ax = _xy_plot( + x, + polynomial_coeff(x), + fmt="--", + label="Polynomial fit", + xlabel="Discharge [$m^3/s$]", + ylabel="Velocity [$m/s$]", + ax=ax, + ) return ax def plot_velocity_vs_power(V, P, polynomial_coeff=None, label=None, ax=None): """ - Plots velocity vs power data along with the polynomial fit - + Plots velocity vs power data along with the polynomial fit + Parameters ------------ - V : pandas Series + V : array-like Velocity [m/s] indexed by time - - P: pandas Series + + P: array-like Power [W] indexed by time - + polynomial_coeff: numpy polynomial - Polynomial coefficients, which can be computed using - `river.resource.polynomial_fit`. If None, then the polynomial fit is - not included int the plot. - + Polynomial coefficients, which can be computed using + `river.resource.polynomial_fit`. If None, then the polynomial fit is + not included in the plot. + ax : matplotlib axes object - Axes for plotting. If None, then a new figure with a single + Axes for plotting. If None, then a new figure with a single axes is used. 
- + Returns --------- ax : matplotlib pyplot axes - + """ - ax = _xy_plot(V, P, fmt='.', label=label, xlabel='Velocity [$m/s$]', - ylabel='Power [$W$]', ax=ax) + ax = _xy_plot( + V, + P, + fmt=".", + label=label, + xlabel="Velocity [$m/s$]", + ylabel="Power [$W$]", + ax=ax, + ) if polynomial_coeff: x = np.linspace(V.min(), V.max()) - ax = _xy_plot(x, polynomial_coeff(x), fmt='--', label='Polynomial fit', - xlabel='Velocity [$m/s$]', ylabel='Power [$W$]', ax=ax) - + ax = _xy_plot( + x, + polynomial_coeff(x), + fmt="--", + label="Polynomial fit", + xlabel="Velocity [$m/s$]", + ylabel="Power [$W$]", + ax=ax, + ) + return ax diff --git a/mhkit/river/io/__init__.py b/mhkit/river/io/__init__.py index bf2aea4d1..852964f7b 100644 --- a/mhkit/river/io/__init__.py +++ b/mhkit/river/io/__init__.py @@ -1,2 +1,2 @@ from mhkit.river.io import usgs -from mhkit.river.io import d3d +from mhkit.river.io import d3d diff --git a/mhkit/river/io/d3d.py b/mhkit/river/io/d3d.py index d4db2e266..19a61df62 100644 --- a/mhkit/river/io/d3d.py +++ b/mhkit/river/io/d3d.py @@ -2,20 +2,21 @@ import scipy.interpolate as interp import numpy as np import pandas as pd +import xarray as xr import netCDF4 import warnings def get_all_time(data): - ''' - Returns all of the time stamps from a D3D simulation passed to the function + """ + Returns all of the time stamps from a D3D simulation passed to the function as a NetCDF object (data) - + Parameters ---------- - data: NetCDF4 object + data: NetCDF4 object A NetCDF4 object that contains spatial data, e.g. velocity or shear - stress generated by running a Delft3D model. + stress generated by running a Delft3D model. Returns ------- @@ -23,25 +24,26 @@ def get_all_time(data): Returns an array of integers representing the number of seconds after the simulation started and that the data object contains a snapshot of simulation conditions at that time. 
- ''' - - assert type(data)== netCDF4._netCDF4.Dataset, 'data must be NetCDF4 object' + """ + + if not isinstance(data, netCDF4._netCDF4.Dataset): + raise TypeError("data must be a NetCDF4 object") - seconds_run = np.ma.getdata(data.variables['time'][:], False) + seconds_run = np.ma.getdata(data.variables["time"][:], False) return seconds_run def index_to_seconds(data, time_index): - ''' - The function will return 'seconds_run' if passed a 'time_index' + """ + The function will return 'seconds_run' if passed a 'time_index' Parameters ---------- - data: NetCDF4 object + data: NetCDF4 object A NetCDF4 object that contains spatial data, e.g. velocity or shear - stress, generated by running a Delft3D model. - time_index: int + stress, generated by running a Delft3D model. + time_index: int A positive integer to pull the time index from the dataset. 0 being closest to time 0. Default is last time index -1. @@ -49,87 +51,98 @@ def index_to_seconds(data, time_index): ------- seconds_run: int, float The 'seconds_run' is the seconds corresponding to the 'time_index' increments. - ''' + """ return _convert_time(data, time_index=time_index) def seconds_to_index(data, seconds_run): - ''' + """ The function will return the nearest 'time_index' in the data if passed an integer number of 'seconds_run' - + Parameters ---------- - data: NetCDF4 object + data: NetCDF4 object A NetCDF4 object that contains spatial data, e.g. velocity or shear - stress, generated by running a Delft3D model. + stress, generated by running a Delft3D model. seconds_run: int, float - A positive integer or float that represents the amount of time in seconds + A positive integer or float that represents the amount of time in seconds passed since starting the simulation. Returns ------- time_index: int - The 'time_index' is a positive integer starting from 0 + The 'time_index' is a positive integer starting from 0 and incrementing until in simulation is complete. 
- ''' + """ return _convert_time(data, seconds_run=seconds_run) def _convert_time(data, time_index=None, seconds_run=None): - ''' - Converts a time index to seconds or seconds to a time index. The user - must specify 'time_index' or 'seconds_run' (Not both). The function - will returns 'seconds_run' if passed a 'time_index' or will return the + """ + Converts a time index to seconds or seconds to a time index. The user + must specify 'time_index' or 'seconds_run' (Not both). The function + will returns 'seconds_run' if passed a 'time_index' or will return the closest 'time_index' if passed a number of 'seconds_run'. Parameters ---------- - data: NetCDF4 object + data: NetCDF4 object A NetCDF4 object that contains spatial data, e.g. velocity or shear - stress, generated by running a Delft3D model. - time_index: int + stress, generated by running a Delft3D model. + time_index: int An integer to pull the time index from the dataset. 0 being closest - to the start time. + to the start time. seconds_run: int, float - An integer or float that represents the amount of time in seconds + An integer or float that represents the amount of time in seconds passed since starting the simulation. Returns ------- QoI: int, float - The quantity of interest is the unknown value either the 'time_index' - or the 'seconds_run'. The 'time_index' is an integer starting from 0 + The quantity of interest is the unknown value either the 'time_index' + or the 'seconds_run'. The 'time_index' is an integer starting from 0 and incrementing until in simulation is complete. The 'seconds_run' is the seconds corresponding to the 'time_index' increments. 
- ''' - - assert type(data)== netCDF4._netCDF4.Dataset, 'data must be NetCDF4 object' - assert time_index or seconds_run, 'input of time_index or seconds_run needed' - assert not(time_index and seconds_run), f'only one time_index or seconds_run' - assert isinstance(time_index, (int, float)) or isinstance(seconds_run, (int, - float)),'time_index or seconds_run input must be a int or float' - + """ + + if not isinstance(data, netCDF4._netCDF4.Dataset): + raise TypeError("data must be NetCDF4 object") + + if not (time_index or seconds_run): + raise ValueError("Input of time_index or seconds_run needed") + + if time_index and seconds_run: + raise ValueError("Only one of time_index or seconds_run should be provided") + + if not ( + isinstance(time_index, (int, float)) or isinstance(seconds_run, (int, float)) + ): + raise TypeError("time_index or seconds_run input must be an int or float") + times = get_all_time(data) - + if time_index: - QoI= times[time_index] + QoI = times[time_index] if seconds_run: - try: - idx=np.where(times == seconds_run) - QoI=idx[0][0] - except: + try: + idx = np.where(times == seconds_run) + QoI = idx[0][0] + except: idx = (np.abs(times - seconds_run)).argmin() - QoI= idx - warnings.warn( f'Warning: seconds_run not found. Closest time stamp' - +'found {times[idx]}', stacklevel= 2) + QoI = idx + warnings.warn( + "Warning: seconds_run not found. Closest time stamp" + + f"found {times[idx]}", + stacklevel=2, + ) return QoI -def get_layer_data(data, variable, layer_index=-1, time_index=-1): - ''' - Get variable data from the NetCDF4 object at a specified layer and timestep. +def get_layer_data(data, variable, layer_index=-1, time_index=-1, to_pandas=True): + """ + Get variable data from the NetCDF4 object at a specified layer and timestep. If the data is 2D the layer_index is ignored. Parameters @@ -139,490 +152,658 @@ def get_layer_data(data, variable, layer_index=-1, time_index=-1): stress, generated by running a Delft3D model. 
variable: string Delft3D outputs many vairables. The full list can be - found using "data.variables.keys()" in the console. + found using "data.variables.keys()" in the console. layer_index: int - An integer to pull out a layer from the dataset. 0 being closest + An integer to pull out a layer from the dataset. 0 being closest to the surface. Default is the bottom layer, found with input -1. - time_index: int + time_index: int An integer to pull the time index from the dataset. 0 being closest to the start time. Default is last time index, found with input -1. + to_pandas : bool (optional) + Flag to output pandas instead of xarray. Default = True. + Returns ------- - layer_data: DataFrame - DataFrame with columns of "x", "y", "waterdepth", and "waterlevel" location - of the specified layer, variable values "v", and the "time" the + layer_data: pd.DataFrame or xr.Dataset + Dataset with columns of "x", "y", "waterdepth", and "waterlevel" location + of the specified layer, variable values "v", and the "time" the simulation has run. The waterdepth is measured from the water surface and the - "waterlevel" is the water level diffrencein meters from the zero water level. - ''' - - assert isinstance(time_index, int), 'time_index must be an int' - assert isinstance(layer_index, int), 'layer_index must be an int' - assert type(data)== netCDF4._netCDF4.Dataset, 'data must be NetCDF4 object' - assert variable in data.variables.keys(), 'variable not recognized' + "waterlevel" is the water level diffrencein meters from the zero water level. 
+ """ + + if not isinstance(time_index, int): + raise TypeError("time_index must be an int") + + if not isinstance(layer_index, int): + raise TypeError("layer_index must be an int") + + if not isinstance(data, netCDF4._netCDF4.Dataset): + raise TypeError("data must be NetCDF4 object") + + if variable not in data.variables.keys(): + raise ValueError("variable not recognized") + + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. Got: {type(to_pandas)}") + coords = str(data.variables[variable].coordinates).split() - var=data.variables[variable][:] - max_time_index= data['time'].shape[0]-1 # to account for zero index - assert abs(time_index) <= max_time_index, (f'time_index must be less than' - +'the absolute value of the max time index {max_time_index}') - - x=np.ma.getdata(data.variables[coords[0]][:], False) - y=np.ma.getdata(data.variables[coords[1]][:], False) - - - if type(var[0][0]) == np.ma.core.MaskedArray: - max_layer= len(var[0][0]) - - assert abs(layer_index) <= max_layer,( f'layer_index must be less than' - +'the max layer {max_layer}') - v= np.ma.getdata(var[time_index,:,layer_index], False) - dimensions= 3 - - else: - assert type(var[0][0])== np.float64, 'data not recognized' - dimensions= 2 - v= np.ma.getdata(var[time_index,:], False) - - #waterdepth + var = data.variables[variable][:] + max_time_index = data["time"].shape[0] - 1 # to account for zero index + + if abs(time_index) > max_time_index: + raise ValueError( + f"time_index must be less than the absolute value of the max time index {max_time_index}" + ) + + x = np.ma.getdata(data.variables[coords[0]][:], False) + y = np.ma.getdata(data.variables[coords[1]][:], False) + + if type(var[0][0]) == np.ma.core.MaskedArray: + max_layer = len(var[0][0]) + + if abs(layer_index) > max_layer: + raise ValueError(f"layer_index must be less than the max layer {max_layer}") + + v = np.ma.getdata(var[time_index, :, layer_index], False) + dimensions = 3 + + else: + if 
type(var[0][0]) != np.float64: + raise TypeError("data not recognized") + + dimensions = 2 + v = np.ma.getdata(var[time_index, :], False) + + # waterdepth if "mesh2d" in variable: - cords_to_layers= {'mesh2d_face_x mesh2d_face_y': {'name':'mesh2d_nLayers', - 'coords':data.variables['mesh2d_layer_sigma'][:]}, - 'mesh2d_edge_x mesh2d_edge_y': {'name':'mesh2d_nInterfaces', - 'coords':data.variables['mesh2d_interface_sigma'][:]}} - bottom_depth=np.ma.getdata(data.variables['mesh2d_waterdepth'][time_index, :], False) - waterlevel= np.ma.getdata(data.variables['mesh2d_s1'][time_index, :], False) - coords = str(data.variables['waterdepth'].coordinates).split() - + cords_to_layers = { + "mesh2d_face_x mesh2d_face_y": { + "name": "mesh2d_nLayers", + "coords": data.variables["mesh2d_layer_sigma"][:], + }, + "mesh2d_edge_x mesh2d_edge_y": { + "name": "mesh2d_nInterfaces", + "coords": data.variables["mesh2d_interface_sigma"][:], + }, + } + bottom_depth = np.ma.getdata( + data.variables["mesh2d_waterdepth"][time_index, :], False + ) + waterlevel = np.ma.getdata(data.variables["mesh2d_s1"][time_index, :], False) + coords = str(data.variables["waterdepth"].coordinates).split() + + elif str(data.variables[variable].coordinates) == "FlowElem_xcc FlowElem_ycc": + cords_to_layers = { + "FlowElem_xcc FlowElem_ycc": { + "name": "laydim", + "coords": data.variables["LayCoord_cc"][:], + }, + "FlowLink_xu FlowLink_yu": { + "name": "wdim", + "coords": data.variables["LayCoord_w"][:], + }, + } + bottom_depth = np.ma.getdata(data.variables["waterdepth"][time_index, :], False) + waterlevel = np.ma.getdata(data.variables["s1"][time_index, :], False) + coords = str(data.variables["waterdepth"].coordinates).split() else: - cords_to_layers= {'FlowElem_xcc FlowElem_ycc':{'name':'laydim', - 'coords':data.variables['LayCoord_cc'][:]}, - 'FlowLink_xu FlowLink_yu': {'name':'wdim', - 'coords':data.variables['LayCoord_w'][:]}} - bottom_depth=np.ma.getdata(data.variables['waterdepth'][time_index, :], 
False) - waterlevel= np.ma.getdata(data.variables['s1'][time_index, :], False) - coords = str(data.variables['waterdepth'].coordinates).split() - - layer_dim = str(data.variables[variable].coordinates) - - cord_sys= cords_to_layers[layer_dim]['coords'] - layer_percentages= np.ma.getdata(cord_sys, False) #accumulative - - if layer_dim == 'FlowLink_xu FlowLink_yu': - #interpolate - x_laydim=np.ma.getdata(data.variables[coords[0]][:], False) - y_laydim=np.ma.getdata(data.variables[coords[1]][:], False) - points_laydim = np.array([ [x, y] for x, y in zip(x_laydim, y_laydim)]) - + cords_to_layers = { + "FlowElem_xcc FlowElem_ycc LayCoord_cc LayCoord_cc": { + "name": "laydim", + "coords": data.variables["LayCoord_cc"][:], + }, + "FlowLink_xu FlowLink_yu": { + "name": "wdim", + "coords": data.variables["LayCoord_w"][:], + }, + } + bottom_depth = np.ma.getdata(data.variables["waterdepth"][time_index, :], False) + waterlevel = np.ma.getdata(data.variables["s1"][time_index, :], False) + coords = str(data.variables["waterdepth"].coordinates).split() + + layer_dim = str(data.variables[variable].coordinates) + + cord_sys = cords_to_layers[layer_dim]["coords"] + layer_percentages = np.ma.getdata(cord_sys, False) # accumulative + + if layer_dim == "FlowLink_xu FlowLink_yu": + # interpolate + x_laydim = np.ma.getdata(data.variables[coords[0]][:], False) + y_laydim = np.ma.getdata(data.variables[coords[1]][:], False) + points_laydim = np.array([[x, y] for x, y in zip(x_laydim, y_laydim)]) + coords_request = str(data.variables[variable].coordinates).split() - x_wdim=np.ma.getdata(data.variables[coords_request[0]][:], False) - y_wdim=np.ma.getdata(data.variables[coords_request[1]][:], False) - points_wdim=np.array([ [x, y] for x, y in zip(x_wdim, y_wdim)]) - - bottom_depth_wdim = interp.griddata(points_laydim, bottom_depth, - points_wdim) - water_level_wdim= interp.griddata(points_laydim, waterlevel, - points_wdim) - - idx_bd= np.where(np.isnan(bottom_depth_wdim)) - - for i in 
idx_bd: - bottom_depth_wdim[i]= interp.griddata(points_laydim, bottom_depth, - points_wdim[i], method='nearest') - water_level_wdim[i]= interp.griddata(points_laydim, waterlevel, - points_wdim[i], method='nearest') - - - waterdepth=[] - - if dimensions== 2: - if layer_dim == 'FlowLink_xu FlowLink_yu': + x_wdim = np.ma.getdata(data.variables[coords_request[0]][:], False) + y_wdim = np.ma.getdata(data.variables[coords_request[1]][:], False) + points_wdim = np.array([[x, y] for x, y in zip(x_wdim, y_wdim)]) + + bottom_depth_wdim = interp.griddata(points_laydim, bottom_depth, points_wdim) + water_level_wdim = interp.griddata(points_laydim, waterlevel, points_wdim) + + idx_bd = np.where(np.isnan(bottom_depth_wdim)) + + for i in idx_bd: + bottom_depth_wdim[i] = interp.griddata( + points_laydim, bottom_depth, points_wdim[i], method="nearest" + ) + water_level_wdim[i] = interp.griddata( + points_laydim, waterlevel, points_wdim[i], method="nearest" + ) + + waterdepth = [] + + if dimensions == 2: + if layer_dim == "FlowLink_xu FlowLink_yu": z = [bottom_depth_wdim] - waterlevel=water_level_wdim + waterlevel = water_level_wdim else: z = [bottom_depth] else: - if layer_dim == 'FlowLink_xu FlowLink_yu': - z = [bottom_depth_wdim*layer_percentages[layer_index]] - waterlevel=water_level_wdim + if layer_dim == "FlowLink_xu FlowLink_yu": + z = [bottom_depth_wdim * layer_percentages[layer_index]] + waterlevel = water_level_wdim else: - z = [bottom_depth*layer_percentages[layer_index]] - waterdepth=np.append(waterdepth, z) + z = [bottom_depth * layer_percentages[layer_index]] + waterdepth = np.append(waterdepth, z) + + time = np.ma.getdata(data.variables["time"][time_index], False) * np.ones(len(x)) + + index = np.arange(0, len(time)) + layer_data = xr.Dataset( + data_vars={ + "x": (["index"], x), + "y": (["index"], y), + "waterdepth": (["index"], waterdepth), + "waterlevel": (["index"], waterlevel), + "v": (["index"], v), + "time": (["index"], time), + }, + coords={"index": index}, + 
) + + if to_pandas: + layer_data = layer_data.to_pandas() - time= np.ma.getdata(data.variables['time'][time_index], False)*np.ones(len(x)) + return layer_data - layer= np.array([ [x_i, y_i, d_i, w_i, v_i, t_i] for x_i, y_i, d_i, w_i, v_i, t_i in - zip(x, y, waterdepth, waterlevel, v, time)]) - layer_data = pd.DataFrame(layer, columns=['x', 'y', 'waterdepth','waterlevel', 'v', 'time']) - return layer_data +def create_points(x, y, waterdepth, to_pandas=True): + """ + Generate a Dataset of points from combinations of input coordinates. + + This function accepts three inputs and combines them to generate a + Dataset of points. The inputs can be: + - 3 points + - 2 points and 1 array + - 1 point and 2 arrays + - 3 arrays (x and y must have the same size) + For 3 points or less, every combination will be in the output. + For 3 arrays, x and y are treated as coordinate pairs and combined + with each value from the waterdepth array. -def create_points(x, y, waterdepth): - ''' - Turns three coordinate inputs into a single output DataFrame of points. - In any order the three inputs can consist of 3 points, 2 points and 1 array, - or 1 point and 2 arrays. The final output DataFrame will be the unique - combinations of the 3 inputs. - Parameters ---------- - x: float, array or int - x values to create points. - y: float, array or int - y values to create points. - waterdepth: float, array or int - waterdepth values to create points. + x : int, float, array-like + X values (longitude) for the points. + y : int, float, array-like + Y values (latitude) for the points. + waterdepth : int, float, array-like + Waterdepth values for the points. + to_pandas : bool (optional) + Flag to output pandas instead of xarray. Default = True. Returns ------- - points: DateFrame - DataFrame with columns x, y and waterdepth points. - - Example + points : xr.Dataset or pd.DataFrame + A Dataset with columns 'x', 'y', and 'waterdepth' representing the generated points. 
+ + Example ------- - If the inputs are 2 arrays: and [3,4,5] and 1 point [6], the output - will contain 6 array combinations of the 3 inputs as shown. - - x=np.array([1,2]) - y=np.array([3,4,5]) - waterdepth= 6 - d3d.create_points(x,y,waterdepth) - + 2 arrays and 1 point: + >>> x = np.array([1, 2]) + >>> y = np.array([3, 4, 5]) + >>> waterdepth = 6 + >>> create_points(x, y, waterdepth) + x y waterdepth 0 1.0 3.0 6.0 1 2.0 3.0 6.0 2 1.0 4.0 6.0 3 2.0 4.0 6.0 4 1.0 5.0 6.0 - 5 2.0 5.0 6.0 - ''' - - assert isinstance(x, (int, float, np.ndarray)), ('x must be a int, float' - +' or array') - assert isinstance(y, (int, float, np.ndarray)), ('y must be a int, float' - +' or array') - assert isinstance(waterdepth, (int, float, np.ndarray)), ('waterdepth must be a int, float' - +' or array') - - directions = {0:{'name': 'x', - 'values': x}, - 1:{'name': 'y', - 'values': y}, - 2:{'name': 'waterdepth', - 'values': waterdepth}} - - for i in directions: - try: - N=len(directions[i]['values']) - except: - directions[i]['values'] = np.array([directions[i]['values']]) - N=len(directions[i]['values']) - if N == 1 : - directions[i]['type']= 'point' - elif N > 1 : - directions[i]['type']= 'array' - else: - raise Exception(f'length of direction {directions[i]["name"]} was' - +'neagative or zero') - - # Check how many times point is in "types" - types= [directions[i]['type'] for i in directions] - N_points = types.count('point') - - if N_points >= 2: - lens = np.array([len(directions[d]['values']) for d in directions]) - max_len_idx = lens.argmax() - not_max_idxs= [i for i in directions.keys()] - - del not_max_idxs[max_len_idx] - - for not_max in not_max_idxs: - N= len(directions[max_len_idx]['values']) - vals =np.ones(N)*directions[not_max]['values'] - directions[not_max]['values'] = np.array(vals) - - x_new = directions[0]['values'] - y_new = directions[1]['values'] - depth_new = directions[2]['values'] - - request= np.array([ [x_i, y_i, depth_i] for x_i, y_i, depth_i in zip(x_new, 
- y_new, depth_new)]) - points= pd.DataFrame(request, columns=[ 'x', 'y', 'waterdepth']) - - elif N_points == 1: - # treat as plane - #find index of point - idx_point = types.index('point') - max_idxs= [i for i in directions.keys()] - print(max_idxs) - del max_idxs[idx_point] - #find vectors - XX, YY = np.meshgrid(directions[max_idxs[0]]['values'], - directions[max_idxs[1]]['values'] ) - N_X=np.shape(XX)[1] - N_Y=np.shape(YY)[0] - ZZ= np.ones((N_Y,N_X))*directions[idx_point]['values'] - - request= np.array([ [x_i, y_i, z_i] for x_i, y_i, z_i in zip(XX.ravel(), - YY.ravel() , ZZ.ravel())]) - columns=[ directions[max_idxs[0]]['name'], - directions[max_idxs[1]]['name'], directions[idx_point]['name']] - - points= pd.DataFrame(request, columns=columns) - else: - raise Exception('Can provide at most two arrays') - - return points - - -def variable_interpolation(data, variables, points='cells', edges= 'none'): - ''' - Interpolate multiple variables from the Delft3D onto the same points. + 5 2.0 5.0 6.0 + + 3 arrays (x and y must have the same length): + >>> x = np.array([1, 2, 3]) + >>> y = np.array([4, 5, 6]) + >>> waterdepth = np.array([1, 2]) + >>> create_points(x, y, waterdepth) + + x y waterdepth + 0 1.0 4.0 1.0 + 1 2.0 5.0 1.0 + 2 3.0 6.0 1.0 + 3 1.0 4.0 2.0 + 4 2.0 5.0 2.0 + 5 4.0 6.0 2.0 + """ + + # Check input types + inputs = {"x": x, "y": y, "waterdepth": waterdepth} + for name, value in inputs.items(): + # Convert lists to numpy arrays + if isinstance(value, list): + value = np.array(value) + inputs[name] = value # Update the value in the dictionary + + # Check data type + if not isinstance(value, (int, float, np.ndarray, pd.Series, xr.DataArray)): + raise TypeError( + f"{name} must be an int, float, np.ndarray, pd.Series, or xr.DataArray. 
Got: {type(value)}" + ) + + # Check for empty arrays + if isinstance(value, (np.ndarray, pd.Series, xr.DataArray)) and len(value) == 0: + raise ValueError(f"{name} should not be an empty array") + + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. Got: {type(to_pandas)}") + + x_array_like = not isinstance(x, (int, float)) + y_array_like = not isinstance(y, (int, float)) + waterdepth_array_like = not isinstance(waterdepth, (int, float)) + + if x_array_like and y_array_like and waterdepth_array_like: + # if all inputs are arrays, grid the coordinate and waterdepth + y_grid, waterdepth_grid = np.meshgrid(y, waterdepth) + y_grid = y_grid.ravel() + waterdepth_grid = waterdepth_grid.ravel() + + x_grid, _ = np.meshgrid(x, waterdepth) + x_grid = x_grid.ravel() + else: + # if at least one input is a point, grid all inputs + x_grid, y_grid, waterdepth_grid = np.meshgrid(x, y, waterdepth) + x_grid = x_grid.ravel() + y_grid = y_grid.ravel() + waterdepth_grid = waterdepth_grid.ravel() + + index = np.arange(0, len(x_grid)) + points = xr.Dataset( + data_vars={ + "x": (["index"], x_grid), + "y": (["index"], y_grid), + "waterdepth": (["index"], waterdepth_grid), + }, + coords={"index": index}, + ) + + if to_pandas: + points = points.to_pandas() + + return points + + +def variable_interpolation( + data, + variables, + points="cells", + edges="none", + x_max_lim=float("inf"), + x_min_lim=float("-inf"), + y_max_lim=float("inf"), + y_min_lim=float("-inf"), + to_pandas=True, +): + """ + Interpolate multiple variables from the Delft3D onto the same points. Parameters ---------- - data: NetCDF4 object + data: NetCDF4 object A NetCDF4 object that contains spatial data, e.g. velocity or shear - stress generated by running a Delft3D model. + stress generated by running a Delft3D model. variables: array of strings Name of variables to interpolate, e.g. 'turkin1', 'ucx', 'ucy' and 'ucz'. 
The full list can be found using "data.variables.keys()" in the console. - points: string, DataFrame + points: string, pd.DataFrame, or xr.Dataset The points to interpolate data onto. 'cells'- interpolates all data onto the Delft3D cell coordinate system (Default) - 'faces'- interpolates all dada onto the Delft3D face coordinate system - DataFrame of x, y, and waterdepth coordinates - Interpolates data onto user + 'faces'- interpolates all dada onto the Delft3D face coordinate system + Dataset of x, y, and waterdepth coordinates - Interpolates data onto user povided points. Can be created with `create_points` function. - edges: sting: 'nearest' - If edges is set to 'nearest' the code will fill in nan values with nearest - interpolation. Otherwise only linear interpolarion will be used. - + edges: string: 'nearest' + If edges is set to 'nearest' the code will fill in nan values with nearest + interpolation. Otherwise only linear interpolarion will be used. + to_pandas : bool (optional) + Flag to output pandas instead of xarray. Default = True. + Returns ------- - transformed_data: DataFrame - Variables on specified grid points saved under the input variable names - and the x, y, and waterdepth coordinates of those points. - ''' - - assert isinstance(points, (str, pd.DataFrame)),('points must be a string ' - +'or DataFrame') - if isinstance ( points, str): - assert any([points == 'cells', points=='faces']), ('points must be' - +' cells or faces') - assert type(data)== netCDF4._netCDF4.Dataset, 'data must be nerCDF4 object' + transformed_data: pd.DataFrame or xr.Dataset + Variables on specified grid points saved under the input variable names + and the x, y, and waterdepth coordinates of those points. + """ + + if not isinstance(points, (str, pd.DataFrame, xr.Dataset)): + raise TypeError( + f"points must be a string, pd.DataFrame, or xr.Dataset. Got {type(points)}." 
+ ) + + if isinstance(points, xr.Dataset): + points = points.to_pandas() + + if isinstance(points, str): + if not (points == "cells" or points == "faces"): + raise ValueError( + f"If a string, points must be cells or faces. Got {points}" + ) + + if not isinstance(data, netCDF4._netCDF4.Dataset): + raise TypeError(f"data must be netCDF4 object. Got {type(data)}") + + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. Got: {type(to_pandas)}") data_raw = {} for var in variables: - var_data_df = get_all_data_points(data, var,time_index=-1) - var_data_df=var_data_df.loc[:,~var_data_df.T.duplicated(keep='first')] - data_raw[var] = var_data_df - if type(points) == pd.DataFrame: - print('points provided') - elif points=='faces': - points = data_raw['ucx'][['x','y','waterdepth']] - elif points=='cells': - points = data_raw['turkin1'][['x','y','waterdepth']] - - transformed_data= points.copy(deep=True) - - for var in variables : - transformed_data[var] = interp.griddata(data_raw[var][['x','y','waterdepth']], - data_raw[var][var], points[['x','y','waterdepth']]) - if edges == 'nearest' : - idx= np.where(np.isnan(transformed_data[var])) - + var_data_df = get_all_data_points(data, var, time_index=-1, to_pandas=True) + var_data_df["depth"] = var_data_df.waterdepth - var_data_df.waterlevel # added + var_data_df = var_data_df.loc[:, ~var_data_df.T.duplicated(keep="first")] + var_data_df = var_data_df[var_data_df.x > x_min_lim] + var_data_df = var_data_df[var_data_df.x < x_max_lim] + var_data_df = var_data_df[var_data_df.y > y_min_lim] + var_data_df = var_data_df[var_data_df.y < y_max_lim] + data_raw[var] = var_data_df + if isinstance(points, pd.DataFrame): + print("points provided") + elif points == "faces": + points = data_raw["ucx"][["x", "y", "waterdepth"]] + elif points == "cells": + points = data_raw["turkin1"][["x", "y", "waterdepth"]] + + transformed_data = points.copy(deep=True) + + for var in variables: + transformed_data[var] = 
interp.griddata( + data_raw[var][["x", "y", "waterdepth"]], # waterdepth to depth + data_raw[var][var], + points[["x", "y", "waterdepth"]], + ) + if edges == "nearest": + idx = np.where(np.isnan(transformed_data[var])) + if len(idx[0]): - for i in idx[0]: - transformed_data[var][i]= (interp - .griddata(data_raw[var][['x','y','waterdepth']], - data_raw[var][var], - [points['x'][i],points['y'][i], - points['waterdepth'][i]], method='nearest')) - + for i in idx[0]: + transformed_data[var][i] = interp.griddata( + data_raw[var][["x", "y", "waterdepth"]], + data_raw[var][var], + [points["x"][i], points["y"][i], points["waterdepth"][i]], + method="nearest", + ) + + if not to_pandas: + transformed_data = transformed_data.to_dataset() + return transformed_data -def get_all_data_points(data, variable, time_index=-1): - ''' - Get data points for a passed variable for all layers at a specified time from - the Delft3D NetCDF4 object by iterating over the `get_layer_data` function. +def get_all_data_points(data, variable, time_index=-1, to_pandas=True): + """ + Get data points for a passed variable for all layers at a specified time from + the Delft3D NetCDF4 object by iterating over the `get_layer_data` function. Parameters ---------- - data: Netcdf4 object + data: Netcdf4 object A NetCDF4 object that contains spatial data, e.g. velocity or shear - stress, generated by running a Delft3D model. + stress, generated by running a Delft3D model. variable: string Delft3D variable. The full list can be of variables can be - found using "data.variables.keys()" in the console. + found using "data.variables.keys()" in the console. time_index: int - An integer to pull the time step from the dataset. + An integer to pull the time step from the dataset. Default is last time step, found with the input -1. - + to_pandas : bool (optional) + Flag to output pandas instead of xarray. Default = True. 
+ Returns ------- - all_data: DataFrame + all_data: xr.Dataset or pd.Dataframe Dataframe with columns x, y, waterdepth, waterlevel, variable, and time. - The waterdepth is measured from the water surface and the "waterlevel" is + The waterdepth is measured from the water surface and the "waterlevel" is the water level diffrence in meters from the zero water level. - - ''' - - assert isinstance(time_index, int), 'time_index must be a int' - assert type(data)== netCDF4._netCDF4.Dataset, 'data must be NetCDF4 object' - assert variable in data.variables.keys(), 'variable not recognized' + + """ + + if not isinstance(time_index, int): + raise TypeError("time_index must be an int") + + if not isinstance(data, netCDF4._netCDF4.Dataset): + raise TypeError("data must be NetCDF4 object") + + if variable not in data.variables.keys(): + raise ValueError("variable not recognized") + + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. Got: {type(to_pandas)}") max_time_index = len(data.variables[variable][:]) - assert abs(time_index) <= max_time_index, (f'time_index must be less than' - +'the max time index {max_time_index}') + if abs(time_index) > max_time_index: + raise ValueError( + f"time_index must be less than the max time index {max_time_index}" + ) if "mesh2d" in variable: - cords_to_layers= {'mesh2d_face_x mesh2d_face_y': {'name':'mesh2d_nLayers', - 'coords':data.variables['mesh2d_layer_sigma'][:]}, - 'mesh2d_edge_x mesh2d_edge_y': {'name':'mesh2d_nInterfaces', - 'coords':data.variables['mesh2d_interface_sigma'][:]}} + cords_to_layers = { + "mesh2d_face_x mesh2d_face_y": { + "name": "mesh2d_nLayers", + "coords": data.variables["mesh2d_layer_sigma"][:], + }, + "mesh2d_edge_x mesh2d_edge_y": { + "name": "mesh2d_nInterfaces", + "coords": data.variables["mesh2d_interface_sigma"][:], + }, + } + + elif str(data.variables[variable].coordinates) == "FlowElem_xcc FlowElem_ycc": + cords_to_layers = { + "FlowElem_xcc FlowElem_ycc": { + "name": 
"laydim", + "coords": data.variables["LayCoord_cc"][:], + }, + "FlowLink_xu FlowLink_yu": { + "name": "wdim", + "coords": data.variables["LayCoord_w"][:], + }, + } + else: + cords_to_layers = { + "FlowElem_xcc FlowElem_ycc LayCoord_cc LayCoord_cc": { + "name": "laydim", + "coords": data.variables["LayCoord_cc"][:], + }, + "FlowLink_xu FlowLink_yu": { + "name": "wdim", + "coords": data.variables["LayCoord_w"][:], + }, + } + + layer_dim = str(data.variables[variable].coordinates) + + try: + cord_sys = cords_to_layers[layer_dim]["coords"] + except: + raise Exception("Coordinates not recognized.") else: - cords_to_layers= {'FlowElem_xcc FlowElem_ycc':{'name':'laydim', - 'coords':data.variables['LayCoord_cc'][:]}, - 'FlowLink_xu FlowLink_yu': {'name':'wdim', - 'coords':data.variables['LayCoord_w'][:]}} - - layer_dim = str(data.variables[variable].coordinates) - - try: - cord_sys= cords_to_layers[layer_dim]['coords'] - except: - raise Exception('Coordinates not recognized.') - else: - layer_percentages= np.ma.getdata(cord_sys, False) - - x_all=[] - y_all=[] - depth_all=[] - water_level_all=[] - v_all=[] - time_all=[] - + layer_percentages = np.ma.getdata(cord_sys, False) + + x_all = [] + y_all = [] + depth_all = [] + water_level_all = [] + v_all = [] + time_all = [] + layers = range(len(layer_percentages)) for layer in layers: - layer_data= get_layer_data(data, variable, layer, time_index) - - x_all=np.append(x_all, layer_data.x) - y_all=np.append(y_all, layer_data.y) - depth_all=np.append(depth_all, layer_data.waterdepth) - water_level_all=np.append(water_level_all, layer_data.waterlevel) - v_all=np.append(v_all, layer_data.v) - time_all= np.append(time_all, layer_data.time) - - known_points = np.array([ [x, y, waterdepth, waterlevel, v, time] - for x, y, waterdepth, waterlevel, v, time in zip(x_all, y_all, - depth_all, water_level_all, v_all, time_all)]) - - all_data= pd.DataFrame(known_points, columns=['x','y','waterdepth', 'waterlevel' - ,f'{variable}', 'time']) + 
layer_data = get_layer_data(data, variable, layer, time_index) + + x_all = np.append(x_all, layer_data.x) + y_all = np.append(y_all, layer_data.y) + depth_all = np.append(depth_all, layer_data.waterdepth) + water_level_all = np.append(water_level_all, layer_data.waterlevel) + v_all = np.append(v_all, layer_data.v) + time_all = np.append(time_all, layer_data.time) + + index = np.arange(0, len(time_all)) + all_data = xr.Dataset( + data_vars={ + "x": (["index"], x_all), + "y": (["index"], y_all), + "waterdepth": (["index"], depth_all), + "waterlevel": (["index"], water_level_all), + f"{variable}": (["index"], v_all), + "time": (["index"], time_all), + }, + coords={"index": index}, + ) + + if to_pandas: + all_data = all_data.to_pandas() return all_data - -def turbulent_intensity(data, points='cells', time_index= -1, - intermediate_values = False ): - ''' - Calculate the turbulent intensity percentage for a given data set for the +def turbulent_intensity( + data, points="cells", time_index=-1, intermediate_values=False, to_pandas=True +): + """ + Calculate the turbulent intensity percentage for a given data set for the specified points. Assumes variable names: ucx, ucy, ucz and turkin1. Parameters ---------- - data : NetCDF4 object + data: NetCDF4 object A NetCDF4 object that contains spatial data, e.g. velocity or shear stress, generated by running a Delft3D model. - points : string, DataFrame - Points to interpolate data onto. - 'cells': interpolates all data onto velocity coordinate system (Default). - 'faces': interpolates all data onto the TKE coordinate system. - DataFrame of x, y, and z coordinates: Interpolates data onto user - provided points. - time_index : int + points: string, pd.DataFrame, xr.Dataset + Points to interpolate data onto. + 'cells': interpolates all data onto velocity coordinate system (Default). + 'faces': interpolates all data onto the TKE coordinate system. 
+ DataFrame of x, y, and z coordinates: Interpolates data onto user + provided points. + time_index: int An integer to pull the time step from the dataset. Default is - late time step -1. - intermediate_values : boolean (optional) - If false the function will return position and turbulent intensity values. + late time step -1. + intermediate_values: boolean (optional) + If false the function will return position and turbulent intensity values. If true the function will return position(x,y,z) and values need to calculate turbulent intensity (ucx, uxy, uxz and turkin1) in a Dataframe. Default False. - + to_pandas : bool (optional) + Flag to output pandas instead of xarray. Default = True. + Returns ------- - TI_data : Dataframe - If intermediate_values is true all values are output. - If intermediate_values is equal to false only turbulent_intesity and - x, y, and z variables are output. - x- position in the x direction - y- position in the y direction + TI_data: xr.Dataset or pd.DataFrame + If intermediate_values is true all values are output. + If intermediate_values is equal to false only turbulent_intesity and + x, y, and z variables are output. 
+ x- position in the x direction + y- position in the y direction waterdepth- position in the vertical direction turbulet_intesity- turbulent kinetic energy divided by the root mean squared velocity - turkin1- turbulent kinetic energy - ucx- velocity in the x direction - ucy- velocity in the y direction - ucz- velocity in the vertical direction - ''' - - assert isinstance(points, (str, pd.DataFrame)),('points must a string or' - +' DataFrame') - if isinstance ( points, str): - assert any([points == 'cells', points=='faces']), ('points must be cells' - +' or faces') - assert isinstance(time_index, int), 'time_index must be a int' - max_time_index= data['time'].shape[0]-1 # to account for zero index - assert abs(time_index) <= max_time_index, (f'time_index must be less than' - +'the absolute value of the max time index {max_time_index}') - assert type(data)== netCDF4._netCDF4.Dataset, 'data must be nerCDF4 object' - assert 'turkin1' in data.variables.keys(), ('Varaiable turkin1 not' - +' present in Data') - assert 'ucx' in data.variables.keys(),'Varaiable ucx 1 not present in Data' - assert 'ucy' in data.variables.keys(),'Varaiable ucy 1 not present in Data' - assert 'ucz' in data.variables.keys(),'Varaiable ucz 1 not present in Data' - - TI_vars= ['turkin1', 'ucx', 'ucy', 'ucz'] + turkin1- turbulent kinetic energy + ucx- velocity in the x direction + ucy- velocity in the y direction + ucz- velocity in the vertical direction + """ + + if not isinstance(points, (str, pd.DataFrame, xr.Dataset)): + raise TypeError("points must be a string, pd.DataFrame, xr.Dataset") + + if isinstance(points, str): + if not (points == "cells" or points == "faces"): + raise ValueError("points must be cells or faces") + + if not isinstance(time_index, int): + raise TypeError("time_index must be an int") + + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. 
Got: {type(to_pandas)}") + + if isinstance(points, xr.Dataset): + points = points.to_pandas() + + max_time_index = data["time"].shape[0] - 1 # to account for zero index + if abs(time_index) > max_time_index: + raise ValueError( + f"time_index must be less than the absolute value of the max time index {max_time_index}" + ) + + if not isinstance(data, netCDF4._netCDF4.Dataset): + raise TypeError("data must be netCDF4 object") + + for variable in ["turkin1", "ucx", "ucy", "ucz"]: + if variable not in data.variables.keys(): + raise ValueError(f"Variable {variable} not present in Data") + + TI_vars = ["turkin1", "ucx", "ucy", "ucz"] TI_data_raw = {} for var in TI_vars: - var_data_df = get_all_data_points(data, var ,time_index) - TI_data_raw[var] = var_data_df - if type(points) == pd.DataFrame: - print('points provided') - elif points=='faces': - points = TI_data_raw['turkin1'].drop(['waterlevel','turkin1'],axis=1) - elif points=='cells': - points = TI_data_raw['ucx'].drop(['waterlevel','ucx'],axis=1) - + var_data_df = get_all_data_points(data, var, time_index) + TI_data_raw[var] = var_data_df + if type(points) == pd.DataFrame: + print("points provided") + elif points == "faces": + points = TI_data_raw["turkin1"].drop(["waterlevel", "turkin1"], axis=1) + elif points == "cells": + points = TI_data_raw["ucx"].drop(["waterlevel", "ucx"], axis=1) + TI_data = points.copy(deep=True) - for var in TI_vars: - TI_data[var] = interp.griddata(TI_data_raw[var][['x','y','waterdepth']], - TI_data_raw[var][var], points[['x','y','waterdepth']]) - idx= np.where(np.isnan(TI_data[var])) - + for var in TI_vars: + TI_data[var] = interp.griddata( + TI_data_raw[var][["x", "y", "waterdepth"]], + TI_data_raw[var][var], + points[["x", "y", "waterdepth"]], + ) + idx = np.where(np.isnan(TI_data[var])) + if len(idx[0]): - for i in idx[0]: - TI_data[var][i]= interp.griddata(TI_data_raw[var][['x','y','waterdepth']], - TI_data_raw[var][var], - [points['x'][i],points['y'][i], points['waterdepth'][i]], - 
method='nearest') - - u_mag=unorm(np.array(TI_data['ucx']),np.array(TI_data['ucy']), - np.array(TI_data['ucz'])) - - neg_index=np.where( TI_data['turkin1']<0) - zero_bool= np.isclose( TI_data['turkin1'][ TI_data['turkin1']<0].array, - np.zeros(len( TI_data['turkin1'][TI_data['turkin1']<0].array)), - atol=1.0e-4) - zero_ind= neg_index[0][zero_bool] - non_zero_ind= neg_index[0][~zero_bool] - TI_data.loc[zero_ind,'turkin1']=np.zeros(len(zero_ind)) - TI_data.loc[non_zero_ind,'turkin1']=[np.nan]*len(non_zero_ind) - - TI_data['turbulent_intensity']= np.sqrt(2/3*TI_data['turkin1'])/u_mag * 100 #% - + for i in idx[0]: + TI_data[var][i] = interp.griddata( + TI_data_raw[var][["x", "y", "waterdepth"]], + TI_data_raw[var][var], + [points["x"][i], points["y"][i], points["waterdepth"][i]], + method="nearest", + ) + + u_mag = unorm( + np.array(TI_data["ucx"]), np.array(TI_data["ucy"]), np.array(TI_data["ucz"]) + ) + + neg_index = np.where(TI_data["turkin1"] < 0) + zero_bool = np.isclose( + TI_data["turkin1"][TI_data["turkin1"] < 0].array, + np.zeros(len(TI_data["turkin1"][TI_data["turkin1"] < 0].array)), + atol=1.0e-4, + ) + zero_ind = neg_index[0][zero_bool] + non_zero_ind = neg_index[0][~zero_bool] + TI_data.loc[zero_ind, "turkin1"] = np.zeros(len(zero_ind)) + TI_data.loc[non_zero_ind, "turkin1"] = [np.nan] * len(non_zero_ind) + + TI_data["turbulent_intensity"] = ( + np.sqrt(2 / 3 * TI_data["turkin1"]) / u_mag * 100 + ) # % + if intermediate_values == False: - TI_data= TI_data.drop(TI_vars, axis = 1) - + TI_data = TI_data.drop(TI_vars, axis=1) + + if not to_pandas: + TI_data = TI_data.to_dataset() + return TI_data diff --git a/mhkit/river/io/usgs.py b/mhkit/river/io/usgs.py index 4583d458c..54c97966c 100644 --- a/mhkit/river/io/usgs.py +++ b/mhkit/river/io/usgs.py @@ -1,28 +1,38 @@ -import pandas as pd -import numpy as np +import os import json import requests +import shutil +import pandas as pd +from mhkit.utils.cache import handle_caching -def _read_usgs_json(text): - + +def 
_read_usgs_json(text, to_pandas=True): data = pd.DataFrame() - for i in range(len(text['value']['timeSeries'])): + for i in range(len(text["value"]["timeSeries"])): try: - site_name = text['value']['timeSeries'][i]['variable']['variableDescription'] #text['value']['timeSeries'][i]['sourceInfo']['siteName'] - site_data = pd.DataFrame(text['value']['timeSeries'][i]['values'][0]['value']) - site_data.set_index('dateTime', drop=True, inplace=True) + site_name = text["value"]["timeSeries"][i]["variable"][ + "variableDescription" + ] + site_data = pd.DataFrame( + text["value"]["timeSeries"][i]["values"][0]["value"] + ) + site_data.set_index("dateTime", drop=True, inplace=True) site_data.index = pd.to_datetime(site_data.index, utc=True) - site_data.rename(columns={'value': site_name}, inplace=True) + site_data.rename(columns={"value": site_name}, inplace=True) site_data[site_name] = pd.to_numeric(site_data[site_name]) site_data.index.name = None - del site_data['qualifiers'] + del site_data["qualifiers"] data = data.combine_first(site_data) except: pass - - return data # we could also extract metadata and return that here -def read_usgs_file(file_name): + if not to_pandas: + data = data.to_dataset() + + return data + + +def read_usgs_file(file_name, to_pandas=True): """ Reads a USGS JSON data file (from https://waterdata.usgs.gov/nwis) @@ -30,27 +40,41 @@ def read_usgs_file(file_name): ---------- file_name : str Name of USGS JSON data file - + to_pandas: bool (optional) + Flag to output pandas instead of xarray. Default = True. + Returns ------- - data : pandas DataFrame - Data indexed by datetime with columns named according to the parameter's + data : pandas DataFrame or xarray Dataset + Data indexed by datetime with columns named according to the parameter's variable description """ + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. 
Got: {type(to_pandas)}") + with open(file_name) as json_file: text = json.load(json_file) - - data = _read_usgs_json(text) - - return data + + data = _read_usgs_json(text, to_pandas) + + return data -def request_usgs_data(station, parameter, start_date, end_date, - data_type='Daily', proxy=None, write_json=None): +def request_usgs_data( + station, + parameter, + start_date, + end_date, + data_type="Daily", + proxy=None, + write_json=None, + clear_cache=False, + to_pandas=True, +): """ - Loads USGS data directly from https://waterdata.usgs.gov/nwis using a + Loads USGS data directly from https://waterdata.usgs.gov/nwis using a GET request - + The request URL prints to the screen. Parameters @@ -64,43 +88,89 @@ def request_usgs_data(station, parameter, start_date, end_date, end_date : str End date in the format 'YYYY-MM-DD' (e.g. '2018-12-31') data_type : str - Data type, options include 'Daily' (return the mean daily value) and + Data type, options include 'Daily' (return the mean daily value) and 'Instantaneous'. proxy : dict or None - To request data from behind a firewall, define a dictionary of proxy settings, + To request data from behind a firewall, define a dictionary of proxy settings, for example {"http": 'localhost:8080'} write_json : str or None Name of json file to write data - + clear_cache : bool + If True, the cache for this specific request will be cleared. + to_pandas: bool (optional) + Flag to output pandas instead of xarray. Default = True. 
+ Returns ------- - data : pandas DataFrame - Data indexed by datetime with columns named according to the parameter's + data : pandas DataFrame or xarray Dataset + Data indexed by datetime with columns named according to the parameter's variable description """ - assert data_type in ['Daily', 'Instantaneous'], 'data_type must be Daily or Instantaneous' - - if data_type == 'Daily': - data_url = 'https://waterservices.usgs.gov/nwis/dv' - api_query = '/?format=json&sites='+station+ \ - '&startDT='+start_date+'&endDT='+end_date+ \ - '&statCd=00003'+ \ - '¶meterCd='+parameter+'&siteStatus=all' + if not data_type in ["Daily", "Instantaneous"]: + raise ValueError(f"data_type must be Daily or Instantaneous. Got: {data_type}") + + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. Got: {type(to_pandas)}") + + # Define the path to the cache directory + cache_dir = os.path.join(os.path.expanduser("~"), ".cache", "mhkit", "usgs") + + # Create a unique filename based on the function parameters + hash_params = f"{station}_{parameter}_{start_date}_{end_date}_{data_type}" + + # Use handle_caching to manage cache + cached_data, metadata, cache_filepath = handle_caching( + hash_params, cache_dir, write_json, clear_cache + ) + + if cached_data is not None: + return cached_data + + # If no cached data, proceed with the API request + if data_type == "Daily": + data_url = "https://waterservices.usgs.gov/nwis/dv" + api_query = ( + "/?format=json&sites=" + + station + + "&startDT=" + + start_date + + "&endDT=" + + end_date + + "&statCd=00003" + + "¶meterCd=" + + parameter + + "&siteStatus=all" + ) else: - data_url = 'https://waterservices.usgs.gov/nwis/iv' - api_query = '/?format=json&sites='+station+ \ - '&startDT='+start_date+'&endDT='+end_date+ \ - '¶meterCd='+parameter+'&siteStatus=all' - - print('Data request URL: ', data_url+api_query) - - response = requests.get(url=data_url+api_query,proxies=proxy) + data_url = 
"https://waterservices.usgs.gov/nwis/iv" + api_query = ( + "/?format=json&sites=" + + station + + "&startDT=" + + start_date + + "&endDT=" + + end_date + + "¶meterCd=" + + parameter + + "&siteStatus=all" + ) + + print("Data request URL: ", data_url + api_query) + + response = requests.get(url=data_url + api_query, proxies=proxy) text = json.loads(response.text) - - if write_json is not None: - with open(write_json, 'w') as outfile: - json.dump(text, outfile) - - data = _read_usgs_json(text) - - return data + + # handle_caching is only set-up for pandas, so force this data to output as pandas for now + data = _read_usgs_json(text, True) + + # After making the API request and processing the response, write the + # response to a cache file + handle_caching(hash_params, cache_dir, data=data, clear_cache_file=clear_cache) + + if write_json: + shutil.copy(cache_filepath, write_json) + + if not to_pandas: + data = data.to_dataset() + + return data diff --git a/mhkit/river/performance.py b/mhkit/river/performance.py index ac4529793..c805517ab 100644 --- a/mhkit/river/performance.py +++ b/mhkit/river/performance.py @@ -1,15 +1,16 @@ import numpy as np + def circular(diameter): """ - Calculates the equivalent diameter and projected capture area of a + Calculates the equivalent diameter and projected capture area of a circular turbine - + Parameters ------------ diameter : int/float Turbine diameter [m] - + Returns --------- equivalent_diameter : float @@ -17,23 +18,25 @@ def circular(diameter): projected_capture_area : float Projected capture area [m^2] """ - assert isinstance(diameter, (int,float)), 'diameter must be of type int or float' - + if not isinstance(diameter, (int, float)): + raise TypeError(f"diameter must be of type int or float. 
Got: {type(diameter)}") + equivalent_diameter = diameter - projected_capture_area = (1/4)*np.pi*(equivalent_diameter**2) - + projected_capture_area = (1 / 4) * np.pi * (equivalent_diameter**2) + return equivalent_diameter, projected_capture_area + def ducted(duct_diameter): """ Calculates the equivalent diameter and projected capture area of a ducted turbine - + Parameters ------------ duct_diameter : int/float Duct diameter [m] - + Returns --------- equivalent_diameter : float @@ -41,25 +44,29 @@ def ducted(duct_diameter): projected_capture_area : float Projected capture area [m^2] """ - assert isinstance(duct_diameter, (int,float)), 'duct_diameter must be of type int or float' - + if not isinstance(duct_diameter, (int, float)): + raise TypeError( + f"duct_diameter must be of type int or float. Got: {type(duct_diameter)}" + ) + equivalent_diameter = duct_diameter - projected_capture_area = (1/4)*np.pi*(equivalent_diameter**2) + projected_capture_area = (1 / 4) * np.pi * (equivalent_diameter**2) return equivalent_diameter, projected_capture_area + def rectangular(h, w): """ - Calculates the equivalent diameter and projected capture area of a + Calculates the equivalent diameter and projected capture area of a retangular turbine - + Parameters ------------ h : int/float Turbine height [m] w : int/float Turbine width [m] - + Returns --------- equivalent_diameter : float @@ -67,24 +74,27 @@ def rectangular(h, w): projected_capture_area : float Projected capture area [m^2] """ - assert isinstance(h, (int,float)), 'h must be of type int or float' - assert isinstance(w, (int,float)), 'w must be of type int or float' - - equivalent_diameter = np.sqrt(4.*h*w / np.pi) - projected_capture_area = h*w + if not isinstance(h, (int, float)): + raise TypeError(f"h must be of type int or float. Got: {type(h)}") + if not isinstance(w, (int, float)): + raise TypeError(f"w must be of type int or float. 
Got: {type(w)}") + + equivalent_diameter = np.sqrt(4.0 * h * w / np.pi) + projected_capture_area = h * w return equivalent_diameter, projected_capture_area + def multiple_circular(diameters): """ - Calculates the equivalent diameter and projected capture area of a + Calculates the equivalent diameter and projected capture area of a multiple circular turbine - + Parameters ------------ - diameters: list + diameters: list List of device diameters [m] - + Returns --------- equivalent_diameter : float @@ -92,16 +102,18 @@ def multiple_circular(diameters): projected_capture_area : float Projected capture area [m^2] """ - assert isinstance(diameters, list), 'diameters must be of type list' - + if not isinstance(diameters, list): + raise TypeError(f"diameters must be of type list. Got: {type(diameters)}") + diameters_squared = [x**2 for x in diameters] equivalent_diameter = np.sqrt(sum(diameters_squared)) - projected_capture_area = 0.25*np.pi*sum(diameters_squared) + projected_capture_area = 0.25 * np.pi * sum(diameters_squared) return equivalent_diameter, projected_capture_area -def tip_speed_ratio(rotor_speed,rotor_diameter,inflow_speed): - ''' + +def tip_speed_ratio(rotor_speed, rotor_diameter, inflow_speed): + """ Function used to calculate the tip speed ratio (TSR) of a MEC device with rotor Parameters @@ -117,24 +129,31 @@ def tip_speed_ratio(rotor_speed,rotor_diameter,inflow_speed): -------- TSR : numpy array Calculated tip speed ratio (TSR) - ''' - - try: rotor_speed = np.asarray(rotor_speed) - except: 'rotor_speed must be of type np.ndarray' - try: inflow_speed = np.asarray(inflow_speed) - except: 'inflow_speed must be of type np.ndarray' - - assert isinstance(rotor_diameter, (float,int)), 'rotor diameter must be of type int or float' + """ + try: + rotor_speed = np.asarray(rotor_speed) + except: + "rotor_speed must be of type np.ndarray" + try: + inflow_speed = np.asarray(inflow_speed) + except: + "inflow_speed must be of type np.ndarray" - rotor_velocity = 
rotor_speed * np.pi*rotor_diameter + if not isinstance(rotor_diameter, (float, int)): + raise TypeError( + f"rotor_diameter must be of type int or float. Got: {type(rotor_diameter)}" + ) + + rotor_velocity = rotor_speed * np.pi * rotor_diameter TSR = rotor_velocity / inflow_speed return TSR -def power_coefficient(power,inflow_speed,capture_area,rho): - ''' + +def power_coefficient(power, inflow_speed, capture_area, rho): + """ Function that calculates the power coefficient of MEC device Parameters @@ -152,20 +171,27 @@ def power_coefficient(power,inflow_speed,capture_area,rho): -------- Cp : numpy array Power coefficient of device [-] - ''' - - try: power = np.asarray(power) - except: 'power must be of type np.ndarray' - try: inflow_speed = np.asarray(inflow_speed) - except: 'inflow_speed must be of type np.ndarray' - - assert isinstance(capture_area, (float,int)), 'capture_area must be of type int or float' - assert isinstance(rho, (float,int)), 'rho must be of type int or float' + """ + + try: + power = np.asarray(power) + except: + "power must be of type np.ndarray" + try: + inflow_speed = np.asarray(inflow_speed) + except: + "inflow_speed must be of type np.ndarray" + + if not isinstance(capture_area, (float, int)): + raise TypeError( + f"capture_area must be of type int or float. Got: {type(capture_area)}" + ) + if not isinstance(rho, (float, int)): + raise TypeError(f"rho must be of type int or float. 
Got: {type(rho)}") # Predicted power from inflow - power_in = (0.5 * rho * capture_area * inflow_speed**3) + power_in = 0.5 * rho * capture_area * inflow_speed**3 - Cp = power / power_in + Cp = power / power_in return Cp - diff --git a/mhkit/river/resource.py b/mhkit/river/resource.py index c4a0e760c..2a0e06ffd 100644 --- a/mhkit/river/resource.py +++ b/mhkit/river/resource.py @@ -1,20 +1,21 @@ -import pandas as pd +import xarray as xr import numpy as np from scipy.stats import linregress as _linregress from scipy.stats import rv_histogram as _rv_histogram +from mhkit.utils import convert_to_dataarray def Froude_number(v, h, g=9.80665): """ Calculate the Froude Number of the river, channel or duct flow, to check subcritical flow assumption (if Fr <1). - + Parameters ------------ - v : int/float + v : int/float Average velocity [m/s]. h : int/float - Mean hydrolic depth float [m]. + Mean hydraulic depth float [m]. g : int/float Gravitational acceleration [m/s2]. @@ -24,40 +25,60 @@ def Froude_number(v, h, g=9.80665): Froude Number of the river [unitless]. """ - assert isinstance(v, (int,float)), 'v must be of type int or float' - assert isinstance(h, (int,float)), 'h must be of type int or float' - assert isinstance(g, (int,float)), 'g must be of type int or float' - - Fr = v / np.sqrt( g * h ) - - return Fr + if not isinstance(v, (int, float)): + raise TypeError(f"v must be of type int or float. Got: {type(v)}") + if not isinstance(h, (int, float)): + raise TypeError(f"h must be of type int or float. Got: {type(h)}") + if not isinstance(g, (int, float)): + raise TypeError(f"g must be of type int or float. Got: {type(g)}") + + Fr = v / np.sqrt(g * h) + + return Fr -def exceedance_probability(D): +def exceedance_probability(D, dimension="", to_pandas=True): """ Calculates the exceedance probability - + Parameters ---------- - D : pandas Series - Data indexed by time [datetime or s]. 
- - Returns + D : pandas Series, pandas DataFrame, xarray DataArray, or xarray Dataset + Discharge indexed by time [datetime or s]. + + dimension: string (optional) + Name of the relevant xarray dimension. If not supplied, + defaults to the first dimension. Does not affect pandas input. + + to_pandas: bool (optional) + Flag to output pandas instead of xarray. Default = True. + + Returns ------- - F : pandas DataFrame + F : pandas DataFrame or xarray Dataset Exceedance probability [unitless] indexed by time [datetime or s] - """ - assert isinstance(D, (pd.DataFrame, pd.Series)), 'D must be of type pd.Series' # dataframe allowed for matlab - - if isinstance(D, pd.DataFrame) and len(D.columns) == 1: # for matlab - D = D.squeeze().copy() - - # Calculate exceedence probability (F) - rank = D.rank(method='max', ascending=False) - F = 100* (rank / (len(D)+1) ) - - F = F.to_frame('F') # for matlab - + """ + if not isinstance(dimension, str): + raise TypeError(f"dimension must be of type str. Got: {type(dimension)}") + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. 
Got: {type(to_pandas)}") + + D = convert_to_dataarray(D) + + if dimension == "": + dimension = list(D.coords)[0] + + # Calculate exceedance probability (F) + rank = D.rank(dim=dimension) + rank = len(D[dimension]) - rank + 1 # convert to descending rank + F = 100 * rank / (len(D[dimension]) + 1) + F.name = "F" + + F = F.to_dataset() # for matlab + + if to_pandas: + F = F.to_pandas() + return F @@ -81,7 +102,7 @@ def polynomial_fit(x, y, n): List of polynomial coefficients R2 : float Polynomical fit coeffcient of determination - + """ try: x = np.array(x) @@ -91,132 +112,176 @@ def polynomial_fit(x, y, n): y = np.array(y) except: pass - assert isinstance(x, np.ndarray), 'x must be of type np.ndarray' - assert isinstance(y, np.ndarray), 'y must be of type np.ndarray' - assert isinstance(n, int), 'n must be of type int' - - # Get coeffcients of polynomial of order n + if not isinstance(x, np.ndarray): + raise TypeError(f"x must be of type np.ndarray. Got: {type(x)}") + if not isinstance(y, np.ndarray): + raise TypeError(f"y must be of type np.ndarray. Got: {type(y)}") + if not isinstance(n, int): + raise TypeError(f"n must be of type int. 
Got: {type(n)}") + + # Get coeffcients of polynomial of order n polynomial_coefficients = np.poly1d(np.polyfit(x, y, n)) - + # Calculate the coeffcient of determination - slope, intercept, r_value, p_value, std_err = _linregress(y, polynomial_coefficients(x)) + slope, intercept, r_value, p_value, std_err = _linregress( + y, polynomial_coefficients(x) + ) R2 = r_value**2 - + return polynomial_coefficients, R2 - -def discharge_to_velocity(D, polynomial_coefficients): + +def discharge_to_velocity(D, polynomial_coefficients, dimension="", to_pandas=True): """ - Calculates velocity given discharge data and the relationship between + Calculates velocity given discharge data and the relationship between discharge and velocity at an individual turbine - + Parameters ------------ - D : pandas Series + D : numpy ndarray, pandas DataFrame, pandas Series, xarray DataArray, or xarray Dataset Discharge data [m3/s] indexed by time [datetime or s] polynomial_coefficients : numpy polynomial - List of polynomial coefficients that discribe the relationship between + List of polynomial coefficients that describe the relationship between discharge and velocity at an individual turbine - - Returns + dimension: string (optional) + Name of the relevant xarray dimension. If not supplied, + defaults to the first dimension. Does not affect pandas input. + to_pandas: bool (optional) + Flag to output pandas instead of xarray. Default = True. 
+ + Returns ------------ - V: pandas DataFrame + V: pandas DataFrame or xarray Dataset Velocity [m/s] indexed by time [datetime or s] - """ - assert isinstance(D, (pd.DataFrame, pd.Series)), 'D must be of type pd.Series' # dataframe allowed for matlab - assert isinstance(polynomial_coefficients, np.poly1d), 'polynomial_coefficients must be of type np.poly1d' - - if isinstance(D, pd.DataFrame) and len(D.columns) == 1: # for matlab - D = D.squeeze().copy() - + """ + if not isinstance(polynomial_coefficients, np.poly1d): + raise TypeError( + f"polynomial_coefficients must be of type np.poly1d. Got: {type(polynomial_coefficients)}" + ) + if not isinstance(dimension, str): + raise TypeError(f"dimension must be of type str. Got: {type(dimension)}") + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type str. Got: {type(to_pandas)}") + + D = convert_to_dataarray(D) + + if dimension == "": + dimension = list(D.coords)[0] + # Calculate velocity using polynomial - vals = polynomial_coefficients(D) - V = pd.Series(vals, index=D.index) - - V = V.to_frame('V') # for matlab - + V = xr.DataArray( + data=polynomial_coefficients(D), + dims=dimension, + coords={dimension: D[dimension]}, + ) + V.name = "V" + + V = V.to_dataset() # for matlab + + if to_pandas: + V = V.to_pandas() + return V - -def velocity_to_power(V, polynomial_coefficients, cut_in, cut_out): + +def velocity_to_power( + V, polynomial_coefficients, cut_in, cut_out, dimension="", to_pandas=True +): """ - Calculates power given velocity data and the relationship + Calculates power given velocity data and the relationship between velocity and power from an individual turbine - + Parameters ---------- - V : pandas Series + V : numpy ndarray, pandas DataFrame, pandas Series, xarray DataArray, or xarray Dataset Velocity [m/s] indexed by time [datetime or s] polynomial_coefficients : numpy polynomial - List of polynomial coefficients that discribe the relationship between + List of polynomial 
coefficients that describe the relationship between velocity and power at an individual turbine cut_in: int/float Velocity values below cut_in are not used to compute P cut_out: int/float Velocity values above cut_out are not used to compute P - - Returns + dimension: string (optional) + Name of the relevant xarray dimension. If not supplied, + defaults to the first dimension. Does not affect pandas input. + to_pandas: bool (optional) + Flag to output pandas instead of xarray. Default = True. + + Returns ------- - P : pandas DataFrame + P : pandas DataFrame or xarray Dataset Power [W] indexed by time [datetime or s] - """ - assert isinstance(V, (pd.DataFrame, pd.Series)), 'V must be of type pd.Series' # dataframe allowed for matlab - assert isinstance(polynomial_coefficients, np.poly1d), 'polynomial_coefficients must be of type np.poly1d' - assert isinstance(cut_in, (int,float)), 'cut_in must be of type int or float' - assert isinstance(cut_out, (int,float)), 'cut_out must be of type int or float' - - if isinstance(V, pd.DataFrame) and len(V.columns) == 1: - V = V.squeeze().copy() - - # Calculate power using tranfer function and FDC - vals = polynomial_coefficients(V) - + """ + if not isinstance(polynomial_coefficients, np.poly1d): + raise TypeError( + f"polynomial_coefficients must be of type np.poly1d. Got: {type(polynomial_coefficients)}" + ) + if not isinstance(cut_in, (int, float)): + raise TypeError(f"cut_in must be of type int or float. Got: {type(cut_in)}") + if not isinstance(cut_out, (int, float)): + raise TypeError(f"cut_out must be of type int or float. Got: {type(cut_out)}") + if not isinstance(dimension, str): + raise TypeError(f"dimension must be of type str. Got: {type(dimension)}") + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type str. 
Got: {type(to_pandas)}") + + V = convert_to_dataarray(V) + + if dimension == "": + dimension = list(V.coords)[0] + + # Calculate velocity using polynomial + power = polynomial_coefficients(V) + # Power for velocity values outside lower and upper bounds Turbine produces 0 power - vals[V < cut_in] = 0. - vals[V > cut_out] = 0. + power[V < cut_in] = 0.0 + power[V > cut_out] = 0.0 + + P = xr.DataArray(data=power, dims=dimension, coords={dimension: V[dimension]}) + P.name = "P" + + P = P.to_dataset() + + if to_pandas: + P = P.to_pandas() - P = pd.Series(vals, index=V.index) - - P = P.to_frame('P') # for matlab - return P def energy_produced(P, seconds): """ Returns the energy produced for a given time period provided - exceedence probability and power. - + exceedance probability and power. + Parameters ---------- - P : pandas Series + P : numpy ndarray, pandas DataFrame, pandas Series, xarray DataArray, or xarray Dataset Power [W] indexed by time [datetime or s] seconds: int or float Seconds in the time period of interest - + Returns ------- E : float - Energy [J] produced in the given time frame + Energy [J] produced in the given length of time """ - assert isinstance(P, (pd.DataFrame, pd.Series)), 'D must be of type pd.Series' # dataframe allowed for matlab - assert isinstance(seconds, (int, float)), 'seconds must be of type int or float' + if not isinstance(seconds, (int, float)): + raise TypeError(f"seconds must be of type int or float. 
Got: {type(seconds)}") + + P = convert_to_dataarray(P) - if isinstance(P, pd.DataFrame) and len(P.columns) == 1: # for matlab - P = P.squeeze().copy() - # Calculate Histogram of power - H, edges = np.histogram(P, 100 ) + H, edges = np.histogram(P, 100) # Create a distribution - hist_dist = _rv_histogram([H,edges]) + hist_dist = _rv_histogram([H, edges]) # Sample range for pdf - x = np.linspace(edges.min(),edges.max(),1000) + x = np.linspace(edges.min(), edges.max(), 1000) # Calculate the expected value of Power - expected_val_of_power = np.trapz(x*hist_dist.pdf(x),x=x) + expected_val_of_power = np.trapz(x * hist_dist.pdf(x), x=x) # Note: Built-in Expected Value method often throws warning - #EV = hist_dist.expect(lb=edges.min(), ub=edges.max()) + # EV = hist_dist.expect(lb=edges.min(), ub=edges.max()) # Energy - E = seconds * expected_val_of_power - - return E + E = seconds * expected_val_of_power + return E diff --git a/mhkit/tests/dolfyn/base.py b/mhkit/tests/dolfyn/base.py index 13327baa4..780b9688c 100644 --- a/mhkit/tests/dolfyn/base.py +++ b/mhkit/tests/dolfyn/base.py @@ -7,15 +7,16 @@ def rfnm(filename): testdir = dirname(abspath(__file__)) - datadir = normpath(join(testdir, relpath( - '../../../examples/data/dolfyn/test_data/'))) - return datadir + '/' + filename + datadir = normpath( + join(testdir, relpath("../../../examples/data/dolfyn/test_data/")) + ) + return datadir + "/" + filename def exdt(filename): testdir = dirname(abspath(__file__)) - exdir = normpath(join(testdir, relpath('../../../examples/data/dolfyn/'))) - return exdir + '/' + filename + exdir = normpath(join(testdir, relpath("../../../examples/data/dolfyn/"))) + return exdir + "/" + filename def assert_allclose(dat0, dat1, *args, **kwargs): @@ -30,8 +31,9 @@ def assert_allclose(dat0, dat1, *args, **kwargs): _assert_allclose(dat0, dat1, *args, **kwargs) # Check attributes for nm in dat0.attrs: - assert dat0.attrs[nm] == dat1.attrs[nm], "The " + \ - nm + " attribute does not match." 
+ assert dat0.attrs[nm] == dat1.attrs[nm], ( + "The " + nm + " attribute does not match." + ) # If test debugging for v in names: dat0[v] = time.epoch2dt64(dat0[v]) @@ -46,9 +48,9 @@ def save_netcdf(data, name, *args, **kwargs): io.save(data, rfnm(name), *args, **kwargs) -def load_matlab(name, *args, **kwargs): +def load_matlab(name, *args, **kwargs): return io.load_mat(rfnm(name), *args, **kwargs) -def save_matlab(data, name, *args, **kwargs): +def save_matlab(data, name, *args, **kwargs): io.save_mat(data, rfnm(name), *args, **kwargs) diff --git a/mhkit/tests/dolfyn/test_analysis.py b/mhkit/tests/dolfyn/test_analysis.py index f75d5e952..da10f5449 100644 --- a/mhkit/tests/dolfyn/test_analysis.py +++ b/mhkit/tests/dolfyn/test_analysis.py @@ -1,5 +1,9 @@ from . import test_read_adp as tr, test_read_adv as tv -from mhkit.tests.dolfyn.base import load_netcdf as load, save_netcdf as save, assert_allclose +from mhkit.tests.dolfyn.base import ( + load_netcdf as load, + save_netcdf as save, + assert_allclose, +) from mhkit.dolfyn import VelBinner, read_example import mhkit.dolfyn.adv.api as avm import mhkit.dolfyn.adp.api as apm @@ -15,14 +19,14 @@ class analysis_testcase(unittest.TestCase): @classmethod def setUpClass(self): self.adv1 = tv.dat.copy(deep=True) - self.adv2 = read_example('vector_burst_mode01.VEC', nens=90) + self.adv2 = read_example("vector_burst_mode01.VEC", nens=90) self.adv_tool = VelBinner(n_bin=self.adv1.fs, fs=self.adv1.fs) self.adp = tr.dat_sig.copy(deep=True) with pytest.warns(UserWarning): - self.adp_tool = VelBinner(n_bin=self.adp.fs*20, - fs=self.adp.fs, - n_fft=self.adp.fs*40) + self.adp_tool = VelBinner( + n_bin=self.adp.fs * 20, fs=self.adp.fs, n_fft=self.adp.fs * 40 + ) @classmethod def tearDownClass(self): @@ -33,19 +37,19 @@ def test_do_func(self): ds_vec = self.adv_tool.bin_variance(self.adv1, out_ds=ds_vec) # test non-integer bin sizes - mean_test = self.adv_tool.mean(self.adv1['vel'].values, n_bin=ds_vec.fs*1.01) + mean_test = 
self.adv_tool.mean(self.adv1["vel"].values, n_bin=ds_vec.fs * 1.01) ds_sig = self.adp_tool.bin_average(self.adp) ds_sig = self.adp_tool.bin_variance(self.adp, out_ds=ds_sig) if make_data: - save(ds_vec, 'vector_data01_avg.nc') - save(ds_sig, 'BenchFile01_avg.nc') + save(ds_vec, "vector_data01_avg.nc") + save(ds_sig, "BenchFile01_avg.nc") return - assert np.sum(mean_test-ds_vec.vel.values) == 0, "Mean test failed" - assert_allclose(ds_vec, load('vector_data01_avg.nc'), atol=1e-6) - assert_allclose(ds_sig, load('BenchFile01_avg.nc'), atol=1e-6) + assert np.sum(mean_test - ds_vec.vel.values) == 0, "Mean test failed" + assert_allclose(ds_vec, load("vector_data01_avg.nc"), atol=1e-6) + assert_allclose(ds_sig, load("BenchFile01_avg.nc"), atol=1e-6) def test_calc_func(self): c = self.adv_tool @@ -54,94 +58,144 @@ def test_calc_func(self): test_ds = type(self.adv1)() test_ds_adp = type(self.adp)() - test_ds['acov'] = c.autocovariance(self.adv1.vel) - test_ds['tke_vec_detrend'] = c.turbulent_kinetic_energy( - self.adv1.vel, detrend=True) - test_ds['tke_vec_demean'] = c.turbulent_kinetic_energy( - self.adv1.vel, detrend=False) - test_ds['psd'] = c.power_spectral_density( - self.adv1.vel, freq_units='Hz') + test_ds["acov"] = c.autocovariance(self.adv1.vel) + test_ds["tke_vec_detrend"] = c.turbulent_kinetic_energy( + self.adv1.vel, detrend=True + ) + test_ds["tke_vec_demean"] = c.turbulent_kinetic_energy( + self.adv1.vel, detrend=False + ) + test_ds["psd"] = c.power_spectral_density(self.adv1.vel, freq_units="Hz") # Test ADCP single vector spectra, cross-spectra to test radians code - test_ds_adp['psd_b5'] = c2.power_spectral_density( - self.adp.vel_b5.isel(range_b5=5), freq_units='rad', window='hamm') - test_ds_adp['tke_b5'] = c2.turbulent_kinetic_energy(self.adp.vel_b5) + test_ds_adp["psd_b5"] = c2.power_spectral_density( + self.adp.vel_b5.isel(range_b5=5), freq_units="rad", window="hamm" + ) + test_ds_adp["tke_b5"] = c2.turbulent_kinetic_energy(self.adp.vel_b5) if 
make_data: - save(test_ds, 'vector_data01_func.nc') - save(test_ds_adp, 'BenchFile01_func.nc') + save(test_ds, "vector_data01_func.nc") + save(test_ds_adp, "BenchFile01_func.nc") return - assert_allclose(test_ds, load('vector_data01_func.nc'), atol=1e-6) - assert_allclose(test_ds_adp, load('BenchFile01_func.nc'), atol=1e-6) + assert_allclose(test_ds, load("vector_data01_func.nc"), atol=1e-6) + assert_allclose(test_ds_adp, load("BenchFile01_func.nc"), atol=1e-6) def test_fft_freq(self): - f = self.adv_tool._fft_freq(units='Hz') - omega = self.adv_tool._fft_freq(units='rad/s') + f = self.adv_tool._fft_freq(units="Hz") + omega = self.adv_tool._fft_freq(units="rad/s") - np.testing.assert_equal(f, np.arange(1, 17, 1, dtype='float')) - np.testing.assert_equal(omega, np.arange( - 1, 17, 1, dtype='float')*(2*np.pi)) + np.testing.assert_equal(f, np.arange(1, 17, 1, dtype="float")) + np.testing.assert_equal(omega, np.arange(1, 17, 1, dtype="float") * (2 * np.pi)) def test_adv_turbulence(self): dat = tv.dat.copy(deep=True) bnr = avm.ADVBinner(n_bin=20.0, fs=dat.fs) tdat = bnr(dat) - acov = bnr.autocovariance(dat.vel) - - assert_identical(tdat, avm.turbulence_statistics( - dat, n_bin=20.0, fs=dat.fs)) - - tdat['stress_detrend'] = bnr.reynolds_stress(dat.vel) - tdat['stress_demean'] = bnr.reynolds_stress(dat.vel, detrend=False) - tdat['csd'] = bnr.cross_spectral_density( - dat.vel, freq_units='rad', window='hamm', n_fft_coh=10) - tdat['LT83'] = bnr.dissipation_rate_LT83(tdat.psd, tdat.velds.U_mag) - tdat['SF'] = bnr.dissipation_rate_SF(dat.vel[0], tdat.velds.U_mag) - tdat['TE01'] = bnr.dissipation_rate_TE01(dat, tdat) - tdat['L'] = bnr.integral_length_scales(acov, tdat.velds.U_mag) + acov = bnr.autocovariance(dat["vel"]) + + assert_identical(tdat, avm.turbulence_statistics(dat, n_bin=20.0, fs=dat.fs)) + + tdat["stress_detrend"] = bnr.reynolds_stress(dat["vel"]) + tdat["stress_demean"] = bnr.reynolds_stress(dat["vel"], detrend=False) + tdat["csd"] = bnr.cross_spectral_density( + 
dat["vel"], freq_units="rad", window="hamm", n_fft_coh=10 + ) + tdat["LT83"] = bnr.dissipation_rate_LT83(tdat["psd"], tdat.velds.U_mag) + tdat["noise"] = bnr.doppler_noise_level(tdat["psd"], pct_fN=0.8) + tdat["LT83_noise"] = bnr.dissipation_rate_LT83( + tdat["psd"], tdat.velds.U_mag, noise=tdat["noise"] + ) + tdat["SF"] = bnr.dissipation_rate_SF(dat["vel"][0], tdat.velds.U_mag) + tdat["TE01"] = bnr.dissipation_rate_TE01(dat, tdat) + tdat["L"] = bnr.integral_length_scales(acov, tdat.velds.U_mag) slope_check = bnr.check_turbulence_cascade_slope( - tdat['psd'][-1].mean('time'), freq_range=[10, 100]) + tdat["psd"][-1].mean("time"), freq_range=[10, 100] + ) + tdat["psd_noise"] = bnr.power_spectral_density( + dat["vel"], freq_units="rad", noise=[0.06, 0.04, 0.01] + ) if make_data: - save(tdat, 'vector_data01_bin.nc') + save(tdat, "vector_data01_bin.nc") return assert np.round(slope_check[0].values, 4), 0.1713 - assert_allclose(tdat, load('vector_data01_bin.nc'), atol=1e-6) - + assert_allclose(tdat, load("vector_data01_bin.nc"), atol=1e-6) def test_adcp_turbulence(self): - dat = tr.dat_sig_i.copy(deep=True) - bnr = apm.ADPBinner(n_bin=20.0, fs=dat.fs, diff_style='centered') + dat = tr.dat_sig_tide.copy(deep=True) + dat.velds.rotate2("earth") + dat.attrs["principal_heading"] = apm.calc_principal_heading( + dat.vel.mean("range") + ) + bnr = apm.ADPBinner(n_bin=20.0, fs=dat.fs, diff_style="centered") tdat = bnr.bin_average(dat) - tdat['dudz'] = bnr.dudz(tdat.vel) - tdat['dvdz'] = bnr.dvdz(tdat.vel) - tdat['dwdz'] = bnr.dwdz(tdat.vel) - tdat['tau2'] = bnr.shear_squared(tdat.vel) - tdat['psd'] = bnr.power_spectral_density(dat['vel'].isel( - dir=2, range=len(dat.range)//2), freq_units='Hz') - tdat['noise'] = bnr.doppler_noise_level(tdat['psd'], pct_fN=0.8) - tdat['stress_vec4'] = bnr.reynolds_stress_4beam( - dat, noise=tdat['noise'], orientation='up', beam_angle=25) - tdat['tke_vec5'], tdat['stress_vec5'] = bnr.stress_tensor_5beam( - dat, noise=tdat['noise'], orientation='up', 
beam_angle=25, tke_only=False) - tdat['tke'] = bnr.total_turbulent_kinetic_energy( - dat, noise=tdat['noise'], orientation='up', beam_angle=25) + + tdat["dudz"] = bnr.dudz(tdat["vel"]) + tdat["dvdz"] = bnr.dvdz(tdat["vel"]) + tdat["dwdz"] = bnr.dwdz(tdat["vel"]) + tdat["tau2"] = bnr.shear_squared(tdat["vel"]) + tdat["I"] = tdat.velds.I + tdat["ti"] = bnr.turbulence_intensity(dat.velds.U_mag, detrend=False) + dat.velds.rotate2("beam") + + tdat["psd"] = bnr.power_spectral_density( + dat["vel"].isel(dir=2, range=len(dat.range) // 2), freq_units="Hz" + ) + tdat["noise"] = bnr.doppler_noise_level(tdat["psd"], pct_fN=0.8) + tdat["stress_vec4"] = bnr.reynolds_stress_4beam( + dat, noise=tdat["noise"], orientation="up", beam_angle=25 + ) + tdat["tke_vec5"], tdat["stress_vec5"] = bnr.stress_tensor_5beam( + dat, noise=tdat["noise"], orientation="up", beam_angle=25, tke_only=False + ) + tdat["tke"] = bnr.total_turbulent_kinetic_energy( + dat, noise=tdat["noise"], orientation="up", beam_angle=25 + ) + tdat["ti_noise"] = bnr.turbulence_intensity( + dat.velds.U_mag, detrend=False, noise=tdat["noise"] + ) # This is "negative" for this code check - tdat['wpwp'] = bnr.turbulent_kinetic_energy(dat['vel_b5'], noise=tdat['noise']) - tdat['dissipation_rate_LT83'] = bnr.dissipation_rate_LT83( - tdat['psd'], tdat.velds.U_mag.isel(range=len(dat.range)//2), freq_range=[0.2, 0.4]) - tdat['dissipation_rate_SF'], tdat['noise_SF'], tdat['D_SF'] = bnr.dissipation_rate_SF( - dat.vel.isel(dir=2), r_range=[1, 5]) - tdat['friction_vel'] = bnr.friction_velocity( - tdat, upwp_=tdat['stress_vec5'].sel(tau='upwp_'), z_inds=slice(1, 5), H=50) + tdat["wpwp"] = bnr.turbulent_kinetic_energy(dat["vel_b5"], noise=tdat["noise"]) + tdat["dissipation_rate_LT83"] = bnr.dissipation_rate_LT83( + tdat["psd"], + tdat.velds.U_mag.isel(range=len(dat.range) // 2), + freq_range=[0.2, 0.4], + ) + tdat["dissipation_rate_LT83_noise"] = bnr.dissipation_rate_LT83( + tdat["psd"], + tdat.velds.U_mag.isel(range=len(dat.range) // 
2), + freq_range=[0.2, 0.4], + noise=tdat["noise"], + ) + ( + tdat["dissipation_rate_SF"], + tdat["noise_SF"], + tdat["D_SF"], + ) = bnr.dissipation_rate_SF(dat.vel.isel(dir=2), r_range=[1, 5]) + tdat["friction_vel"] = bnr.friction_velocity( + tdat, upwp_=tdat["stress_vec5"].sel(tau="upwp_"), z_inds=slice(1, 5), H=50 + ) slope_check = bnr.check_turbulence_cascade_slope( - tdat['psd'].mean('time'), freq_range=[0.4, 4]) + tdat["psd"].mean("time"), freq_range=[0.4, 4] + ) + tdat["psd_noise"] = bnr.power_spectral_density( + dat["vel"].isel(dir=2, range=len(dat.range) // 2), + freq_units="Hz", + noise=0.01, + ) if make_data: - save(tdat, 'Sig1000_IMU_bin.nc') + save(tdat, "Sig1000_tidal_bin.nc") return + with pytest.raises(Exception): + bnr.calc_psd(dat["vel"], freq_units="Hz", noise=0.01) + + with pytest.raises(Exception): + bnr.calc_psd(dat["vel"][0], freq_units="Hz", noise=0.01) + assert np.round(slope_check[0].values, 4), -1.0682 - assert_allclose(tdat, load('Sig1000_IMU_bin.nc'), atol=1e-6) + + assert_allclose(tdat, load("Sig1000_tidal_bin.nc"), atol=1e-6) diff --git a/mhkit/tests/dolfyn/test_api.py b/mhkit/tests/dolfyn/test_api.py index 57320cb71..272ff1215 100644 --- a/mhkit/tests/dolfyn/test_api.py +++ b/mhkit/tests/dolfyn/test_api.py @@ -3,22 +3,24 @@ make_data = False -vec = load('vector_data01.nc') -sig = load('BenchFile01.nc') -rdi = load('RDI_test01.nc') +vec = load("vector_data01.nc") +sig = load("BenchFile01.nc") +rdi = load("RDI_test01.nc") class api_testcase(unittest.TestCase): def test_repr(self): _str = [] - for dat, fnm in [(vec, rfnm('vector_data01.repr.txt')), - (sig, rfnm('BenchFile01.repr.txt')), - (rdi, rfnm('RDI_test01.repr.txt')), ]: + for dat, fnm in [ + (vec, rfnm("vector_data01.repr.txt")), + (sig, rfnm("BenchFile01.repr.txt")), + (rdi, rfnm("RDI_test01.repr.txt")), + ]: _str = dat.velds.__repr__() if make_data: - with open(fnm, 'w') as fl: + with open(fnm, "w") as fl: fl.write(_str) else: - with open(fnm, 'r') as fl: + with open(fnm, "r") 
as fl: test_str = fl.read() assert test_str == _str diff --git a/mhkit/tests/dolfyn/test_clean.py b/mhkit/tests/dolfyn/test_clean.py index e237bd569..17c3d3f3e 100644 --- a/mhkit/tests/dolfyn/test_clean.py +++ b/mhkit/tests/dolfyn/test_clean.py @@ -15,50 +15,48 @@ def test_GN2002(self): td_imu = tv.dat_imu.copy(deep=True) mask = avm.clean.GN2002(td.vel, npt=20) - td['vel'] = avm.clean.clean_fill( - td.vel, mask, method='cubic', maxgap=6) - td['vel_clean_1D'] = avm.clean.fill_nan_ensemble_mean( - td.vel[0], mask[0], fs=1, window=45) - td['vel_clean_2D'] = avm.clean.fill_nan_ensemble_mean( - td.vel, mask, fs=1, window=45) + td["vel"] = avm.clean.clean_fill(td.vel, mask, method="cubic", maxgap=6) + td["vel_clean_1D"] = avm.clean.fill_nan_ensemble_mean( + td.vel[0], mask[0], fs=1, window=45 + ) + td["vel_clean_2D"] = avm.clean.fill_nan_ensemble_mean( + td.vel, mask, fs=1, window=45 + ) mask = avm.clean.GN2002(td_imu.vel, npt=20) - td_imu['vel'] = avm.clean.clean_fill( - td_imu.vel, mask, method='cubic', maxgap=6) + td_imu["vel"] = avm.clean.clean_fill(td_imu.vel, mask, method="cubic", maxgap=6) if make_data: - save(td, 'vector_data01_GN.nc') - save(td_imu, 'vector_data_imu01_GN.nc') + save(td, "vector_data01_GN.nc") + save(td_imu, "vector_data_imu01_GN.nc") return - assert_allclose(td, load('vector_data01_GN.nc'), atol=1e-6) - assert_allclose(td_imu, load('vector_data_imu01_GN.nc'), atol=1e-6) + assert_allclose(td, load("vector_data01_GN.nc"), atol=1e-6) + assert_allclose(td_imu, load("vector_data_imu01_GN.nc"), atol=1e-6) def test_spike_thresh(self): td = tv.dat_imu.copy(deep=True) mask = avm.clean.spike_thresh(td.vel, thresh=10) - td['vel'] = avm.clean.clean_fill( - td.vel, mask, method='cubic', maxgap=6) + td["vel"] = avm.clean.clean_fill(td.vel, mask, method="cubic", maxgap=6) if make_data: - save(td, 'vector_data01_sclean.nc') + save(td, "vector_data01_sclean.nc") return - assert_allclose(td, load('vector_data01_sclean.nc'), atol=1e-6) + assert_allclose(td, 
load("vector_data01_sclean.nc"), atol=1e-6) def test_range_limit(self): td = tv.dat_imu.copy(deep=True) mask = avm.clean.range_limit(td.vel) - td['vel'] = avm.clean.clean_fill( - td.vel, mask, method='cubic', maxgap=6) + td["vel"] = avm.clean.clean_fill(td.vel, mask, method="cubic", maxgap=6) if make_data: - save(td, 'vector_data01_rclean.nc') + save(td, "vector_data01_rclean.nc") return - assert_allclose(td, load('vector_data01_rclean.nc'), atol=1e-6) + assert_allclose(td, load("vector_data01_rclean.nc"), atol=1e-6) def test_clean_upADCP(self): td_awac = tp.dat_awac.copy(deep=True) @@ -73,22 +71,22 @@ def test_clean_upADCP(self): td_sig = apm.clean.correlation_filter(td_sig, thresh=50) if make_data: - save(td_awac, 'AWAC_test01_clean.nc') - save(td_sig, 'Sig1000_tidal_clean.nc') + save(td_awac, "AWAC_test01_clean.nc") + save(td_sig, "Sig1000_tidal_clean.nc") return - assert_allclose(td_awac, load('AWAC_test01_clean.nc'), atol=1e-6) - assert_allclose(td_sig, load('Sig1000_tidal_clean.nc'), atol=1e-6) + assert_allclose(td_awac, load("AWAC_test01_clean.nc"), atol=1e-6) + assert_allclose(td_sig, load("Sig1000_tidal_clean.nc"), atol=1e-6) def test_clean_downADCP(self): td = tp.dat_sig_ie.copy(deep=True) # First remove bad data - td['vel'] = apm.clean.val_exceeds_thresh(td.vel, thresh=3) - td['vel'] = apm.clean.fillgaps_time(td.vel) - td['vel_b5'] = apm.clean.fillgaps_time(td.vel_b5) - td['vel'] = apm.clean.fillgaps_depth(td.vel) - td['vel_b5'] = apm.clean.fillgaps_depth(td.vel_b5) + td["vel"] = apm.clean.val_exceeds_thresh(td.vel, thresh=3) + td["vel"] = apm.clean.fillgaps_time(td.vel) + td["vel_b5"] = apm.clean.fillgaps_time(td.vel_b5) + td["vel"] = apm.clean.fillgaps_depth(td.vel) + td["vel_b5"] = apm.clean.fillgaps_depth(td.vel_b5) # Then clean below seabed apm.clean.set_range_offset(td, 0.5) @@ -96,24 +94,24 @@ def test_clean_downADCP(self): td = apm.clean.nan_beyond_surface(td) if make_data: - save(td, 'Sig500_Echo_clean.nc') + save(td, "Sig500_Echo_clean.nc") 
return - assert_allclose(td, load('Sig500_Echo_clean.nc'), atol=1e-6) + assert_allclose(td, load("Sig500_Echo_clean.nc"), atol=1e-6) def test_orient_filter(self): td_sig = tp.dat_sig_i.copy(deep=True) td_sig = apm.clean.medfilt_orient(td_sig) - apm.rotate2(td_sig, 'earth', inplace=True) + apm.rotate2(td_sig, "earth", inplace=True) td_rdi = tp.dat_rdi.copy(deep=True) td_rdi = apm.clean.medfilt_orient(td_rdi) - apm.rotate2(td_rdi, 'earth', inplace=True) + apm.rotate2(td_rdi, "earth", inplace=True) if make_data: - save(td_sig, 'Sig1000_IMU_ofilt.nc') - save(td_rdi, 'RDI_test01_ofilt.nc') + save(td_sig, "Sig1000_IMU_ofilt.nc") + save(td_rdi, "RDI_test01_ofilt.nc") return - assert_allclose(td_sig, load('Sig1000_IMU_ofilt.nc'), atol=1e-6) - assert_allclose(td_rdi, load('RDI_test01_ofilt.nc'), atol=1e-6) + assert_allclose(td_sig, load("Sig1000_IMU_ofilt.nc"), atol=1e-6) + assert_allclose(td_rdi, load("RDI_test01_ofilt.nc"), atol=1e-6) diff --git a/mhkit/tests/dolfyn/test_motion.py b/mhkit/tests/dolfyn/test_motion.py index 47c193a95..e066058e0 100644 --- a/mhkit/tests/dolfyn/test_motion.py +++ b/mhkit/tests/dolfyn/test_motion.py @@ -3,7 +3,11 @@ from mhkit.dolfyn.adv.motion import correct_motion from . 
import test_read_adv as tv -from mhkit.tests.dolfyn.base import load_netcdf as load, save_netcdf as save, assert_allclose +from mhkit.tests.dolfyn.base import ( + load_netcdf as load, + save_netcdf as save, + assert_allclose, +) from mhkit.dolfyn.adv import api from mhkit.dolfyn.io.api import read_example as read import unittest @@ -29,50 +33,49 @@ def test_motion_adv(self): tdm0 = tv.dat_imu.copy(deep=True) tdm0.velds.set_declination(0.0, inplace=True) tdm0 = api.correct_motion(tdm0) - tdm0.attrs.pop('declination') - tdm0.attrs.pop('declination_in_orientmat') + tdm0.attrs.pop("declination") + tdm0.attrs.pop("declination_in_orientmat") # test motion-corrected data rotation tdmE = tv.dat_imu.copy(deep=True) tdmE.velds.set_declination(10.0, inplace=True) - tdmE.velds.rotate2('earth', inplace=True) + tdmE.velds.rotate2("earth", inplace=True) tdmE = api.correct_motion(tdmE) # ensure trailing nans are removed from AHRS data - ahrs = read('vector_data_imu01.VEC', userdata=True) - for var in ['accel', 'angrt', 'mag']: - assert not ahrs[var].isnull().any( - ), "nan's in {} variable".format(var) + ahrs = read("vector_data_imu01.VEC", userdata=True) + for var in ["accel", "angrt", "mag"]: + assert not ahrs[var].isnull().any(), "nan's in {} variable".format(var) if make_data: - save(tdm, 'vector_data_imu01_mc.nc') - save(tdm10, 'vector_data_imu01_mcDeclin10.nc') - save(tdmj, 'vector_data_imu01-json_mc.nc') + save(tdm, "vector_data_imu01_mc.nc") + save(tdm10, "vector_data_imu01_mcDeclin10.nc") + save(tdmj, "vector_data_imu01-json_mc.nc") return - cdm10 = load('vector_data_imu01_mcDeclin10.nc') + cdm10 = load("vector_data_imu01_mcDeclin10.nc") - assert_allclose(tdm, load('vector_data_imu01_mc.nc'), atol=1e-7) + assert_allclose(tdm, load("vector_data_imu01_mc.nc"), atol=1e-7) assert_allclose(tdm10, tdmj, atol=1e-7) assert_allclose(tdm0, tdm, atol=1e-7) assert_allclose(tdm10, cdm10, atol=1e-7) assert_allclose(tdmE, cdm10, atol=1e-7) - assert_allclose(tdmj, 
load('vector_data_imu01-json_mc.nc'), atol=1e-7) + assert_allclose(tdmj, load("vector_data_imu01-json_mc.nc"), atol=1e-7) def test_sep_probes(self): tdm = tv.dat_imu.copy(deep=True) tdm = api.correct_motion(tdm, separate_probes=True) if make_data: - save(tdm, 'vector_data_imu01_mcsp.nc') + save(tdm, "vector_data_imu01_mcsp.nc") return - assert_allclose(tdm, load('vector_data_imu01_mcsp.nc'), atol=1e-7) + assert_allclose(tdm, load("vector_data_imu01_mcsp.nc"), atol=1e-7) def test_duty_cycle(self): - tdc = load('vector_duty_cycle.nc') + tdc = load("vector_duty_cycle.nc") tdc.velds.set_inst2head_rotmat(np.eye(3)) - tdc.attrs['inst2head_vec'] = [0.5, 0, 0.1] + tdc.attrs["inst2head_vec"] = [0.5, 0, 0.1] # with duty cycle code td = correct_motion(tdc, accel_filtfreq=0.03, to_earth=False) @@ -80,16 +83,16 @@ def test_duty_cycle(self): # Wrapped function n_burst = 50 - n_ensembles = len(tdc.time)//n_burst + n_ensembles = len(tdc.time) // n_burst cd = xr.Dataset() - tdc.attrs.pop('duty_cycle_n_burst') + tdc.attrs.pop("duty_cycle_n_burst") for i in range(n_ensembles): - cd0 = tdc.isel(time=slice(n_burst*i, n_burst*i+n_burst)) + cd0 = tdc.isel(time=slice(n_burst * i, n_burst * i + n_burst)) cd0 = correct_motion(cd0, accel_filtfreq=0.03, to_earth=False) - cd = xr.merge((cd, cd0), combine_attrs='no_conflicts') - cd.attrs['duty_cycle_n_burst'] = n_burst + cd = xr.merge((cd, cd0), combine_attrs="no_conflicts") + cd.attrs["duty_cycle_n_burst"] = n_burst - cd_ENU = cd.velds.rotate2('earth', inplace=False) + cd_ENU = cd.velds.rotate2("earth", inplace=False) assert_allclose(td, cd, atol=1e-7) assert_allclose(td_ENU, cd_ENU, atol=1e-7) diff --git a/mhkit/tests/dolfyn/test_orient.py b/mhkit/tests/dolfyn/test_orient.py index 72afb4e92..1cee3aed4 100644 --- a/mhkit/tests/dolfyn/test_orient.py +++ b/mhkit/tests/dolfyn/test_orient.py @@ -8,12 +8,25 @@ def check_hpr(h, p, r, omatin): omat = euler2orient(h, p, r) - assert_allclose(omat, omatin, atol=1e-13, err_msg='Orientation matrix 
different than expected!\nExpected:\n{}\nGot:\n{}' - .format(np.array(omatin), omat)) + assert_allclose( + omat, + omatin, + atol=1e-13, + err_msg="Orientation matrix different than expected!\nExpected:\n{}\nGot:\n{}".format( + np.array(omatin), omat + ), + ) hpr = orient2euler(omat) - assert_allclose(hpr, [h, p, r], atol=1e-13, err_msg="Angles different than specified, orient2euler and euler2orient are " - "antisymmetric!\nExpected:\n{}\nGot:\n{}" - .format(hpr, np.array([h, p, r]), )) + assert_allclose( + hpr, + [h, p, r], + atol=1e-13, + err_msg="Angles different than specified, orient2euler and euler2orient are " + "antisymmetric!\nExpected:\n{}\nGot:\n{}".format( + hpr, + np.array([h, p, r]), + ), + ) class orient_testcase(unittest.TestCase): @@ -42,67 +55,133 @@ def test_hpr_defs(self): DOCUMENTATION. """ - check_hpr(0, 0, 0, [[0, 1, 0], - [-1, 0, 0], - [0, 0, 1], ]) - - check_hpr(90, 0, 0, [[1, 0, 0], - [0, 1, 0], - [0, 0, 1], ]) - - check_hpr(90, 0, 90, [[1, 0, 0], - [0, 0, 1], - [0, -1, 0], ]) - - sq2 = 1. 
/ np.sqrt(2) - check_hpr(45, 0, 0, [[sq2, sq2, 0], - [-sq2, sq2, 0], - [0, 0, 1], ]) - - check_hpr(0, 45, 0, [[0, sq2, sq2], - [-1, 0, 0], - [0, -sq2, sq2], ]) - - check_hpr(0, 0, 45, [[0, 1, 0], - [-sq2, 0, sq2], - [sq2, 0, sq2], ]) - - check_hpr(90, 45, 90, [[sq2, 0, sq2], - [-sq2, 0, sq2], - [0, -1, 0], ]) + check_hpr( + 0, + 0, + 0, + [ + [0, 1, 0], + [-1, 0, 0], + [0, 0, 1], + ], + ) + + check_hpr( + 90, + 0, + 0, + [ + [1, 0, 0], + [0, 1, 0], + [0, 0, 1], + ], + ) + + check_hpr( + 90, + 0, + 90, + [ + [1, 0, 0], + [0, 0, 1], + [0, -1, 0], + ], + ) + + sq2 = 1.0 / np.sqrt(2) + check_hpr( + 45, + 0, + 0, + [ + [sq2, sq2, 0], + [-sq2, sq2, 0], + [0, 0, 1], + ], + ) + + check_hpr( + 0, + 45, + 0, + [ + [0, sq2, sq2], + [-1, 0, 0], + [0, -sq2, sq2], + ], + ) + + check_hpr( + 0, + 0, + 45, + [ + [0, 1, 0], + [-sq2, 0, sq2], + [sq2, 0, sq2], + ], + ) + + check_hpr( + 90, + 45, + 90, + [ + [sq2, 0, sq2], + [-sq2, 0, sq2], + [0, -1, 0], + ], + ) c30 = np.cos(np.deg2rad(30)) s30 = np.sin(np.deg2rad(30)) - check_hpr(30, 0, 0, [[s30, c30, 0], - [-c30, s30, 0], - [0, 0, 1], ]) + check_hpr( + 30, + 0, + 0, + [ + [s30, c30, 0], + [-c30, s30, 0], + [0, 0, 1], + ], + ) def test_pr_declination(self): # Test to confirm that pitch and roll don't change when you set # declination declin = 15.37 - dat = load('vector_data_imu01.nc') - h0, p0, r0 = orient2euler(dat['orientmat'].values) + dat = load("vector_data_imu01.nc") + h0, p0, r0 = orient2euler(dat["orientmat"].values) set_declination(dat, declin, inplace=True) - h1, p1, r1 = orient2euler(dat['orientmat'].values) - - assert_allclose(p0, p1, atol=1e-5, - err_msg="Pitch changes when setting declination") - assert_allclose(r0, r1, atol=1e-5, - err_msg="Roll changes when setting declination") - assert_allclose(h0 + declin, h1, atol=1e-5, err_msg="incorrect heading change when " - "setting declination") + h1, p1, r1 = orient2euler(dat["orientmat"].values) + + assert_allclose( + p0, p1, atol=1e-5, err_msg="Pitch changes when setting 
declination" + ) + assert_allclose( + r0, r1, atol=1e-5, err_msg="Roll changes when setting declination" + ) + assert_allclose( + h0 + declin, + h1, + atol=1e-5, + err_msg="incorrect heading change when " "setting declination", + ) def test_q_hpr(self): - dat = load('Sig1000_IMU.nc') + dat = load("Sig1000_IMU.nc") dcm = quaternion2orient(dat.quaternions) - assert_allclose(dat.orientmat, dcm, atol=5e-4, - err_msg="Disagreement b/t quaternion-calc'd & HPR-calc'd orientmat") + assert_allclose( + dat.orientmat, + dcm, + atol=5e-4, + err_msg="Disagreement b/t quaternion-calc'd & HPR-calc'd orientmat", + ) -if __name__ == '__main__': +if __name__ == "__main__": unittest.main() diff --git a/mhkit/tests/dolfyn/test_read_adp.py b/mhkit/tests/dolfyn/test_read_adp.py index cfd7f306b..a64fca546 100644 --- a/mhkit/tests/dolfyn/test_read_adp.py +++ b/mhkit/tests/dolfyn/test_read_adp.py @@ -12,58 +12,63 @@ load = tb.load_netcdf save = tb.save_netcdf -dat_rdi = load('RDI_test01.nc') -dat_rdi_7f79 = load('RDI_7f79.nc') -dat_rdi_bt = load('RDI_withBT.nc') -dat_vm_ws = load('vmdas01_wh.nc') -dat_vm_os = load('vmdas02_os.nc') -dat_wr1 = load('winriver01.nc') -dat_wr2 = load('winriver02.nc') -dat_rp = load('RiverPro_test01.nc') -dat_trsc = load('winriver02_transect.nc') - -dat_awac = load('AWAC_test01.nc') -dat_awac_ud = load('AWAC_test01_ud.nc') -dat_hwac = load('H-AWAC_test01.nc') -dat_sig = load('BenchFile01.nc') -dat_sig_i = load('Sig1000_IMU.nc') -dat_sig_i_ud = load('Sig1000_IMU_ud.nc') -dat_sig_ieb = load('VelEchoBT01.nc') -dat_sig_ie = load('Sig500_Echo.nc') -dat_sig_tide = load('Sig1000_tidal.nc') -dat_sig_skip = load('Sig_SkippedPings01.nc') -dat_sig_badt = load('Sig1000_BadTime01.nc') -dat_sig5_leiw = load('Sig500_last_ensemble_is_whole.nc') +dat_rdi = load("RDI_test01.nc") +dat_rdi_7f79 = load("RDI_7f79.nc") +dat_rdi_7f79_2 = load("RDI_7f79_2.nc") +dat_rdi_bt = load("RDI_withBT.nc") +dat_vm_ws = load("vmdas01_wh.nc") +dat_vm_os = load("vmdas02_os.nc") +dat_wr1 = 
load("winriver01.nc") +dat_wr2 = load("winriver02.nc") +dat_rp = load("RiverPro_test01.nc") +dat_trsc = load("winriver02_transect.nc") + +dat_awac = load("AWAC_test01.nc") +dat_awac_ud = load("AWAC_test01_ud.nc") +dat_hwac = load("H-AWAC_test01.nc") +dat_sig = load("BenchFile01.nc") +dat_sig_i = load("Sig1000_IMU.nc") +dat_sig_i_ud = load("Sig1000_IMU_ud.nc") +dat_sig_ieb = load("VelEchoBT01.nc") +dat_sig_ie = load("Sig500_Echo.nc") +dat_sig_tide = load("Sig1000_tidal.nc") +dat_sig_skip = load("Sig_SkippedPings01.nc") +dat_sig_badt = load("Sig1000_BadTime01.nc") +dat_sig5_leiw = load("Sig500_last_ensemble_is_whole.nc") +dat_sig_dp2 = load("dual_profile.nc") class io_adp_testcase(unittest.TestCase): def test_io_rdi(self): - warnings.simplefilter('ignore', UserWarning) + warnings.simplefilter("ignore", UserWarning) nens = 100 - td_rdi = read('RDI_test01.000') - td_7f79 = read('RDI_7f79.000') - td_rdi_bt = read('RDI_withBT.000', nens=nens) - td_vm = read('vmdas01_wh.ENX', nens=nens) - td_os = read('vmdas02_os.ENR', nens=nens) - td_wr1 = read('winriver01.PD0') - td_wr2 = read('winriver02.PD0') - td_rp = read('RiverPro_test01.PD0', nens=nens) - td_transect = read('winriver02_transect.PD0', nens=nens) + td_rdi = read("RDI_test01.000") + td_7f79 = read("RDI_7f79.000") + td_7f79_2 = read("RDI_7f79_2.000") + td_rdi_bt = read("RDI_withBT.000", nens=nens) + td_vm = read("vmdas01_wh.ENX", nens=nens) + td_os = read("vmdas02_os.ENR", nens=nens) + td_wr1 = read("winriver01.PD0") + td_wr2 = read("winriver02.PD0") + td_rp = read("RiverPro_test01.PD0") + td_transect = read("winriver02_transect.PD0", nens=nens) if make_data: - save(td_rdi, 'RDI_test01.nc') - save(td_7f79, 'RDI_7f79.nc') - save(td_rdi_bt, 'RDI_withBT.nc') - save(td_vm, 'vmdas01_wh.nc') - save(td_os, 'vmdas02_os.nc') - save(td_wr1, 'winriver01.nc') - save(td_wr2, 'winriver02.nc') - save(td_rp, 'RiverPro_test01.nc') - save(td_transect, 'winriver02_transect.nc') + save(td_rdi, "RDI_test01.nc") + save(td_7f79, 
"RDI_7f79.nc") + save(td_7f79_2, "RDI_7f79_2.nc") + save(td_rdi_bt, "RDI_withBT.nc") + save(td_vm, "vmdas01_wh.nc") + save(td_os, "vmdas02_os.nc") + save(td_wr1, "winriver01.nc") + save(td_wr2, "winriver02.nc") + save(td_rp, "RiverPro_test01.nc") + save(td_transect, "winriver02_transect.nc") return assert_allclose(td_rdi, dat_rdi, atol=1e-6) assert_allclose(td_7f79, dat_rdi_7f79, atol=1e-6) + assert_allclose(td_7f79_2, dat_rdi_7f79_2, atol=1e-6) assert_allclose(td_rdi_bt, dat_rdi_bt, atol=1e-6) assert_allclose(td_vm, dat_vm_ws, atol=1e-6) assert_allclose(td_os, dat_vm_os, atol=1e-6) @@ -75,14 +80,14 @@ def test_io_rdi(self): def test_io_nortek(self): nens = 100 with pytest.warns(UserWarning): - td_awac = read('AWAC_test01.wpr', userdata=False, nens=[0, nens]) - td_awac_ud = read('AWAC_test01.wpr', nens=nens) - td_hwac = read('H-AWAC_test01.wpr') + td_awac = read("AWAC_test01.wpr", userdata=False, nens=[0, nens]) + td_awac_ud = read("AWAC_test01.wpr", nens=nens) + td_hwac = read("H-AWAC_test01.wpr") if make_data: - save(td_awac, 'AWAC_test01.nc') - save(td_awac_ud, 'AWAC_test01_ud.nc') - save(td_hwac, 'H-AWAC_test01.nc') + save(td_awac, "AWAC_test01.nc") + save(td_awac_ud, "AWAC_test01_ud.nc") + save(td_hwac, "H-AWAC_test01.nc") return assert_allclose(td_awac, dat_awac, atol=1e-6) @@ -91,44 +96,49 @@ def test_io_nortek(self): def test_io_nortek2(self): nens = 100 - td_sig = read('BenchFile01.ad2cp', nens=nens) - td_sig_i = read('Sig1000_IMU.ad2cp', userdata=False, nens=nens) - td_sig_i_ud = read('Sig1000_IMU.ad2cp', nens=nens) - td_sig_ieb = read('VelEchoBT01.ad2cp', nens=nens) - td_sig_ie = read('Sig500_Echo.ad2cp', nens=nens) - td_sig_tide = read('Sig1000_tidal.ad2cp', nens=nens) + td_sig = read("BenchFile01.ad2cp", nens=nens, rebuild_index=True) + td_sig_i = read( + "Sig1000_IMU.ad2cp", userdata=False, nens=nens, rebuild_index=True + ) + td_sig_i_ud = read("Sig1000_IMU.ad2cp", nens=nens, rebuild_index=True) + td_sig_ieb = read("VelEchoBT01.ad2cp", nens=nens, 
rebuild_index=True) + td_sig_ie = read("Sig500_Echo.ad2cp", nens=nens, rebuild_index=True) + td_sig_tide = read("Sig1000_tidal.ad2cp", nens=nens, rebuild_index=True) + # Only need to test 2nd dataset + td_sig_dp1, td_sig_dp2 = read("dual_profile.ad2cp") with pytest.warns(UserWarning): # This issues a warning... - td_sig_skip = read('Sig_SkippedPings01.ad2cp') + td_sig_skip = read("Sig_SkippedPings01.ad2cp") with pytest.warns(UserWarning): - td_sig_badt = sig.read_signature( - tb.rfnm('Sig1000_BadTime01.ad2cp')) + td_sig_badt = sig.read_signature(tb.rfnm("Sig1000_BadTime01.ad2cp")) # Make sure we read all the way to the end of the file. # This file ends exactly at the end of an ensemble. - td_sig5_leiw = read('Sig500_last_ensemble_is_whole.ad2cp') - - os.remove(tb.exdt('BenchFile01.ad2cp.index')) - os.remove(tb.exdt('Sig1000_IMU.ad2cp.index')) - os.remove(tb.exdt('VelEchoBT01.ad2cp.index')) - os.remove(tb.exdt('Sig500_Echo.ad2cp.index')) - os.remove(tb.exdt('Sig1000_tidal.ad2cp.index')) - os.remove(tb.exdt('Sig_SkippedPings01.ad2cp.index')) - os.remove(tb.exdt('Sig500_last_ensemble_is_whole.ad2cp.index')) - os.remove(tb.rfnm('Sig1000_BadTime01.ad2cp.index')) + td_sig5_leiw = read("Sig500_last_ensemble_is_whole.ad2cp") + + os.remove(tb.exdt("BenchFile01.ad2cp.index")) + os.remove(tb.exdt("Sig1000_IMU.ad2cp.index")) + os.remove(tb.exdt("VelEchoBT01.ad2cp.index")) + os.remove(tb.exdt("Sig500_Echo.ad2cp.index")) + os.remove(tb.exdt("Sig1000_tidal.ad2cp.index")) + os.remove(tb.exdt("Sig_SkippedPings01.ad2cp.index")) + os.remove(tb.exdt("Sig500_last_ensemble_is_whole.ad2cp.index")) + os.remove(tb.rfnm("Sig1000_BadTime01.ad2cp.index")) + os.remove(tb.exdt("dual_profile.ad2cp.index")) if make_data: - save(td_sig, 'BenchFile01.nc') - save(td_sig_i, 'Sig1000_IMU.nc') - save(td_sig_i_ud, 'Sig1000_IMU_ud.nc') - save(td_sig_ieb, 'VelEchoBT01.nc') - save(td_sig_ie, 'Sig500_Echo.nc') - save(td_sig_tide, 'Sig1000_tidal.nc') - save(td_sig_skip, 'Sig_SkippedPings01.nc') - 
save(td_sig_badt, 'Sig1000_BadTime01.nc') - save(td_sig5_leiw, 'Sig500_last_ensemble_is_whole.nc') + save(td_sig, "BenchFile01.nc") + save(td_sig_i, "Sig1000_IMU.nc") + save(td_sig_i_ud, "Sig1000_IMU_ud.nc") + save(td_sig_ieb, "VelEchoBT01.nc") + save(td_sig_ie, "Sig500_Echo.nc") + save(td_sig_tide, "Sig1000_tidal.nc") + save(td_sig_skip, "Sig_SkippedPings01.nc") + save(td_sig_badt, "Sig1000_BadTime01.nc") + save(td_sig5_leiw, "Sig500_last_ensemble_is_whole.nc") + save(td_sig_dp2, "dual_profile.nc") return assert_allclose(td_sig, dat_sig, atol=1e-6) @@ -140,25 +150,42 @@ def test_io_nortek2(self): assert_allclose(td_sig5_leiw, dat_sig5_leiw, atol=1e-6) assert_allclose(td_sig_skip, dat_sig_skip, atol=1e-6) assert_allclose(td_sig_badt, dat_sig_badt, atol=1e-6) + assert_allclose(td_sig_dp2, dat_sig_dp2, atol=1e-6) def test_nortek2_crop(self): # Test file cropping function - crop_ensembles(infile=tb.exdt('Sig500_Echo.ad2cp'), - outfile=tb.exdt('Sig500_Echo_crop.ad2cp'), - range=[50, 100]) - td_sig_ie_crop = read('Sig500_Echo_crop.ad2cp') + crop_ensembles( + infile=tb.exdt("Sig500_Echo.ad2cp"), + outfile=tb.exdt("Sig500_Echo_crop.ad2cp"), + range=[50, 100], + ) + td_sig_ie_crop = read("Sig500_Echo_crop.ad2cp") + + crop_ensembles( + infile=tb.exdt("BenchFile01.ad2cp"), + outfile=tb.exdt("BenchFile01_crop.ad2cp"), + range=[50, 100], + ) + td_sig_crop = read("BenchFile01_crop.ad2cp") if make_data: - save(td_sig_ie_crop, 'Sig500_Echo_crop.nc') + save(td_sig_ie_crop, "Sig500_Echo_crop.nc") + save(td_sig_crop, "BenchFile01_crop.nc") return - os.remove(tb.exdt('Sig500_Echo.ad2cp.index')) - os.remove(tb.exdt('Sig500_Echo_crop.ad2cp')) - os.remove(tb.exdt('Sig500_Echo_crop.ad2cp.index')) + os.remove(tb.exdt("Sig500_Echo.ad2cp.index")) + os.remove(tb.exdt("Sig500_Echo_crop.ad2cp")) + os.remove(tb.exdt("Sig500_Echo_crop.ad2cp.index")) + os.remove(tb.exdt("BenchFile01.ad2cp.index")) + os.remove(tb.exdt("BenchFile01_crop.ad2cp")) + os.remove(tb.exdt("BenchFile01_crop.ad2cp.index")) 
+ + cd_sig_ie_crop = load("Sig500_Echo_crop.nc") + cd_sig_crop = load("BenchFile01_crop.nc") - cd_sig_ie_crop = load('Sig500_Echo_crop.nc') assert_allclose(td_sig_ie_crop, cd_sig_ie_crop, atol=1e-6) + assert_allclose(td_sig_crop, cd_sig_crop, atol=1e-6) -if __name__ == '__main__': +if __name__ == "__main__": unittest.main() diff --git a/mhkit/tests/dolfyn/test_read_adv.py b/mhkit/tests/dolfyn/test_read_adv.py index f1d03c7af..9143099a6 100644 --- a/mhkit/tests/dolfyn/test_read_adv.py +++ b/mhkit/tests/dolfyn/test_read_adv.py @@ -9,32 +9,34 @@ save = tb.save_netcdf assert_allclose = tb.assert_allclose -dat = load('vector_data01') -dat_imu = load('vector_data_imu01') -dat_imu_json = load('vector_data_imu01-json') -dat_burst = load('vector_burst_mode01') +dat = load("vector_data01") +dat_imu = load("vector_data_imu01") +dat_imu_json = load("vector_data_imu01-json") +dat_burst = load("vector_burst_mode01") class io_adv_testcase(unittest.TestCase): def test_io_adv(self): nens = 100 - td = read('vector_data01.VEC', nens=nens) - tdm = read('vector_data_imu01.VEC', userdata=False, nens=nens) - tdb = read('vector_burst_mode01.VEC', nens=nens) - tdm2 = read('vector_data_imu01.VEC', - userdata=tb.exdt('vector_data_imu01.userdata.json'), - nens=nens) + td = read("vector_data01.VEC", nens=nens) + tdm = read("vector_data_imu01.VEC", userdata=False, nens=nens) + tdb = read("vector_burst_mode01.VEC", nens=nens) + tdm2 = read( + "vector_data_imu01.VEC", + userdata=tb.exdt("vector_data_imu01.userdata.json"), + nens=nens, + ) # These values are not correct for this data but I'm adding them for # test purposes only. 
set_inst2head_rotmat(tdm, np.eye(3), inplace=True) - tdm.attrs['inst2head_vec'] = [-1.0, 0.5, 0.2] + tdm.attrs["inst2head_vec"] = [-1.0, 0.5, 0.2] if make_data: - save(td, 'vector_data01.nc') - save(tdm, 'vector_data_imu01.nc') - save(tdb, 'vector_burst_mode01.nc') - save(tdm2, 'vector_data_imu01-json.nc') + save(td, "vector_data01.nc") + save(tdm, "vector_data_imu01.nc") + save(tdb, "vector_burst_mode01.nc") + save(tdm2, "vector_data_imu01-json.nc") return assert_allclose(td, dat, atol=1e-6) @@ -43,5 +45,5 @@ def test_io_adv(self): assert_allclose(tdm2, dat_imu_json, atol=1e-6) -if __name__ == '__main__': +if __name__ == "__main__": unittest.main() diff --git a/mhkit/tests/dolfyn/test_read_io.py b/mhkit/tests/dolfyn/test_read_io.py index 16f1b2c6a..835acc6bd 100644 --- a/mhkit/tests/dolfyn/test_read_io.py +++ b/mhkit/tests/dolfyn/test_read_io.py @@ -1,6 +1,13 @@ from . import test_read_adp as tp from . import test_read_adv as tv -from mhkit.tests.dolfyn.base import assert_allclose, save_netcdf, save_matlab, load_matlab, exdt, rfnm +from mhkit.tests.dolfyn.base import ( + assert_allclose, + save_netcdf, + save_matlab, + load_matlab, + exdt, + rfnm, +) import mhkit.dolfyn.io.rdi as wh import mhkit.dolfyn.io.nortek as awac import mhkit.dolfyn.io.nortek2 as sig @@ -15,34 +22,40 @@ class io_testcase(unittest.TestCase): def test_save(self): ds = tv.dat.copy(deep=True) + ds2 = tp.dat_sig.copy(deep=True) + save_netcdf(ds, "test_save") + save_netcdf(ds2, "test_save_comp.nc", compression=True) + save_matlab(ds, "test_save") - save_netcdf(ds, 'test_save') - save_matlab(ds, 'test_save') + assert os.path.exists(rfnm("test_save.nc")) + assert os.path.exists(rfnm("test_save_comp.nc")) + assert os.path.exists(rfnm("test_save.mat")) - assert os.path.exists(rfnm('test_save.nc')) - assert os.path.exists(rfnm('test_save.mat')) + os.remove(rfnm("test_save.nc")) + os.remove(rfnm("test_save_comp.nc")) + os.remove(rfnm("test_save.mat")) def test_matlab_io(self): nens = 100 - td_vec = 
read('vector_data_imu01.VEC', nens=nens) - td_rdi_bt = read('RDI_withBT.000', nens=nens) + td_vec = read("vector_data_imu01.VEC", nens=nens) + td_rdi_bt = read("RDI_withBT.000", nens=nens) # This read should trigger a warning about the declination being # defined in two places (in the binary .ENX files), and in the # .userdata.json file. NOTE: DOLfYN defaults to using what is in # the .userdata.json file. - with pytest.warns(UserWarning, match='magnetic_var_deg'): - td_vm = read('vmdas01_wh.ENX', nens=nens) + with pytest.warns(UserWarning, match="magnetic_var_deg"): + td_vm = read("vmdas01_wh.ENX", nens=nens) if make_data: - save_matlab(td_vec, 'dat_vec') - save_matlab(td_rdi_bt, 'dat_rdi_bt') - save_matlab(td_vm, 'dat_vm') + save_matlab(td_vec, "dat_vec") + save_matlab(td_rdi_bt, "dat_rdi_bt") + save_matlab(td_vm, "dat_vm") return - mat_vec = load_matlab('dat_vec.mat') - mat_rdi_bt = load_matlab('dat_rdi_bt.mat') - mat_vm = load_matlab('dat_vm.mat') + mat_vec = load_matlab("dat_vec.mat") + mat_rdi_bt = load_matlab("dat_rdi_bt.mat") + mat_vm = load_matlab("dat_vm.mat") assert_allclose(td_vec, mat_vec, atol=1e-6) assert_allclose(td_rdi_bt, mat_rdi_bt, atol=1e-6) @@ -50,18 +63,18 @@ def test_matlab_io(self): def test_debugging(self): def read_txt(fname, loc): - with open(loc(fname), 'r') as f: + with open(loc(fname), "r") as f: string = f.read() return string def clip_file(fname): log = read_txt(fname, exdt) - newlines = [i for i, ltr in enumerate(log) if ltr == '\n'] + newlines = [i for i, ltr in enumerate(log) if ltr == "\n"] try: - log = log[:newlines[100]+1] + log = log[: newlines[100] + 1] except: pass - with open(rfnm(fname), 'w') as f: + with open(rfnm(fname), "w") as f: f.write(log) def read_file_and_test(fname): @@ -71,32 +84,36 @@ def read_file_and_test(fname): os.remove(exdt(fname)) nens = 100 - wh.read_rdi(exdt('RDI_withBT.000'), nens, debug_level=3) - awac.read_nortek(exdt('AWAC_test01.wpr'), nens, debug=True, do_checksum=True) - 
awac.read_nortek(exdt('vector_data_imu01.VEC'), nens, debug=True, do_checksum=True) - sig.read_signature(exdt('Sig500_Echo.ad2cp'), nens, rebuild_index=True, debug=True) - os.remove(exdt('Sig500_Echo.ad2cp.index')) + wh.read_rdi(exdt("RDI_withBT.000"), nens, debug_level=3) + awac.read_nortek(exdt("AWAC_test01.wpr"), nens, debug=True, do_checksum=True) + awac.read_nortek( + exdt("vector_data_imu01.VEC"), nens, debug=True, do_checksum=True + ) + sig.read_signature( + exdt("Sig500_Echo.ad2cp"), nens, rebuild_index=True, debug=True + ) + os.remove(exdt("Sig500_Echo.ad2cp.index")) if make_data: - clip_file('RDI_withBT.dolfyn.log') - clip_file('AWAC_test01.dolfyn.log') - clip_file('vector_data_imu01.dolfyn.log') - clip_file('Sig500_Echo.dolfyn.log') + clip_file("RDI_withBT.dolfyn.log") + clip_file("AWAC_test01.dolfyn.log") + clip_file("vector_data_imu01.dolfyn.log") + clip_file("Sig500_Echo.dolfyn.log") return - read_file_and_test('RDI_withBT.dolfyn.log') - read_file_and_test('AWAC_test01.dolfyn.log') - read_file_and_test('vector_data_imu01.dolfyn.log') - read_file_and_test('Sig500_Echo.dolfyn.log') + read_file_and_test("RDI_withBT.dolfyn.log") + read_file_and_test("AWAC_test01.dolfyn.log") + read_file_and_test("vector_data_imu01.dolfyn.log") + read_file_and_test("Sig500_Echo.dolfyn.log") def test_read_warnings(self): with self.assertRaises(Exception): - wh.read_rdi(exdt('H-AWAC_test01.wpr')) + wh.read_rdi(exdt("H-AWAC_test01.wpr")) with self.assertRaises(Exception): - awac.read_nortek(exdt('BenchFile01.ad2cp')) + awac.read_nortek(exdt("BenchFile01.ad2cp")) with self.assertRaises(Exception): - sig.read_signature(exdt('AWAC_test01.wpr')) + sig.read_signature(exdt("AWAC_test01.wpr")) with self.assertRaises(IOError): - read(rfnm('AWAC_test01.nc')) + read(rfnm("AWAC_test01.nc")) with self.assertRaises(Exception): - save_netcdf(tp.dat_rdi, 'test_save.fail') + save_netcdf(tp.dat_rdi, "test_save.fail") diff --git a/mhkit/tests/dolfyn/test_rotate_adp.py 
b/mhkit/tests/dolfyn/test_rotate_adp.py index 4ec21353d..5fa67f05e 100644 --- a/mhkit/tests/dolfyn/test_rotate_adp.py +++ b/mhkit/tests/dolfyn/test_rotate_adp.py @@ -4,28 +4,28 @@ import numpy as np import numpy.testing as npt import unittest + make_data = False class rotate_adp_testcase(unittest.TestCase): def test_rotate_beam2inst(self): - - td_rdi = rotate2(tr.dat_rdi, 'inst', inplace=False) - td_sig = rotate2(tr.dat_sig, 'inst', inplace=False) - td_sig_i = rotate2(tr.dat_sig_i, 'inst', inplace=False) - td_sig_ieb = rotate2(tr.dat_sig_ieb, 'inst', inplace=False) + td_rdi = rotate2(tr.dat_rdi, "inst", inplace=False) + td_sig = rotate2(tr.dat_sig, "inst", inplace=False) + td_sig_i = rotate2(tr.dat_sig_i, "inst", inplace=False) + td_sig_ieb = rotate2(tr.dat_sig_ieb, "inst", inplace=False) if make_data: - save(td_rdi, 'RDI_test01_rotate_beam2inst.nc') - save(td_sig, 'BenchFile01_rotate_beam2inst.nc') - save(td_sig_i, 'Sig1000_IMU_rotate_beam2inst.nc') - save(td_sig_ieb, 'VelEchoBT01_rotate_beam2inst.nc') + save(td_rdi, "RDI_test01_rotate_beam2inst.nc") + save(td_sig, "BenchFile01_rotate_beam2inst.nc") + save(td_sig_i, "Sig1000_IMU_rotate_beam2inst.nc") + save(td_sig_ieb, "VelEchoBT01_rotate_beam2inst.nc") return - cd_rdi = load('RDI_test01_rotate_beam2inst.nc') - cd_sig = load('BenchFile01_rotate_beam2inst.nc') - cd_sig_i = load('Sig1000_IMU_rotate_beam2inst.nc') - cd_sig_ieb = load('VelEchoBT01_rotate_beam2inst.nc') + cd_rdi = load("RDI_test01_rotate_beam2inst.nc") + cd_sig = load("BenchFile01_rotate_beam2inst.nc") + cd_sig_i = load("Sig1000_IMU_rotate_beam2inst.nc") + cd_sig_ieb = load("VelEchoBT01_rotate_beam2inst.nc") assert_allclose(td_rdi, cd_rdi, atol=1e-5) assert_allclose(td_sig, cd_sig, atol=1e-5) @@ -33,32 +33,31 @@ def test_rotate_beam2inst(self): assert_allclose(td_sig_ieb, cd_sig_ieb, atol=1e-5) def test_rotate_inst2beam(self): - - td = load('RDI_test01_rotate_beam2inst.nc') - rotate2(td, 'beam', inplace=True) - td_awac = 
load('AWAC_test01_earth2inst.nc') - rotate2(td_awac, 'beam', inplace=True) - td_sig = load('BenchFile01_rotate_beam2inst.nc') - rotate2(td_sig, 'beam', inplace=True) - td_sig_i = load('Sig1000_IMU_rotate_beam2inst.nc') - rotate2(td_sig_i, 'beam', inplace=True) - td_sig_ie = load('Sig500_Echo_earth2inst.nc') - rotate2(td_sig_ie, 'beam', inplace=True) + td = load("RDI_test01_rotate_beam2inst.nc") + rotate2(td, "beam", inplace=True) + td_awac = load("AWAC_test01_earth2inst.nc") + rotate2(td_awac, "beam", inplace=True) + td_sig = load("BenchFile01_rotate_beam2inst.nc") + rotate2(td_sig, "beam", inplace=True) + td_sig_i = load("Sig1000_IMU_rotate_beam2inst.nc") + rotate2(td_sig_i, "beam", inplace=True) + td_sig_ie = load("Sig500_Echo_earth2inst.nc") + rotate2(td_sig_ie, "beam", inplace=True) if make_data: - save(td_awac, 'AWAC_test01_inst2beam.nc') - save(td_sig_ie, 'Sig500_Echo_inst2beam.nc') + save(td_awac, "AWAC_test01_inst2beam.nc") + save(td_sig_ie, "Sig500_Echo_inst2beam.nc") return cd_td = tr.dat_rdi.copy(deep=True) - cd_awac = load('AWAC_test01_inst2beam.nc') + cd_awac = load("AWAC_test01_inst2beam.nc") cd_sig = tr.dat_sig.copy(deep=True) cd_sig_i = tr.dat_sig_i.copy(deep=True) - cd_sig_ie = load('Sig500_Echo_inst2beam.nc') + cd_sig_ie = load("Sig500_Echo_inst2beam.nc") # # The reverse RDI rotation doesn't work b/c of NaN's in one beam # # that propagate to others, so we impose that here. 
- cd_td['vel'].values[:, np.isnan(cd_td['vel'].values).any(0)] = np.NaN + cd_td["vel"].values[:, np.isnan(cd_td["vel"].values).any(0)] = np.NaN assert_allclose(td, cd_td, atol=1e-5) assert_allclose(td_awac, cd_awac, atol=1e-5) @@ -69,38 +68,35 @@ def test_rotate_inst2beam(self): def test_rotate_inst2earth(self): # AWAC & Sig500 are loaded in earth td_awac = tr.dat_awac.copy(deep=True) - rotate2(td_awac, 'inst', inplace=True) + rotate2(td_awac, "inst", inplace=True) td_sig_ie = tr.dat_sig_ie.copy(deep=True) - rotate2(td_sig_ie, 'inst', inplace=True) + rotate2(td_sig_ie, "inst", inplace=True) td_sig_o = td_sig_ie.copy(deep=True) - td = rotate2(tr.dat_rdi, 'earth', inplace=False) - tdwr2 = rotate2(tr.dat_wr2, 'earth', inplace=False) - td_sig = load('BenchFile01_rotate_beam2inst.nc') - rotate2(td_sig, 'earth', inplace=True) - td_sig_i = load('Sig1000_IMU_rotate_beam2inst.nc') - rotate2(td_sig_i, 'earth', inplace=True) + td = rotate2(tr.dat_rdi, "earth", inplace=False) + tdwr2 = rotate2(tr.dat_wr2, "earth", inplace=False) + td_sig = load("BenchFile01_rotate_beam2inst.nc") + rotate2(td_sig, "earth", inplace=True) + td_sig_i = load("Sig1000_IMU_rotate_beam2inst.nc") + rotate2(td_sig_i, "earth", inplace=True) if make_data: - save(td_awac, 'AWAC_test01_earth2inst.nc') - save(td, 'RDI_test01_rotate_inst2earth.nc') - save(tdwr2, 'winriver02_rotate_ship2earth.nc') - save(td_sig, 'BenchFile01_rotate_inst2earth.nc') - save(td_sig_i, 'Sig1000_IMU_rotate_inst2earth.nc') - save(td_sig_ie, 'Sig500_Echo_earth2inst.nc') + save(td_awac, "AWAC_test01_earth2inst.nc") + save(td, "RDI_test01_rotate_inst2earth.nc") + save(tdwr2, "winriver02_rotate_ship2earth.nc") + save(td_sig, "BenchFile01_rotate_inst2earth.nc") + save(td_sig_i, "Sig1000_IMU_rotate_inst2earth.nc") + save(td_sig_ie, "Sig500_Echo_earth2inst.nc") return - td_awac = rotate2(load('AWAC_test01_earth2inst.nc'), - 'earth', inplace=False) - td_sig_ie = rotate2(load('Sig500_Echo_earth2inst.nc'), - 'earth', inplace=False) - td_sig_o 
= rotate2(td_sig_o.drop_vars( - 'orientmat'), 'earth', inplace=False) + td_awac = rotate2(load("AWAC_test01_earth2inst.nc"), "earth", inplace=False) + td_sig_ie = rotate2(load("Sig500_Echo_earth2inst.nc"), "earth", inplace=False) + td_sig_o = rotate2(td_sig_o.drop_vars("orientmat"), "earth", inplace=False) - cd = load('RDI_test01_rotate_inst2earth.nc') - cdwr2 = load('winriver02_rotate_ship2earth.nc') - cd_sig = load('BenchFile01_rotate_inst2earth.nc') - cd_sig_i = load('Sig1000_IMU_rotate_inst2earth.nc') + cd = load("RDI_test01_rotate_inst2earth.nc") + cdwr2 = load("winriver02_rotate_ship2earth.nc") + cd_sig = load("BenchFile01_rotate_inst2earth.nc") + cd_sig_i = load("Sig1000_IMU_rotate_inst2earth.nc") assert_allclose(td, cd, atol=1e-5) assert_allclose(tdwr2, cdwr2, atol=1e-5) @@ -111,66 +107,66 @@ def test_rotate_inst2earth(self): npt.assert_allclose(td_sig_o.vel, tr.dat_sig_ie.vel, atol=1e-5) def test_rotate_earth2inst(self): - - td_rdi = load('RDI_test01_rotate_inst2earth.nc') - rotate2(td_rdi, 'inst', inplace=True) - tdwr2 = load('winriver02_rotate_ship2earth.nc') - rotate2(tdwr2, 'inst', inplace=True) + td_rdi = load("RDI_test01_rotate_inst2earth.nc") + rotate2(td_rdi, "inst", inplace=True) + tdwr2 = load("winriver02_rotate_ship2earth.nc") + rotate2(tdwr2, "inst", inplace=True) td_awac = tr.dat_awac.copy(deep=True) - rotate2(td_awac, 'inst', inplace=True) # AWAC is in earth coords - td_sig = load('BenchFile01_rotate_inst2earth.nc') - rotate2(td_sig, 'inst', inplace=True) - td_sig_i = load('Sig1000_IMU_rotate_inst2earth.nc') - rotate2(td_sig_i, 'inst', inplace=True) + rotate2(td_awac, "inst", inplace=True) # AWAC is in earth coords + td_sig = load("BenchFile01_rotate_inst2earth.nc") + rotate2(td_sig, "inst", inplace=True) + td_sig_i = load("Sig1000_IMU_rotate_inst2earth.nc") + rotate2(td_sig_i, "inst", inplace=True) - cd_rdi = load('RDI_test01_rotate_beam2inst.nc') + cd_rdi = load("RDI_test01_rotate_beam2inst.nc") cd_wr2 = tr.dat_wr2 # ship and inst are 
considered equivalent in dolfy - cd_wr2.attrs['coord_sys'] = 'inst' - cd_awac = load('AWAC_test01_earth2inst.nc') - cd_sig = load('BenchFile01_rotate_beam2inst.nc') - cd_sig_i = load('Sig1000_IMU_rotate_beam2inst.nc') + cd_wr2.attrs["coord_sys"] = "inst" + cd_awac = load("AWAC_test01_earth2inst.nc") + cd_sig = load("BenchFile01_rotate_beam2inst.nc") + cd_sig_i = load("Sig1000_IMU_rotate_beam2inst.nc") assert_allclose(td_rdi, cd_rdi, atol=1e-5) assert_allclose(tdwr2, cd_wr2, atol=1e-5) assert_allclose(td_awac, cd_awac, atol=1e-5) assert_allclose(td_sig, cd_sig, atol=1e-5) # known failure due to orientmat, see test_vs_nortek - #assert_allclose(td_sig_i, cd_sig_i, atol=1e-3) - npt.assert_allclose(td_sig_i.accel.values, - cd_sig_i.accel.values, atol=1e-3) + # assert_allclose(td_sig_i, cd_sig_i, atol=1e-3) + npt.assert_allclose(td_sig_i.accel.values, cd_sig_i.accel.values, atol=1e-3) def test_rotate_earth2principal(self): - - td_rdi = load('RDI_test01_rotate_inst2earth.nc') - td_sig = load('BenchFile01_rotate_inst2earth.nc') + td_rdi = load("RDI_test01_rotate_inst2earth.nc") + td_sig = load("BenchFile01_rotate_inst2earth.nc") td_awac = tr.dat_awac.copy(deep=True) - td_rdi.attrs['principal_heading'] = calc_principal_heading( - td_rdi.vel.mean('range')) - td_sig.attrs['principal_heading'] = calc_principal_heading( - td_sig.vel.mean('range')) - td_awac.attrs['principal_heading'] = calc_principal_heading(td_awac.vel.mean('range'), - tidal_mode=False) - rotate2(td_rdi, 'principal', inplace=True) - rotate2(td_sig, 'principal', inplace=True) - rotate2(td_awac, 'principal', inplace=True) + td_rdi.attrs["principal_heading"] = calc_principal_heading( + td_rdi.vel.mean("range") + ) + td_sig.attrs["principal_heading"] = calc_principal_heading( + td_sig.vel.mean("range") + ) + td_awac.attrs["principal_heading"] = calc_principal_heading( + td_awac.vel.mean("range"), tidal_mode=False + ) + rotate2(td_rdi, "principal", inplace=True) + rotate2(td_sig, "principal", inplace=True) + 
rotate2(td_awac, "principal", inplace=True) if make_data: - save(td_rdi, 'RDI_test01_rotate_earth2principal.nc') - save(td_sig, 'BenchFile01_rotate_earth2principal.nc') - save(td_awac, 'AWAC_test01_earth2principal.nc') + save(td_rdi, "RDI_test01_rotate_earth2principal.nc") + save(td_sig, "BenchFile01_rotate_earth2principal.nc") + save(td_awac, "AWAC_test01_earth2principal.nc") return - cd_rdi = load('RDI_test01_rotate_earth2principal.nc') - cd_sig = load('BenchFile01_rotate_earth2principal.nc') - cd_awac = load('AWAC_test01_earth2principal.nc') + cd_rdi = load("RDI_test01_rotate_earth2principal.nc") + cd_sig = load("BenchFile01_rotate_earth2principal.nc") + cd_awac = load("AWAC_test01_earth2principal.nc") assert_allclose(td_rdi, cd_rdi, atol=1e-5) assert_allclose(td_awac, cd_awac, atol=1e-5) assert_allclose(td_sig, cd_sig, atol=1e-5) -if __name__ == '__main__': +if __name__ == "__main__": unittest.main() diff --git a/mhkit/tests/dolfyn/test_rotate_adv.py b/mhkit/tests/dolfyn/test_rotate_adv.py index 26ab76d3c..b967c838d 100644 --- a/mhkit/tests/dolfyn/test_rotate_adv.py +++ b/mhkit/tests/dolfyn/test_rotate_adv.py @@ -1,11 +1,16 @@ from . 
import test_read_adv as tr from .base import load_netcdf as load, save_netcdf as save, assert_allclose -from mhkit.dolfyn.rotate.api import rotate2, calc_principal_heading, \ - set_declination, set_inst2head_rotmat +from mhkit.dolfyn.rotate.api import ( + rotate2, + calc_principal_heading, + set_declination, + set_inst2head_rotmat, +) from mhkit.dolfyn.rotate.base import euler2orient, orient2euler import numpy as np import numpy.testing as npt import unittest + make_data = False @@ -14,14 +19,14 @@ def test_heading(self): td = tr.dat_imu.copy(deep=True) head, pitch, roll = orient2euler(td) - td['pitch'].values = pitch - td['roll'].values = roll - td['heading'].values = head + td["pitch"].values = pitch + td["roll"].values = roll + td["heading"].values = head if make_data: - save(td, 'vector_data_imu01_head_pitch_roll.nc') + save(td, "vector_data_imu01_head_pitch_roll.nc") return - cd = load('vector_data_imu01_head_pitch_roll.nc') + cd = load("vector_data_imu01_head_pitch_roll.nc") assert_allclose(td, cd, atol=1e-6) @@ -30,9 +35,7 @@ def test_inst2head_rotmat(self): td = tr.dat.copy(deep=True) # Swap x,y, reverse z - set_inst2head_rotmat(td, [[0, 1, 0], - [1, 0, 0], - [0, 0, -1]], inplace=True) + set_inst2head_rotmat(td, [[0, 1, 0], [1, 0, 0], [0, 0, -1]], inplace=True) # Coords don't get altered here npt.assert_allclose(td.vel[0].values, tr.dat.vel[1].values, atol=1e-6) @@ -41,7 +44,7 @@ def test_inst2head_rotmat(self): # Validation for non-symmetric rotations td = tr.dat.copy(deep=True) - R = euler2orient(20, 30, 60, units='degrees') # arbitrary angles + R = euler2orient(20, 30, 60, units="degrees") # arbitrary angles td = set_inst2head_rotmat(td, R, inplace=False) vel1 = td.vel # validate that a head->inst rotation occurs (transpose of inst2head_rotmat) @@ -51,64 +54,64 @@ def test_inst2head_rotmat(self): def test_rotate_inst2earth(self): td = tr.dat.copy(deep=True) - rotate2(td, 'earth', inplace=True) + rotate2(td, "earth", inplace=True) tdm = 
tr.dat_imu.copy(deep=True) - rotate2(tdm, 'earth', inplace=True) + rotate2(tdm, "earth", inplace=True) tdo = tr.dat.copy(deep=True) - omat = tdo['orientmat'] - tdo = rotate2(tdo.drop_vars('orientmat'), 'earth', inplace=False) - tdo['orientmat'] = omat + omat = tdo["orientmat"] + tdo = rotate2(tdo.drop_vars("orientmat"), "earth", inplace=False) + tdo["orientmat"] = omat if make_data: - save(td, 'vector_data01_rotate_inst2earth.nc') - save(tdm, 'vector_data_imu01_rotate_inst2earth.nc') + save(td, "vector_data01_rotate_inst2earth.nc") + save(tdm, "vector_data_imu01_rotate_inst2earth.nc") return - cd = load('vector_data01_rotate_inst2earth.nc') - cdm = load('vector_data_imu01_rotate_inst2earth.nc') + cd = load("vector_data01_rotate_inst2earth.nc") + cdm = load("vector_data_imu01_rotate_inst2earth.nc") assert_allclose(td, cd, atol=1e-6) assert_allclose(tdm, cdm, atol=1e-6) assert_allclose(tdo, cd, atol=1e-6) def test_rotate_earth2inst(self): - td = load('vector_data01_rotate_inst2earth.nc') - rotate2(td, 'inst', inplace=True) - tdm = load('vector_data_imu01_rotate_inst2earth.nc') - rotate2(tdm, 'inst', inplace=True) + td = load("vector_data01_rotate_inst2earth.nc") + rotate2(td, "inst", inplace=True) + tdm = load("vector_data_imu01_rotate_inst2earth.nc") + rotate2(tdm, "inst", inplace=True) cd = tr.dat.copy(deep=True) cdm = tr.dat_imu.copy(deep=True) # The heading/pitch/roll data gets modified during rotation, so it # doesn't go back to what it was. 
- cdm = cdm.drop_vars(['heading', 'pitch', 'roll']) - tdm = tdm.drop_vars(['heading', 'pitch', 'roll']) + cdm = cdm.drop_vars(["heading", "pitch", "roll"]) + tdm = tdm.drop_vars(["heading", "pitch", "roll"]) assert_allclose(td, cd, atol=1e-6) assert_allclose(tdm, cdm, atol=1e-6) def test_rotate_inst2beam(self): td = tr.dat.copy(deep=True) - rotate2(td, 'beam', inplace=True) + rotate2(td, "beam", inplace=True) tdm = tr.dat_imu.copy(deep=True) - rotate2(tdm, 'beam', inplace=True) + rotate2(tdm, "beam", inplace=True) if make_data: - save(td, 'vector_data01_rotate_inst2beam.nc') - save(tdm, 'vector_data_imu01_rotate_inst2beam.nc') + save(td, "vector_data01_rotate_inst2beam.nc") + save(tdm, "vector_data_imu01_rotate_inst2beam.nc") return - cd = load('vector_data01_rotate_inst2beam.nc') - cdm = load('vector_data_imu01_rotate_inst2beam.nc') + cd = load("vector_data01_rotate_inst2beam.nc") + cdm = load("vector_data_imu01_rotate_inst2beam.nc") assert_allclose(td, cd, atol=1e-6) assert_allclose(tdm, cdm, atol=1e-6) def test_rotate_beam2inst(self): - td = load('vector_data01_rotate_inst2beam.nc') - rotate2(td, 'inst', inplace=True) - tdm = load('vector_data_imu01_rotate_inst2beam.nc') - rotate2(tdm, 'inst', inplace=True) + td = load("vector_data01_rotate_inst2beam.nc") + rotate2(td, "inst", inplace=True) + tdm = load("vector_data_imu01_rotate_inst2beam.nc") + rotate2(tdm, "inst", inplace=True) cd = tr.dat.copy(deep=True) cdm = tr.dat_imu.copy(deep=True) @@ -117,60 +120,59 @@ def test_rotate_beam2inst(self): assert_allclose(tdm, cdm, atol=1e-5) def test_rotate_earth2principal(self): - td = load('vector_data01_rotate_inst2earth.nc') - td.attrs['principal_heading'] = calc_principal_heading(td['vel']) - rotate2(td, 'principal', inplace=True) - tdm = load('vector_data_imu01_rotate_inst2earth.nc') - tdm.attrs['principal_heading'] = calc_principal_heading(tdm['vel']) - rotate2(tdm, 'principal', inplace=True) + td = load("vector_data01_rotate_inst2earth.nc") + 
td.attrs["principal_heading"] = calc_principal_heading(td["vel"]) + rotate2(td, "principal", inplace=True) + tdm = load("vector_data_imu01_rotate_inst2earth.nc") + tdm.attrs["principal_heading"] = calc_principal_heading(tdm["vel"]) + rotate2(tdm, "principal", inplace=True) if make_data: - save(td, 'vector_data01_rotate_earth2principal.nc') - save(tdm, 'vector_data_imu01_rotate_earth2principal.nc') + save(td, "vector_data01_rotate_earth2principal.nc") + save(tdm, "vector_data_imu01_rotate_earth2principal.nc") return - cd = load('vector_data01_rotate_earth2principal.nc') - cdm = load('vector_data_imu01_rotate_earth2principal.nc') + cd = load("vector_data01_rotate_earth2principal.nc") + cdm = load("vector_data_imu01_rotate_earth2principal.nc") assert_allclose(td, cd, atol=1e-6) assert_allclose(tdm, cdm, atol=1e-6) def test_rotate_earth2principal_set_declination(self): declin = 3.875 - td = load('vector_data01_rotate_inst2earth.nc') + td = load("vector_data01_rotate_inst2earth.nc") td0 = td.copy(deep=True) - td.attrs['principal_heading'] = calc_principal_heading(td['vel']) - rotate2(td, 'principal', inplace=True) + td.attrs["principal_heading"] = calc_principal_heading(td["vel"]) + rotate2(td, "principal", inplace=True) set_declination(td, declin, inplace=True) - rotate2(td, 'earth', inplace=True) + rotate2(td, "earth", inplace=True) set_declination(td0, -1, inplace=True) set_declination(td0, declin, inplace=True) - td0.attrs['principal_heading'] = calc_principal_heading(td0['vel']) - rotate2(td0, 'earth', inplace=True) + td0.attrs["principal_heading"] = calc_principal_heading(td0["vel"]) + rotate2(td0, "earth", inplace=True) assert_allclose(td0, td, atol=1e-6) def test_rotate_warnings(self): warn1 = tr.dat.copy(deep=True) warn2 = tr.dat.copy(deep=True) - warn2.attrs['coord_sys'] = 'flow' + warn2.attrs["coord_sys"] = "flow" warn3 = tr.dat.copy(deep=True) - warn3.attrs['inst_model'] = 'ADV' + warn3.attrs["inst_model"] = "ADV" warn4 = tr.dat.copy(deep=True) - 
warn4.attrs['inst_model'] = 'adv' + warn4.attrs["inst_model"] = "adv" with self.assertRaises(Exception): - rotate2(warn1, 'ship') + rotate2(warn1, "ship") with self.assertRaises(Exception): - rotate2(warn2, 'earth') + rotate2(warn2, "earth") with self.assertRaises(Exception): set_inst2head_rotmat(warn3, np.eye(3)) - set_inst2head_rotmat(warn3, np.eye(3)) with self.assertRaises(Exception): set_inst2head_rotmat(warn4, np.eye(3)) -if __name__ == '__main__': +if __name__ == "__main__": unittest.main() diff --git a/mhkit/tests/dolfyn/test_shortcuts.py b/mhkit/tests/dolfyn/test_shortcuts.py index 513660d1d..948736603 100644 --- a/mhkit/tests/dolfyn/test_shortcuts.py +++ b/mhkit/tests/dolfyn/test_shortcuts.py @@ -14,27 +14,26 @@ class analysis_testcase(unittest.TestCase): @classmethod def setUpClass(self): dat = tv.dat.copy(deep=True) - self.dat = rotate2(dat, 'earth', inplace=False) - self.tdat = avm.turbulence_statistics( - self.dat, n_bin=20.0, fs=self.dat.fs) + self.dat = rotate2(dat, "earth", inplace=False) + self.tdat = avm.turbulence_statistics(self.dat, n_bin=20.0, fs=self.dat.fs) short = xr.Dataset() - short['u'] = self.tdat.velds.u - short['v'] = self.tdat.velds.v - short['w'] = self.tdat.velds.w - short['U'] = self.tdat.velds.U - short['U_mag'] = self.tdat.velds.U_mag - short['U_dir'] = self.tdat.velds.U_dir + short["u"] = self.tdat.velds.u + short["v"] = self.tdat.velds.v + short["w"] = self.tdat.velds.w + short["U"] = self.tdat.velds.U + short["U_mag"] = self.tdat.velds.U_mag + short["U_dir"] = self.tdat.velds.U_dir short["upup_"] = self.tdat.velds.upup_ short["vpvp_"] = self.tdat.velds.vpvp_ short["wpwp_"] = self.tdat.velds.wpwp_ short["upvp_"] = self.tdat.velds.upvp_ short["upwp_"] = self.tdat.velds.upwp_ short["vpwp_"] = self.tdat.velds.vpwp_ - short['tke'] = self.tdat.velds.tke - short['I'] = self.tdat.velds.I - short['E_coh'] = self.tdat.velds.E_coh - short['I_tke'] = self.tdat.velds.I_tke + short["tke"] = self.tdat.velds.tke + short["I"] = 
self.tdat.velds.I + short["E_coh"] = self.tdat.velds.E_coh + short["I_tke"] = self.tdat.velds.I_tke self.short = short @classmethod @@ -44,15 +43,15 @@ def tearDownClass(self): def test_shortcuts(self): ds = self.short.copy(deep=True) if make_data: - save(ds, 'vector_data01_u.nc') + save(ds, "vector_data01_u.nc") return - assert_allclose(ds, load('vector_data01_u.nc'), atol=1e-6) + assert_allclose(ds, load("vector_data01_u.nc"), atol=1e-6) def test_save_complex_data(self): # netcdf4 cannot natively handle complex values # This test is a sanity check that ensures this code's # workaround functions ds_save = self.short.copy(deep=True) - save(ds_save, 'test_save.nc') - assert os.path.exists(rfnm('test_save.nc')) + save(ds_save, "test_save.nc") + assert os.path.exists(rfnm("test_save.nc")) diff --git a/mhkit/tests/dolfyn/test_time.py b/mhkit/tests/dolfyn/test_time.py index c7fecfdf2..9c1ae7597 100644 --- a/mhkit/tests/dolfyn/test_time.py +++ b/mhkit/tests/dolfyn/test_time.py @@ -20,11 +20,12 @@ def test_time_conversion(self): assert_equal(dt[0], datetime(2012, 6, 12, 12, 0, 2, 687283)) assert_equal(dt1, [datetime(2012, 6, 12, 12, 0, 2, 687283)]) assert_equal(dt_off[0], datetime(2012, 6, 12, 5, 0, 2, 687283)) - assert_equal(t_str[0], '2012-06-12 12:00:02.687283') + assert_equal(t_str[0], "2012-06-12 12:00:02.687283") # Validated based on data in ad2cp.index file - assert_equal(time.dt642date(dat_sig.time[0])[0], - datetime(2017, 7, 24, 17, 0, 0, 63500)) + assert_equal( + time.dt642date(dat_sig.time[0])[0], datetime(2017, 7, 24, 17, 0, 0, 63500) + ) # This should always be true assert_equal(time.epoch2date([0])[0], datetime(1970, 1, 1, 0, 0)) @@ -48,5 +49,5 @@ def test_datenum(self): assert_equal(dn[0], 735032.5000311028) -if __name__ == '__main__': +if __name__ == "__main__": unittest.main() diff --git a/mhkit/tests/dolfyn/test_tools.py b/mhkit/tests/dolfyn/test_tools.py index 611512f48..6aaa10a9c 100644 --- a/mhkit/tests/dolfyn/test_tools.py +++ 
b/mhkit/tests/dolfyn/test_tools.py @@ -1,4 +1,4 @@ -import mhkit.dolfyn.tools.misc as tools +import mhkit.dolfyn.tools as tools from numpy.testing import assert_equal, assert_allclose import numpy as np import unittest @@ -8,55 +8,111 @@ class tools_testcase(unittest.TestCase): @classmethod def setUpClass(self): self.array = np.arange(10, dtype=float) - self.nan = np.zeros(3)*np.NaN + self.nan = np.zeros(3) * np.NaN @classmethod def tearDownClass(self): pass def test_detrend_array(self): - d = tools.detrend_array(self.array) + d = tools.misc.detrend_array(self.array) assert_allclose(d, np.zeros(10), atol=1e-10) def test_group(self): array = np.concatenate((self.array, self.array)) - d = tools.group(array) + d = tools.misc.group(array) out = np.array([slice(1, 20, None)], dtype=object) assert_equal(d, out) def test_slice(self): - tensor = np.array([[[1, 2, 3], [4, 5, 6], [7, 8, 9]], - [[10, 11, 12], [13, 14, 15], [16, 17, 18]], - [[19, 20, 21], [22, 23, 24], [25, 26, 27]]]) + tensor = np.array( + [ + [[1, 2, 3], [4, 5, 6], [7, 8, 9]], + [[10, 11, 12], [13, 14, 15], [16, 17, 18]], + [[19, 20, 21], [22, 23, 24], [25, 26, 27]], + ] + ) out = np.zeros((3, 3, 3)) slices = list() - for slc in tools.slice1d_along_axis((3, 3, 3), axis=-1): + for slc in tools.misc.slice1d_along_axis((3, 3, 3), axis=-1): slices.append(slc) out[slc] = tensor[slc] - slc_out = [(0, 0, slice(None, None, None)), - (0, 1, slice(None, None, None)), - (0, 2, slice(None, None, None)), - (1, 0, slice(None, None, None)), - (1, 1, slice(None, None, None)), - (1, 2, slice(None, None, None)), - (2, 0, slice(None, None, None)), - (2, 1, slice(None, None, None)), - (2, 2, slice(None, None, None))] + slc_out = [ + (0, 0, slice(None, None, None)), + (0, 1, slice(None, None, None)), + (0, 2, slice(None, None, None)), + (1, 0, slice(None, None, None)), + (1, 1, slice(None, None, None)), + (1, 2, slice(None, None, None)), + (2, 0, slice(None, None, None)), + (2, 1, slice(None, None, None)), + (2, 2, slice(None, 
None, None)), + ] assert_equal(slc_out, slices) assert_allclose(tensor, out, atol=1e-10) def test_fillgaps(self): arr = np.concatenate((self.array, self.nan, self.array)) - d1 = tools.fillgaps(arr.copy()) - d2 = tools.fillgaps(arr.copy(), maxgap=1) + d1 = tools.misc.fillgaps(arr.copy()) + d2 = tools.misc.fillgaps(arr.copy(), maxgap=1) - out1 = np.array([0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 6.75, 4.5, 2.25, - 0, 1, 2, 3, 4, 5, 6, 7, 8, 9]) - out2 = np.array([0, 1, 2, 3, 4, 5, 6, 7, 8, 9, np.nan, np.nan, np.nan, - 0, 1, 2, 3, 4, 5, 6, 7, 8, 9]) + out1 = np.array( + [ + 0, + 1, + 2, + 3, + 4, + 5, + 6, + 7, + 8, + 9, + 6.75, + 4.5, + 2.25, + 0, + 1, + 2, + 3, + 4, + 5, + 6, + 7, + 8, + 9, + ] + ) + out2 = np.array( + [ + 0, + 1, + 2, + 3, + 4, + 5, + 6, + 7, + 8, + 9, + np.nan, + np.nan, + np.nan, + 0, + 1, + 2, + 3, + 4, + 5, + 6, + 7, + 8, + 9, + ] + ) assert_allclose(d1, out1, atol=1e-10) assert_allclose(d2, out2, atol=1e-10) @@ -65,13 +121,69 @@ def test_interpgaps(self): arr = np.concatenate((self.array, self.nan, self.array, self.nan)) t = np.arange(0, arr.shape[0], 0.1) - d1 = tools.interpgaps(arr.copy(), t, extrapFlg=True) - d2 = tools.interpgaps(arr.copy(), t, maxgap=1) + d1 = tools.misc.interpgaps(arr.copy(), t, extrapFlg=True) + d2 = tools.misc.interpgaps(arr.copy(), t, maxgap=1) - out1 = np.array([0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 6.75, 4.5, 2.25, - 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 9, 9, 9]) - out2 = np.array([0, 1, 2, 3, 4, 5, 6, 7, 8, 9, np.nan, np.nan, np.nan, - 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, np.nan, np.nan, np.nan]) + out1 = np.array( + [ + 0, + 1, + 2, + 3, + 4, + 5, + 6, + 7, + 8, + 9, + 6.75, + 4.5, + 2.25, + 0, + 1, + 2, + 3, + 4, + 5, + 6, + 7, + 8, + 9, + 9, + 9, + 9, + ] + ) + out2 = np.array( + [ + 0, + 1, + 2, + 3, + 4, + 5, + 6, + 7, + 8, + 9, + np.nan, + np.nan, + np.nan, + 0, + 1, + 2, + 3, + 4, + 5, + 6, + 7, + 8, + 9, + np.nan, + np.nan, + np.nan, + ] + ) assert_allclose(d1, out1, atol=1e-10) assert_allclose(d2, out2, atol=1e-10) @@ -80,22 +192,140 @@ 
def test_medfiltnan(self): arr = np.concatenate((self.array, self.nan, self.array)) a = np.concatenate((arr[None, :], arr[None, :]), axis=0) - d = tools.medfiltnan(a, [1, 5], thresh=3) + d = tools.misc.medfiltnan(a, [1, 5], thresh=3) - out = np.array([[0, 1, 2, 3, 4, 5, 6, 7, 7, 7, 8, 9, np.nan, np.nan, np.nan, 2, 3, 4, 5, - 6, 7, 7, 7], - [0, 1, 2, 3, 4, 5, 6, 7, 7, 7, 8, 9, np.nan, np.nan, np.nan, 2, 3, 4, 5, - 6, 7, 7, 7]]) + out = np.array( + [ + [ + 0, + 1, + 2, + 3, + 4, + 5, + 6, + 7, + 7, + 7, + 8, + 9, + np.nan, + np.nan, + np.nan, + 2, + 3, + 4, + 5, + 6, + 7, + 7, + 7, + ], + [ + 0, + 1, + 2, + 3, + 4, + 5, + 6, + 7, + 7, + 7, + 8, + 9, + np.nan, + np.nan, + np.nan, + 2, + 3, + 4, + 5, + 6, + 7, + 7, + 7, + ], + ] + ) assert_allclose(d, out, atol=1e-10) def test_deg_conv(self): - d = tools.convert_degrees(self.array) + d = tools.misc.convert_degrees(self.array) - out = np.array([90., 89., 88., 87., 86., 85., 84., 83., 82., 81.]) + out = np.array([90.0, 89.0, 88.0, 87.0, 86.0, 85.0, 84.0, 83.0, 82.0, 81.0]) assert_allclose(d, out, atol=1e-10) + def test_fft_frequency(self): + fs = 1000 # Sampling frequency + nfft = 512 # Number of samples in a window -if __name__ == '__main__': + # Test for full frequency range + freq_full = tools.fft.fft_frequency(nfft, fs, full=True) + assert_equal(len(freq_full), nfft) + + # Check symmetry of positive and negative frequencies, ignoring the zero frequency + positive_freqs = freq_full[1 : int(nfft / 2)] + negative_freqs = freq_full[int(nfft / 2) + 1 :] + assert_allclose(positive_freqs, -negative_freqs[::-1]) + + def test_stepsize(self): + # Case 1: l < nfft + step, nens, nfft = tools.fft._stepsize(100, 200) + assert_equal((step, nens, nfft), (0, 1, 100)) + + # Case 2: l == nfft + step, nens, nfft = tools.fft._stepsize(200, 200) + assert_equal((step, nens, nfft), (0, 1, 200)) + + # Case 3: l > nfft, no nens + step, nens, nfft = tools.fft._stepsize(300, 100) + expected_nens = int(2.0 * 300 / 100) + expected_step = int((300 
- 100) / (expected_nens - 1)) + assert_equal((step, nens, nfft), (expected_step, expected_nens, 100)) + + # Case 4: l > nfft, with nens + step, nens, nfft = tools.fft._stepsize(300, 100, nens=5) + expected_step = int((300 - 100) / (5 - 1)) + assert_equal((step, nens, nfft), (expected_step, 5, 100)) + + # Case 5: l > nfft, with step + step, nens, nfft = tools.fft._stepsize(300, 100, step=50) + expected_nens = int((300 - 100) / 50 + 1) + assert_equal((step, nens, nfft), (50, expected_nens, 100)) + + # Case 6: nens is 1 + step, nens, nfft = tools.fft._stepsize(300, 100, nens=1) + assert_equal((step, nens, nfft), (0, 1, 100)) + + def test_cpsd_quasisync_1D(self): + fs = 1000 # Sample rate + nfft = 512 # Number of points in the fft + + # Test with signals of same length + a = np.random.normal(0, 1, 1000) + b = np.random.normal(0, 1, 1000) + cpsd = tools.fft.cpsd_quasisync_1D(a, b, nfft, fs) + self.assertEqual(cpsd.shape, (nfft // 2,)) + + # Test with signals of different lengths + a = np.random.normal(0, 1, 1500) + b = np.random.normal(0, 1, 1000) + cpsd = tools.fft.cpsd_quasisync_1D(a, b, nfft, fs) + self.assertEqual(cpsd.shape, (nfft // 2,)) + + # Test with different window types + for window in [None, 1, "hann"]: + cpsd = tools.fft.cpsd_quasisync_1D(a, b, nfft, fs, window=window) + self.assertEqual(cpsd.shape, (nfft // 2,)) + + # Test with a custom window + custom_window = np.hamming(nfft) + cpsd = tools.fft.cpsd_quasisync_1D(a, b, nfft, fs, window=custom_window) + self.assertEqual(cpsd.shape, (nfft // 2,)) + + +if __name__ == "__main__": unittest.main() diff --git a/mhkit/tests/dolfyn/test_vs_nortek.py b/mhkit/tests/dolfyn/test_vs_nortek.py index ac54e99e1..f1abdd406 100644 --- a/mhkit/tests/dolfyn/test_vs_nortek.py +++ b/mhkit/tests/dolfyn/test_vs_nortek.py @@ -14,42 +14,40 @@ def load_nortek_matfile(filename): - data = sio.loadmat(filename, - struct_as_record=False, - squeeze_me=True) - d = data['Data'] + data = sio.loadmat(filename, struct_as_record=False, 
squeeze_me=True) + d = data["Data"] # print(d._fieldnames) - burst = 'Burst' - bt = 'BottomTrack' + burst = "Burst" + bt = "BottomTrack" - beam = ['_VelBeam1', '_VelBeam2', '_VelBeam3', '_VelBeam4'] - b5 = 'IBurst_VelBeam5' - inst = ['_VelX', '_VelY', '_VelZ1', '_VelZ2'] - earth = ['_VelEast', '_VelNorth', '_VelUp1', '_VelUp2'] - axis = {'beam': beam, 'inst': inst, 'earth': earth} - AHRS = 'Burst_AHRSRotationMatrix' # , 'IBurst_AHRSRotationMatrix'] + beam = ["_VelBeam1", "_VelBeam2", "_VelBeam3", "_VelBeam4"] + b5 = "IBurst_VelBeam5" + inst = ["_VelX", "_VelY", "_VelZ1", "_VelZ2"] + earth = ["_VelEast", "_VelNorth", "_VelUp1", "_VelUp2"] + axis = {"beam": beam, "inst": inst, "earth": earth} + AHRS = "Burst_AHRSRotationMatrix" # , 'IBurst_AHRSRotationMatrix'] - vel = {'beam': {}, 'inst': {}, 'earth': {}} + vel = {"beam": {}, "inst": {}, "earth": {}} for ky in vel.keys(): for i in range(len(axis[ky])): - vel[ky][i] = np.transpose(getattr(d, burst+axis[ky][i])) - vel[ky] = np.stack((vel[ky][0], vel[ky][1], - vel[ky][2], vel[ky][3]), axis=0) + vel[ky][i] = np.transpose(getattr(d, burst + axis[ky][i])) + vel[ky] = np.stack((vel[ky][0], vel[ky][1], vel[ky][2], vel[ky][3]), axis=0) if AHRS in d._fieldnames: - vel['omat'] = np.transpose(getattr(d, AHRS)) + vel["omat"] = np.transpose(getattr(d, AHRS)) if b5 in d._fieldnames: - vel['b5'] = np.transpose(getattr(d, b5)) - #vel['omat5'] = getattr(d, AHRS[1]) + vel["b5"] = np.transpose(getattr(d, b5)) + # vel['omat5'] = getattr(d, AHRS[1]) - if bt+beam[0] in d._fieldnames: - vel_bt = {'beam': {}, 'inst': {}, 'earth': {}} + if bt + beam[0] in d._fieldnames: + vel_bt = {"beam": {}, "inst": {}, "earth": {}} for ky in vel_bt.keys(): for i in range(len(axis[ky])): - vel_bt[ky][i] = np.transpose(getattr(d, bt+axis[ky][i])) - vel_bt[ky] = np.stack((vel_bt[ky][0], vel_bt[ky][1], - vel_bt[ky][2], vel_bt[ky][3]), axis=0) + vel_bt[ky][i] = np.transpose(getattr(d, bt + axis[ky][i])) + vel_bt[ky] = np.stack( + (vel_bt[ky][0], vel_bt[ky][1], 
vel_bt[ky][2], vel_bt[ky][3]), axis=0 + ) return vel, vel_bt else: @@ -62,60 +60,61 @@ def rotate(axis): # Sig1000_IMU.ad2cp no userdata td_sig_i = rotate2(tr.dat_sig_i, axis, inplace=False) # VelEchoBT01.ad2cp - td_sig_ieb = rotate2(tr.dat_sig_ieb, axis, - inplace=False) + td_sig_ieb = rotate2(tr.dat_sig_ieb, axis, inplace=False) # Sig500_Echo.ad2cp - td_sig_ie = rotate2(tr.dat_sig_ie, axis, - inplace=False) + td_sig_ie = rotate2(tr.dat_sig_ie, axis, inplace=False) - td_sig_vel = load_nortek_matfile(base.rfnm('BenchFile01.mat')) - td_sig_i_vel = load_nortek_matfile(base.rfnm('Sig1000_IMU.mat')) - td_sig_ieb_vel, vel_bt = load_nortek_matfile(base.rfnm('VelEchoBT01.mat')) - td_sig_ie_vel = load_nortek_matfile(base.rfnm('Sig500_Echo.mat')) + td_sig_vel = load_nortek_matfile(base.rfnm("BenchFile01.mat")) + td_sig_i_vel = load_nortek_matfile(base.rfnm("Sig1000_IMU.mat")) + td_sig_ieb_vel, vel_bt = load_nortek_matfile(base.rfnm("VelEchoBT01.mat")) + td_sig_ie_vel = load_nortek_matfile(base.rfnm("Sig500_Echo.mat")) nens = 100 # ARHS inst2earth orientation matrix check # Checks the 1,1 element because the nortek orientmat's shape is [9,:] as # opposed to [3,3,:] - if axis == 'inst': - assert_allclose(td_sig_i.orientmat[0][0].values, - td_sig_i_vel['omat'][0, :nens], atol=1e-7) - assert_allclose(td_sig_ieb.orientmat[0][0].values, - td_sig_ieb_vel['omat'][0, :][..., :nens], atol=1e-7) + if axis == "inst": + assert_allclose( + td_sig_i.orientmat[0][0].values, td_sig_i_vel["omat"][0, :nens], atol=1e-7 + ) + assert_allclose( + td_sig_ieb.orientmat[0][0].values, + td_sig_ieb_vel["omat"][0, :][..., :nens], + atol=1e-7, + ) # 4-beam velocity assert_allclose(td_sig.vel.values, td_sig_vel[axis][..., :nens], atol=1e-5) - assert_allclose(td_sig_i.vel.values, - td_sig_i_vel[axis][..., :nens], atol=5e-3) - assert_allclose(td_sig_ieb.vel.values, - td_sig_ieb_vel[axis][..., :nens], atol=5e-3) - assert_allclose(td_sig_ie.vel.values, - td_sig_ie_vel[axis][..., :nens], atol=1e-5) + 
assert_allclose(td_sig_i.vel.values, td_sig_i_vel[axis][..., :nens], atol=5e-3) + assert_allclose(td_sig_ieb.vel.values, td_sig_ieb_vel[axis][..., :nens], atol=5e-3) + assert_allclose(td_sig_ie.vel.values, td_sig_ie_vel[axis][..., :nens], atol=1e-5) # 5th-beam velocity - if axis == 'beam': - assert_allclose(td_sig_i.vel_b5.values, - td_sig_i_vel['b5'][..., :nens], atol=1e-5) - assert_allclose(td_sig_ieb.vel_b5.values, - td_sig_ieb_vel['b5'][..., :nens], atol=1e-5) - assert_allclose(td_sig_ie.vel_b5.values, - td_sig_ie_vel['b5'][..., :nens], atol=1e-5) + if axis == "beam": + assert_allclose( + td_sig_i.vel_b5.values, td_sig_i_vel["b5"][..., :nens], atol=1e-5 + ) + assert_allclose( + td_sig_ieb.vel_b5.values, td_sig_ieb_vel["b5"][..., :nens], atol=1e-5 + ) + assert_allclose( + td_sig_ie.vel_b5.values, td_sig_ie_vel["b5"][..., :nens], atol=1e-5 + ) # bottom-track - assert_allclose(td_sig_ieb.vel_bt.values, - vel_bt[axis][..., :nens], atol=5e-3) + assert_allclose(td_sig_ieb.vel_bt.values, vel_bt[axis][..., :nens], atol=5e-3) class nortek_testcase(unittest.TestCase): def test_rotate2_beam(self): - rotate('beam') + rotate("beam") def test_rotate2_inst(self): - rotate('inst') + rotate("inst") def test_rotate2_earth(self): - rotate('earth') + rotate("earth") -if __name__ == '__main__': +if __name__ == "__main__": unittest.main() diff --git a/mhkit/tests/loads/test_extreme.py b/mhkit/tests/loads/test_extreme.py new file mode 100644 index 000000000..e0ede2e93 --- /dev/null +++ b/mhkit/tests/loads/test_extreme.py @@ -0,0 +1,50 @@ +import numpy as np +import unittest +import mhkit.loads as loads +from numpy.testing import assert_allclose + + +class TestExtreme(unittest.TestCase): + @classmethod + def setUpClass(self): + self.t, self.signal = self._example_waveform(self) + + def _example_waveform(self): + # Create simple wave form to analyse. + # This has been created to perform + # a simple independent calcuation that + # the mhkit functions can be tested against. 
+ + A = np.array([0.5, 0.6, 0.3]) + T = np.array([3, 2, 1]) + w = 2 * np.pi / T + + t = np.linspace(0, 4.5, 100) + + signal = np.zeros(t.size) + for i in range(A.size): + signal += A[i] * np.sin(w[i] * t) + + return t, signal + + def _example_crest_analysis(self, t, signal): + # NB: This only works due to the construction + # of our test signal. It is not suitable as + # a general approach. + grad = np.diff(signal) + + # +1 to get the index at turning point + turning_points = np.flatnonzero(grad[1:] * grad[:-1] < 0) + 1 + + crest_inds = turning_points[signal[turning_points] > 0] + crests = signal[crest_inds] + + return crests, crest_inds + + def test_global_peaks(self): + peaks_t, peaks_val = loads.extreme.global_peaks(self.t, self.signal) + + test_crests, test_crests_ind = self._example_crest_analysis(self.t, self.signal) + + assert_allclose(peaks_t, self.t[test_crests_ind]) + assert_allclose(peaks_val, test_crests) diff --git a/mhkit/tests/loads/test_loads.py b/mhkit/tests/loads/test_loads.py index f17e89cc4..8c119a38e 100644 --- a/mhkit/tests/loads/test_loads.py +++ b/mhkit/tests/loads/test_loads.py @@ -2,7 +2,6 @@ from numpy.testing import assert_array_almost_equal, assert_allclose from pandas._testing.asserters import assert_series_equal from pandas.testing import assert_frame_equal -from mhkit import utils from mhkit.wave import resource import mhkit.loads as loads import pandas as pd @@ -13,123 +12,351 @@ import os testdir = dirname(abspath(__file__)) -datadir = normpath(join(testdir,relpath('../../../examples/data/loads'))) +datadir = normpath(join(testdir, relpath("../../../examples/data/loads"))) -class TestLoads(unittest.TestCase): +class TestLoads(unittest.TestCase): @classmethod def setUpClass(self): - loads_data_file = join(datadir, "loads_data_dict.json") - with open(loads_data_file, 'r') as fp: + with open(loads_data_file, "r") as fp: data_dict = json.load(fp) # convert dictionaries into dataframes - data = { - key: pd.DataFrame(data_dict[key]) - 
for key in data_dict - } + data = {key: pd.DataFrame(data_dict[key]) for key in data_dict} self.data = data self.fatigue_tower = 3804 self.fatigue_blade = 1388 # import blade cal data - blade_data = pd.read_csv(join(datadir,'blade_cal.csv'),header=None) - blade_data.columns = ['flap_raw','edge_raw','flap_scaled','edge_scaled'] + blade_data = pd.read_csv(join(datadir, "blade_cal.csv"), header=None) + blade_data.columns = ["flap_raw", "edge_raw", "flap_scaled", "edge_scaled"] self.blade_data = blade_data - self.flap_offset = 9.19906E-05 + self.flap_offset = 9.19906e-05 self.edge_offset = -0.000310854 - self.blade_matrix = [1034671.4,-126487.28,82507.959,1154090.7] + self.blade_matrix = [1034671.4, -126487.28, 82507.959, 1154090.7] def test_bin_statistics(self): # create array containg wind speeds to use as bin edges - bin_edges = np.arange(3,26,1) + bin_edges = np.arange(3, 26, 1) # Apply function to calculate means - load_means =self.data['means'] - bin_against = load_means['uWind_80m'] - [b_means, b_means_std] = loads.general.bin_statistics(load_means, bin_against, bin_edges) + load_means = self.data["means"] + bin_against = load_means["uWind_80m"] + [b_means, b_means_std] = loads.general.bin_statistics( + load_means, bin_against, bin_edges + ) + + # Ensure the data type of the index matches + b_means.index = b_means.index.astype(self.data["bin_means"].index.dtype) + b_means_std.index = b_means_std.index.astype( + self.data["bin_means_std"].index.dtype + ) + + b_means.index.name = None # compatibility with old test data + b_means_std.index.name = None # compatibility with old test data + + assert_frame_equal(self.data["bin_means"], b_means) + assert_frame_equal(self.data["bin_means_std"], b_means_std) - assert_frame_equal(self.data['bin_means'],b_means) - assert_frame_equal(self.data['bin_means_std'],b_means_std) + def test_bin_statistics_xarray(self): + # create array containing wind speeds to use as bin edges + bin_edges = np.arange(3, 26, 1) + + # Apply function 
to calculate means + load_means = self.data["means"] + load_means = load_means.to_xarray() + bin_against = load_means["uWind_80m"] + [b_means, b_means_std] = loads.general.bin_statistics( + load_means, bin_against, bin_edges + ) + + # Ensure the data type of the index matches + b_means.index = b_means.index.astype(self.data["bin_means"].index.dtype) + b_means_std.index = b_means_std.index.astype( + self.data["bin_means_std"].index.dtype + ) + + b_means.index.name = None # compatibility with old test data + b_means_std.index.name = None # compatibility with old test data + + assert_frame_equal(self.data["bin_means"], b_means) + assert_frame_equal(self.data["bin_means_std"], b_means_std) + + def test_bin_statistics_data_type_error(self): + bin_against = np.array([10, 20, 30]) + bin_edges = np.array([0, 15, 25, 35]) + data_signal = ["signal_1"] + to_pandas = True + with self.assertRaises(TypeError): + loads.general.bin_statistics( + "invalid_data_type", bin_against, bin_edges, data_signal, to_pandas + ) + + def test_bin_statistics_bin_against_type_error(self): + data = pd.DataFrame({"signal_1": [1, 2, 3]}) + bin_edges = np.array([0, 15, 25, 35]) + data_signal = ["signal_1"] + to_pandas = True + invalid_bin_against = "invalid_bin_against_type" + with self.assertRaises(TypeError): + loads.general.bin_statistics( + data, invalid_bin_against, bin_edges, data_signal, to_pandas + ) + + def test_bin_statistics_bin_edges_type_error(self): + data = pd.DataFrame({"signal_1": [1, 2, 3]}) + bin_against = np.array([10, 20, 30]) + data_signal = ["signal_1"] + to_pandas = True + with self.assertRaises(TypeError): + loads.general.bin_statistics( + data, bin_against, "invalid_bin_edges_type", data_signal, to_pandas + ) + + def test_bin_statistics_data_signal_type_error(self): + data = pd.DataFrame({"signal_1": [1, 2, 3]}) + bin_against = np.array([10, 20, 30]) + bin_edges = np.array([0, 15, 25, 35]) + data_signal = "invalid_data_signal_type" + to_pandas = True + with 
self.assertRaises(TypeError): + loads.general.bin_statistics( + data, bin_against, bin_edges, data_signal, to_pandas + ) + + def test_bin_statistics_to_pandas_type_error(self): + data = pd.DataFrame({"signal_1": [1, 2, 3]}) + bin_against = np.array([10, 20, 30]) + bin_edges = np.array([0, 15, 25, 35]) + data_signal = ["signal_1"] + to_pandas = "invalid_to_pandas_type" + with self.assertRaises(TypeError): + loads.general.bin_statistics( + data, bin_against, bin_edges, data_signal, to_pandas + ) def test_blade_moments(self): - flap_raw = self.blade_data['flap_raw'] + flap_raw = self.blade_data["flap_raw"] flap_offset = self.flap_offset - edge_raw = self.blade_data['edge_raw'] + edge_raw = self.blade_data["edge_raw"] edge_offset = self.edge_offset - M_flap, M_edge = loads.general.blade_moments(self.blade_matrix,flap_offset,flap_raw,edge_offset,edge_raw) - - for i,j in zip(M_flap,self.blade_data['flap_scaled']): - self.assertAlmostEqual(i,j,places=1) - for i,j in zip(M_edge,self.blade_data['edge_scaled']): - self.assertAlmostEqual(i,j,places=1) + M_flap, M_edge = loads.general.blade_moments( + self.blade_matrix, flap_offset, flap_raw, edge_offset, edge_raw + ) + for i, j in zip(M_flap, self.blade_data["flap_scaled"]): + self.assertAlmostEqual(i, j, places=1) + for i, j in zip(M_edge, self.blade_data["edge_scaled"]): + self.assertAlmostEqual(i, j, places=1) - def test_damage_equivalent_loads(self): - loads_data = self.data['loads'] - tower_load = loads_data['TB_ForeAft'] - blade_load = loads_data['BL1_FlapMom'] - DEL_tower = loads.general.damage_equivalent_load(tower_load, 4,bin_num=100,data_length=600) - DEL_blade = loads.general.damage_equivalent_load(blade_load,10,bin_num=100,data_length=600) + def test_blade_moments_wrong_types(self): + # Test with incorrect types + blade_coefficients = [1.0, 2.0, 3.0, 4.0] # Should be np.ndarray + flap_offset = "invalid" # Should be float + flap_raw = "invalid" # Should be np.ndarray + edge_offset = "invalid" # Should be float + 
edge_raw = "invalid" # Should be np.ndarray - self.assertAlmostEqual(DEL_tower,self.fatigue_tower,delta=self.fatigue_tower*0.04) - self.assertAlmostEqual(DEL_blade,self.fatigue_blade,delta=self.fatigue_blade*0.04) + with self.assertRaises(TypeError): + loads.general.blade_moments( + blade_coefficients, flap_offset, flap_raw, edge_offset, edge_raw + ) + def test_damage_equivalent_loads(self): + loads_data = self.data["loads"] + tower_load = loads_data["TB_ForeAft"] + blade_load = loads_data["BL1_FlapMom"] + DEL_tower = loads.general.damage_equivalent_load( + tower_load, 4, bin_num=100, data_length=600 + ) + DEL_blade = loads.general.damage_equivalent_load( + blade_load, 10, bin_num=100, data_length=600 + ) + + self.assertAlmostEqual( + DEL_tower, self.fatigue_tower, delta=self.fatigue_tower * 0.04 + ) + self.assertAlmostEqual( + DEL_blade, self.fatigue_blade, delta=self.fatigue_blade * 0.04 + ) + + def test_damage_equivalent_load_wrong_types(self): + # Test with incorrect types + data_signal = "invalid" # Should be np.ndarray + m = "invalid" # Should be float or int + bin_num = "invalid" # Should be int + data_length = "invalid" # Should be float or int + + with self.assertRaises(TypeError): + loads.general.damage_equivalent_load(data_signal, m, bin_num, data_length) def test_plot_statistics(self): # Define path - savepath = abspath(join(testdir, 'test_scatplotter.png')) + savepath = abspath(join(testdir, "test_scatplotter.png")) # Generate plot - loads.graphics.plot_statistics( self.data['means']['uWind_80m'], - self.data['means']['TB_ForeAft'], - self.data['maxs']['TB_ForeAft'], - self.data['mins']['TB_ForeAft'], - y_stdev=self.data['std']['TB_ForeAft'], - x_label='Wind Speed [m/s]', - y_label='Tower Base Mom [kNm]', - save_path=savepath) + loads.graphics.plot_statistics( + self.data["means"]["uWind_80m"], + self.data["means"]["TB_ForeAft"], + self.data["maxs"]["TB_ForeAft"], + self.data["mins"]["TB_ForeAft"], + y_stdev=self.data["std"]["TB_ForeAft"], + 
x_label="Wind Speed [m/s]", + y_label="Tower Base Mom [kNm]", + save_path=savepath, + ) self.assertTrue(isfile(savepath)) + def test_plot_statistics_wrong_types(self): + # Test with incorrect types for some arguments + x = "invalid" # Should be np.ndarray + y_mean = "invalid" # Should be np.ndarray + y_max = "invalid" # Should be np.ndarray + y_min = "invalid" # Should be np.ndarray + y_stdev = "invalid" # Should be np.ndarray + + kwargs = { + "x_label": "X Axis", + "y_label": "Y Axis", + "title": "Test Plot", + "save_path": "test_plot.png", + } + + with self.assertRaises(TypeError): + loads.graphics.plot_statistics(x, y_mean, y_max, y_min, y_stdev, **kwargs) def test_plot_bin_statistics(self): # Define signal name, path, and bin centers - savepath = abspath(join(testdir, 'test_binplotter.png')) - bin_centers = np.arange(3.5,25.5,step=1) - signal_name = 'TB_ForeAft' + savepath = abspath(join(testdir, "test_binplotter.png")) + bin_centers = np.arange(3.5, 25.5, step=1) + signal_name = "TB_ForeAft" # Specify inputs to be used in plotting - bin_mean = self.data['bin_means'][signal_name] - bin_max = self.data['bin_maxs'][signal_name] - bin_min = self.data['bin_mins'][signal_name] - bin_mean_std = self.data['bin_means_std'][signal_name] - bin_max_std = self.data['bin_maxs_std'][signal_name] - bin_min_std = self.data['bin_mins_std'][signal_name] + bin_mean = self.data["bin_means"][signal_name] + bin_max = self.data["bin_maxs"][signal_name] + bin_min = self.data["bin_mins"][signal_name] + bin_mean_std = self.data["bin_means_std"][signal_name] + bin_max_std = self.data["bin_maxs_std"][signal_name] + bin_min_std = self.data["bin_mins_std"][signal_name] # Generate plot - loads.graphics.plot_bin_statistics(bin_centers, - bin_mean, bin_max, bin_min, - bin_mean_std, bin_max_std, bin_min_std, - x_label='Wind Speed [m/s]', - y_label=signal_name, - title='Binned Stats', - save_path=savepath) + loads.graphics.plot_bin_statistics( + bin_centers, + bin_mean, + bin_max, + bin_min, + 
bin_mean_std, + bin_max_std, + bin_min_std, + x_label="Wind Speed [m/s]", + y_label=signal_name, + title="Binned Stats", + save_path=savepath, + ) self.assertTrue(isfile(savepath)) -class TestWDRT(unittest.TestCase): + def test_plot_bin_statistics_type_errors(self): + # Specify inputs to be used in plotting + bin_centers = np.arange(3.5, 25.5, step=1) + signal_name = "TB_ForeAft" + bin_mean = self.data["bin_means"][signal_name] + bin_max = self.data["bin_maxs"][signal_name] + bin_min = self.data["bin_mins"][signal_name] + bin_mean_std = self.data["bin_means_std"][signal_name] + bin_max_std = self.data["bin_maxs_std"][signal_name] + bin_min_std = self.data["bin_mins_std"][signal_name] + # Test invalid data types one at a time + with self.assertRaises(TypeError): + loads.graphics.plot_bin_statistics( + ["a", 2, 3], # Invalid bin_centers + bin_mean, + bin_max, + bin_min, + bin_mean_std, + bin_max_std, + bin_min_std, + ) + + with self.assertRaises(TypeError): + loads.graphics.plot_bin_statistics( + bin_centers, + ["a", 20, 30], # Invalid bin_mean + bin_max, + bin_min, + bin_mean_std, + bin_max_std, + bin_min_std, + ) + + with self.assertRaises(TypeError): + loads.graphics.plot_bin_statistics( + bin_centers, + bin_mean, + ["a", 25, 35], # Invalid bin_max + bin_min, + bin_mean_std, + bin_max_std, + bin_min_std, + ) + + with self.assertRaises(TypeError): + loads.graphics.plot_bin_statistics( + bin_centers, + bin_mean, + bin_max, + ["a", 15, 25], # Invalid bin_min + bin_mean_std, + bin_max_std, + bin_min_std, + ) + + with self.assertRaises(TypeError): + loads.graphics.plot_bin_statistics( + bin_centers, + bin_mean, + bin_max, + bin_min, + ["a", 2, 3], # Invalid bin_mean_std + bin_max_std, + bin_min_std, + ) + + with self.assertRaises(TypeError): + loads.graphics.plot_bin_statistics( + bin_centers, + bin_mean, + bin_max, + bin_min, + bin_mean_std, + ["a", 1.5, 2.5], # Invalid bin_max_std + bin_min_std, + ) + + with self.assertRaises(TypeError): + 
loads.graphics.plot_bin_statistics( + bin_centers, + bin_mean, + bin_max, + bin_min, + bin_mean_std, + bin_max_std, + ["a", 1.8, 2.8], # Invalid bin_min_std + ) + +class TestWDRT(unittest.TestCase): @classmethod def setUpClass(self): mler_file = join(datadir, "mler.csv") - mler_data = pd.read_csv(mler_file,index_col=None) - mler_tsfile = join(datadir,"mler_ts.csv") - mler_ts = pd.read_csv(mler_tsfile,index_col=0) + mler_data = pd.read_csv(mler_file, index_col=None) + mler_tsfile = join(datadir, "mler_ts.csv") + mler_ts = pd.read_csv(mler_tsfile, index_col=0) self.mler_ts = mler_ts - self.wave_freq = np.linspace( 0.,1,500) + self.wave_freq = np.linspace(0.0, 1, 500) self.mler = mler_data self.sim = loads.extreme.mler_simulation() @@ -138,45 +365,89 @@ def test_mler_coefficients(self): Tp = 15.1 # time period of waves pm = resource.pierson_moskowitz_spectrum(self.wave_freq, Tp, Hs) mler_data = loads.extreme.mler_coefficients( - self.mler['RAO'].astype(complex), pm, 1) + self.mler["RAO"].astype(complex), pm, 1 + ) + mler_data.reset_index(drop=True, inplace=True) + + assert_series_equal( + mler_data["WaveSpectrum"], + self.mler["Res_Spec"], + check_exact=False, + check_names=False, + atol=0.001, + ) + assert_series_equal( + mler_data["Phase"], + self.mler["phase"], + check_exact=False, + check_names=False, + rtol=0.001, + ) + + def test_mler_coefficients_xarray(self): + Hs = 9.0 # significant wave height + Tp = 15.1 # time period of waves + pm = resource.pierson_moskowitz_spectrum(self.wave_freq, Tp, Hs) + mler_data = loads.extreme.mler_coefficients( + self.mler["RAO"].astype(complex).to_xarray(), pm, 1 + ) mler_data.reset_index(drop=True, inplace=True) - assert_series_equal(mler_data['WaveSpectrum'], self.mler['Res_Spec'], - check_exact=False, check_names=False, atol=0.001) - assert_series_equal(mler_data['Phase'], self.mler['phase'], - check_exact=False, check_names=False, rtol=0.001) + assert_series_equal( + mler_data["WaveSpectrum"], + self.mler["Res_Spec"], + 
check_exact=False, + check_names=False, + atol=0.001, + ) + assert_series_equal( + mler_data["Phase"], + self.mler["phase"], + check_exact=False, + check_names=False, + rtol=0.001, + ) def test_mler_simulation(self): T = np.linspace(-150, 150, 301) X = np.linspace(-300, 300, 601) sim = loads.extreme.mler_simulation() - assert_array_almost_equal(sim['X'], X) - assert_array_almost_equal(sim['T'], T) + assert_array_almost_equal(sim["X"], X) + assert_array_almost_equal(sim["T"], T) def test_mler_wave_amp_normalize(self): - wave_freq = np.linspace(0., 1, 500) + wave_freq = np.linspace(0.0, 1, 500) mler = pd.DataFrame(index=wave_freq) - mler['WaveSpectrum'] = self.mler['Res_Spec'].values - mler['Phase'] = self.mler['phase'].values + mler["WaveSpectrum"] = self.mler["Res_Spec"].values + mler["Phase"] = self.mler["phase"].values k = resource.wave_number(wave_freq, 70) k = k.fillna(0) mler_norm = loads.extreme.mler_wave_amp_normalize( - 4.5*1.9, mler, self.sim, k.k.values) + 4.5 * 1.9, mler, self.sim, k.k.values + ) mler_norm.reset_index(drop=True, inplace=True) - assert_series_equal(mler_norm['WaveSpectrum'], self.mler['Norm_Spec'],check_exact=False,atol=0.001,check_names=False) + assert_series_equal( + mler_norm["WaveSpectrum"], + self.mler["Norm_Spec"], + check_exact=False, + atol=0.001, + check_names=False, + ) def test_mler_export_time_series(self): - wave_freq = np.linspace(0., 1, 500) + wave_freq = np.linspace(0.0, 1, 500) mler = pd.DataFrame(index=wave_freq) - mler['WaveSpectrum'] = self.mler['Norm_Spec'].values - mler['Phase'] = self.mler['phase'].values + mler["WaveSpectrum"] = self.mler["Norm_Spec"].values + mler["Phase"] = self.mler["phase"].values k = resource.wave_number(wave_freq, 70) k = k.fillna(0) - RAO = self.mler['RAO'].astype(complex) + RAO = self.mler["RAO"].astype(complex) mler_ts = loads.extreme.mler_export_time_series( - RAO.values, mler, self.sim, k.k.values) + RAO.values, mler, self.sim, k.k.values + ) + mler_ts.index.name = None # compatibility 
with old data assert_frame_equal(self.mler_ts, mler_ts, atol=0.0001) @@ -188,8 +459,7 @@ def test_return_year_value(self): for y in return_years: for stp in short_term_periods: with self.subTest(year=y, short_term=stp): - val = loads.extreme.return_year_value( - dist.ppf, y, stp) + val = loads.extreme.return_year_value(dist.ppf, y, stp) want = 4.5839339 self.assertAlmostEqual(want, val, 5) @@ -200,24 +470,41 @@ def test_longterm_extreme(self): w = [0.5, 0.5] lte = loads.extreme.full_seastate_long_term_extreme(ste, w) x = np.random.rand() - assert_allclose(lte.cdf(x), w[0]*ste[0].cdf(x) + w[1]*ste[1].cdf(x)) + assert_allclose(lte.cdf(x), w[0] * ste[0].cdf(x) + w[1] * ste[1].cdf(x)) def test_shortterm_extreme(self): - methods = ['peaks_weibull', 'peaks_weibull_tail_fit', - 'peaks_over_threshold', 'block_maxima_gev', - 'block_maxima_gumbel'] + methods = [ + "peaks_weibull", + "peaks_weibull_tail_fit", + "peaks_over_threshold", + "block_maxima_gev", + "block_maxima_gumbel", + ] filename = "time_series_for_extremes.txt" data = np.loadtxt(os.path.join(datadir, filename)) t = data[:, 0] data = data[:, 1] t_st = 1.0 * 60 * 60 x = 1.6 - cdfs_1 = [0.006750456316537166, 0.5921659393757381, 0.6156789503874247, - 0.6075807789811315, 0.9033574618279865] + cdfs_1 = [ + 0.006750456316537166, + 0.5921659393757381, + 0.6156789503874247, + 0.6075807789811315, + 0.9033574618279865, + ] for method, cdf_1 in zip(methods, cdfs_1): ste = loads.extreme.ste(t, data, t_st, method) assert_allclose(ste.cdf(x), cdf_1) + def test_automatic_threshold(self): + filename = "data_loads_hs.csv" + data = np.loadtxt(os.path.join(datadir, filename), delimiter=",") + years = 2.97 + pct, threshold = loads.extreme.automatic_hs_threshold(data, years) + assert np.isclose(pct, 0.9913) + assert np.isclose(threshold, 1.032092) + -if __name__ == '__main__': +if __name__ == "__main__": unittest.main() diff --git a/mhkit/tests/mooring/test_mooring.py b/mhkit/tests/mooring/test_mooring.py index 1ba09f42d..da11f614c 
100644 --- a/mhkit/tests/mooring/test_mooring.py +++ b/mhkit/tests/mooring/test_mooring.py @@ -3,43 +3,237 @@ from matplotlib.animation import FuncAnimation import xarray as xr import mhkit.mooring as mooring +import pytest +import numpy as np testdir = dirname(abspath(__file__)) -datadir = normpath(join(testdir, '..', '..', '..', - 'examples', 'data', 'mooring')) +datadir = normpath(join(testdir, "..", "..", "..", "examples", "data", "mooring")) class TestMooring(unittest.TestCase): + @classmethod + def setUpClass(self): + fpath = join(datadir, "line1_test.nc") + self.ds = xr.open_dataset(fpath) + self.dsani = self.ds.sel(Time=slice(0, 10)) def test_moordyn_out(self): - fpath = join(datadir, 'Test.MD.out') + fpath = join(datadir, "Test.MD.out") inputpath = join(datadir, "TestInput.MD.dat") ds = mooring.io.read_moordyn(fpath, input_file=inputpath) - isinstance(ds, xr.Dataset) + self.assertIsInstance(ds, xr.Dataset) def test_lay_length(self): - fpath = join(datadir, 'line1_test.nc') + fpath = join(datadir, "line1_test.nc") ds = xr.open_dataset(fpath) laylengths = mooring.lay_length(ds, depth=-56, tolerance=0.25) laylength = laylengths.mean().values self.assertAlmostEqual(laylength, 45.0, 1) def test_animate_3d(self): - fpath = join(datadir, 'line1_test.nc') - ds = xr.open_dataset(fpath) - dsani = ds.sel(Time=slice(0, 10)) - ani = mooring.graphics.animate(dsani, dimension='3d', interval=10, repeat=True, - xlabel='X-axis', ylabel='Y-axis', zlabel='Depth [m]', title='Mooring Line Example') - isinstance(ani, FuncAnimation) + dsani = self.ds.sel(Time=slice(0, 10)) + ani = mooring.graphics.animate( + dsani, + dimension="3d", + interval=10, + repeat=True, + xlabel="X-axis", + ylabel="Y-axis", + zlabel="Depth [m]", + title="Mooring Line Example", + ) + self.assertIsInstance(ani, FuncAnimation) def test_animate_2d(self): - fpath = join(datadir, 'line1_test.nc') - ds = xr.open_dataset(fpath) - dsani = ds.sel(Time=slice(0, 10)) - ani2d = mooring.graphics.animate(dsani, 
dimension='2d', xaxis='x', yaxis='z', repeat=True, - xlabel='X-axis', ylabel='Depth [m]', title='Mooring Line Example') - isinstance(ani2d, FuncAnimation) + dsani = self.ds.sel(Time=slice(0, 10)) + ani2d = mooring.graphics.animate( + dsani, + dimension="2d", + xaxis="x", + yaxis="z", + repeat=True, + xlabel="X-axis", + ylabel="Depth [m]", + title="Mooring Line Example", + ) + self.assertIsInstance(ani2d, FuncAnimation) + + def test_animate_2d_update(self): + ani2d = mooring.graphics.animate( + self.ds, + dimension="2d", + xaxis="x", + yaxis="z", + repeat=True, + xlabel="X-axis", + ylabel="Depth [m]", + title="Mooring Line Example", + ) + + # Extract the figure and axes + fig = ani2d._fig + ax = fig.axes[0] + (line,) = ax.lines + + # Simulate the update for a specific frame + frame = 5 + + # Extracting data from the list of nodes + nodes_x, nodes_y, _ = mooring.graphics._get_axis_nodes( + self.dsani, "x", "z", "y" + ) + x_data = self.dsani[nodes_x[0]].isel(Time=frame).values + y_data = self.dsani[nodes_y[0]].isel(Time=frame).values + + # Manually set the data for the line object + line.set_data(x_data, y_data) + + # Extract updated data from the line object + updated_x, updated_y = line.get_data() + + # Assert that the updated data matches the dataset + np.testing.assert_array_equal(updated_x, x_data) + np.testing.assert_array_equal(updated_y, y_data) + + def test_animate_3d_update(self): + ani3d = mooring.graphics.animate( + self.ds, + dimension="3d", + xaxis="x", + yaxis="z", + zaxis="y", + repeat=True, + xlabel="X-axis", + ylabel="Depth [m]", + zlabel="Y-axis", + title="Mooring Line Example", + ) + + # Extract the figure and axes + fig = ani3d._fig + ax = fig.axes[0] + (line,) = ax.lines + + # Simulate the update for a specific frame + frame = 5 + + # Extracting data for the specified frame + nodes_x, nodes_y, nodes_z = mooring.graphics._get_axis_nodes( + self.dsani, "x", "z", "y" + ) + x_data = self.dsani[nodes_x[0]].isel(Time=frame).values + y_data = 
self.dsani[nodes_y[0]].isel(Time=frame).values + z_data = self.dsani[nodes_z[0]].isel(Time=frame).values + + # Manually set the data for the line object + line.set_data(x_data, y_data) + line.set_3d_properties(z_data) + + # Extract updated data from the line object + updated_x, updated_y, updated_z = line._verts3d + + # Assert that the updated data matches the dataset + np.testing.assert_array_equal(updated_x, x_data) + np.testing.assert_array_equal(updated_y, y_data) + np.testing.assert_array_equal(updated_z, z_data) + + # Test for xaxis, yaxis, zaxis type handling + def test_animate_xaxis_type_handling(self): + with pytest.raises(TypeError): + mooring.graphics.animate(self.dsani, xaxis=123) + + def test_animate_yaxis_type_handling(self): + with pytest.raises(TypeError): + mooring.graphics.animate(self.dsani, yaxis=123) + + def test_animate_zaxis_type_handling(self): + with pytest.raises(TypeError): + mooring.graphics.animate(self.dsani, zaxis=123) + + # Test for zlim and zlabel in 3D mode + def test_animate_zlim_type_handling_3d(self): + with pytest.raises(TypeError): + mooring.graphics.animate(self.dsani, dimension="3d", zlim="invalid") + + def test_animate_zlabel_type_handling_3d(self): + with pytest.raises(TypeError): + mooring.graphics.animate(self.dsani, dimension="3d", zlabel=123) + + # Test for xlim, ylim, interval, repeat, xlabel, ylabel, title + def test_animate_xlim_type_handling(self): + with pytest.raises(TypeError): + mooring.graphics.animate(self.dsani, xlim="invalid") + + def test_animate_ylim_type_handling(self): + with pytest.raises(TypeError): + mooring.graphics.animate(self.dsani, ylim="invalid") + + def test_animate_interval_type_handling(self): + with pytest.raises(TypeError): + mooring.graphics.animate(self.dsani, interval="invalid") + + def test_animate_repeat_type_handling(self): + with pytest.raises(TypeError): + mooring.graphics.animate(self.dsani, repeat="invalid") + + def test_animate_xlabel_type_handling(self): + with 
pytest.raises(TypeError): + mooring.graphics.animate(self.dsani, xlabel=123) + + def test_animate_ylabel_type_handling(self): + with pytest.raises(TypeError): + mooring.graphics.animate(self.dsani, ylabel=123) + + def test_animate_title_type_handling(self): + with pytest.raises(TypeError): + mooring.graphics.animate(self.dsani, title=123) + + def test_animate_dsani_type_handling(self): + with pytest.raises(TypeError): + mooring.graphics.animate("not_a_dataset") + + def test_animate_xlim_type_handling_none(self): + try: + mooring.graphics.animate(self.dsani, xlim=None) + except TypeError: + pytest.fail("Unexpected TypeError with xlim=None") + + def test_animate_ylim_type_handling_none(self): + try: + mooring.graphics.animate(self.dsani, ylim=None) + except TypeError: + pytest.fail("Unexpected TypeError with ylim=None") + + def test_animate_interval_type_handling(self): + with pytest.raises(TypeError): + mooring.graphics.animate(self.dsani, interval="not_an_int") + + def test_animate_repeat_type_handling(self): + with pytest.raises(TypeError): + mooring.graphics.animate(self.dsani, repeat="not_a_bool") + + def test_animate_xlabel_type_handling_none(self): + try: + mooring.graphics.animate(self.dsani, xlabel=None) + except TypeError: + pytest.fail("Unexpected TypeError with xlabel=None") + + def test_animate_ylabel_type_handling_none(self): + try: + mooring.graphics.animate(self.dsani, ylabel=None) + except TypeError: + pytest.fail("Unexpected TypeError with ylabel=None") + + def test_animate_title_type_handling_none(self): + try: + mooring.graphics.animate(self.dsani, title=None) + except TypeError: + pytest.fail("Unexpected TypeError with title=None") + + def test_animate_dimension_type_handling(self): + with pytest.raises(ValueError): + mooring.graphics.animate(self.dsani, dimension="not_2d_or_3d") -if __name__ == '__main__': +if __name__ == "__main__": unittest.main() diff --git a/mhkit/tests/power/test_power.py b/mhkit/tests/power/test_power.py index 
eb2807932..e218d149f 100644 --- a/mhkit/tests/power/test_power.py +++ b/mhkit/tests/power/test_power.py @@ -1,112 +1,186 @@ - -from os.path import abspath, dirname, join, isfile, normpath, relpath +from os.path import abspath, dirname, join, normpath, relpath import mhkit.power as power import pandas as pd +import xarray as xr import numpy as np import unittest -import os testdir = dirname(abspath(__file__)) -datadir = normpath(join(testdir,relpath('../../../examples/data/power'))) +datadir = normpath(join(testdir, relpath("../../../examples/data/power"))) -class TestDevice(unittest.TestCase): +class TestDevice(unittest.TestCase): @classmethod def setUpClass(self): self.t = 600 fs = 1000 - sample_frequency = 1000 # = fs - self.samples = np.linspace(0, self.t, int(fs*self.t), endpoint=False) + self.samples = np.linspace(0, self.t, int(fs * self.t), endpoint=False) self.frequency = 60 - self.freq_array = np.ones(len(self.samples))*60 - harmonics_int = np.arange(0,60*60,5) + self.freq_array = np.ones(len(self.samples)) * 60 + harmonics_int = np.arange(0, 60 * 60, 5) self.harmonics_int = harmonics_int - self.interharmonic = np.zeros(len(harmonics_int)) #since this is an idealized sin wave, the interharmonics should be zero + # since this is an idealized sin wave, the interharmonics should be zero + self.interharmonic = np.zeros(len(harmonics_int)) self.harmonics_vals = np.zeros(len(harmonics_int)) - self.harmonics_vals[12]= 1.0 #setting 60th harmonic to amplitude of the signal + # setting 60th harmonic to amplitude of the signal + self.harmonics_vals[12] = 1.0 + + # harmonic groups should be equal to every 12th harmonic in this idealized example + self.harmonic_groups = self.harmonics_vals[0::12] + self.thcd = ( + 0.0 # Since this is an idealized sin wave, there should be no distortion + ) - self.harmonic_groups = self.harmonics_vals[0::12] #harmonic groups should be equal to every 12th harmonic in this idealized example - self.thcd = 0.0 #Since this is an idealized 
sin wave, there should be no distortion - self.signal = np.sin(2 * np.pi * self.frequency * self.samples) - - self.current_data = [[1,2,3],[4,5,6],[7,8,9],[10,11,12]] - self.voltage_data = [[1,5,9],[2,6,10],[3,7,11],[4,8,12]] + + self.current_data = np.asarray([[1, 2, 3], [4, 5, 6], [7, 8, 9], [10, 11, 12]]) + self.voltage_data = np.asarray([[1, 5, 9], [2, 6, 10], [3, 7, 11], [4, 8, 12]]) @classmethod def tearDownClass(self): pass - def test_harmonics_sine_wave(self): - + def test_harmonics_sine_wave_pandas(self): current = pd.Series(self.signal, index=self.samples) harmonics = power.quality.harmonics(current, 1000, self.frequency) - for i,j in zip(harmonics.values, self.harmonics_vals): - self.assertAlmostEqual(i[0], j,1) + for i, j in zip(harmonics["data"].values, self.harmonics_vals): + self.assertAlmostEqual(i, j, 1) - def test_harmonic_subgroup_sine_wave(self): - current = pd.Series(self.signal, index=self.samples) - harmonics = pd.DataFrame(self.harmonics_vals, - index= self.harmonics_int) - hsg = power.quality.harmonic_subgroups(harmonics,self.frequency) - for i,j in zip(hsg.values,self.harmonic_groups): - self.assertAlmostEqual(i[0], j,1) + def test_harmonics_sine_wave_xarray(self): + current = xr.DataArray( + data=self.signal, dims="index", coords={"index": self.samples} + ) + harmonics = power.quality.harmonics(current, 1000, self.frequency) - def test_TCHD_sine_wave(self): - current = pd.Series(self.signal, index=self.samples) - harmonics = pd.DataFrame(self.harmonics_vals, - index= self.harmonics_int) - hsg = power.quality.harmonic_subgroups(harmonics,self.frequency) + for i, j in zip(harmonics["data"].values, self.harmonics_vals): + self.assertAlmostEqual(i, j, 1) - TCHD = power.quality.total_harmonic_current_distortion(hsg,18.8) # had to just put a random rated current in here - self.assertAlmostEqual(TCHD.values[0],self.thcd) + def test_harmonic_subgroup_sine_wave_pandas(self): + harmonics = pd.DataFrame(self.harmonics_vals, index=self.harmonics_int) 
+ hsg = power.quality.harmonic_subgroups(harmonics, self.frequency) - def test_interharmonics_sine_wave(self): - current = pd.Series(self.signal, index=self.samples) - harmonics = pd.DataFrame(self.harmonics_vals, - index= self.harmonics_int) + for i, j in zip(hsg.values, self.harmonic_groups): + self.assertAlmostEqual(i[0], j, 1) + + def test_harmonic_subgroup_sine_wave_xarray(self): + harmonics = xr.Dataset( + data_vars={"harmonics": (["index"], self.harmonics_vals)}, + coords={"index": self.harmonics_int}, + ) + hsg = power.quality.harmonic_subgroups(harmonics, self.frequency) + + for i, j in zip(hsg.values, self.harmonic_groups): + self.assertAlmostEqual(i[0], j, 1) + + def test_TCHD_sine_wave_pandas(self): + harmonics = pd.DataFrame(self.harmonics_vals, index=self.harmonics_int) + hsg = power.quality.harmonic_subgroups(harmonics, self.frequency) + TCHD = power.quality.total_harmonic_current_distortion(hsg) + + self.assertAlmostEqual(TCHD.values[0], self.thcd) + + def test_TCHD_sine_wave_xarray(self): + harmonics = xr.Dataset( + data_vars={"harmonics": (["index"], self.harmonics_vals)}, + coords={"index": self.harmonics_int}, + ) + hsg = power.quality.harmonic_subgroups(harmonics, self.frequency) + TCHD = power.quality.total_harmonic_current_distortion(hsg) + + self.assertAlmostEqual(TCHD.values[0], self.thcd) + + def test_interharmonics_sine_wave_pandas(self): + harmonics = pd.DataFrame(self.harmonics_vals, index=self.harmonics_int) + inter_harmonics = power.quality.interharmonics(harmonics, self.frequency) + + for i, j in zip(inter_harmonics.values, self.interharmonic): + self.assertAlmostEqual(i[0], j, 1) + + def test_interharmonics_sine_wave_xarray(self): + harmonics = xr.Dataset( + data_vars={"harmonics": (["index"], self.harmonics_vals)}, + coords={"index": self.harmonics_int}, + ) + inter_harmonics = power.quality.interharmonics(harmonics, self.frequency) - inter_harmonics = power.quality.interharmonics(harmonics,self.frequency) + for i, j in 
zip(inter_harmonics.values, self.interharmonic): + self.assertAlmostEqual(i[0], j, 1) - for i,j in zip(inter_harmonics.values, self.interharmonic): - self.assertAlmostEqual(i[0], j,1) + def test_instfreq_pandas(self): + um = pd.Series(self.signal, index=self.samples) + freq = power.characteristics.instantaneous_frequency(um) + for i in freq.values: + self.assertAlmostEqual(i[0], self.frequency, 1) + + def test_instfreq_xarray(self): + um = pd.Series(self.signal, index=self.samples) + um = um.to_xarray() - def test_instfreq(self): - um = pd.Series(self.signal,index = self.samples) - freq = power.characteristics.instantaneous_frequency(um) for i in freq.values: - self.assertAlmostEqual(i[0], self.frequency,1) + self.assertAlmostEqual(i[0], self.frequency, 1) + + def test_dc_power_pandas(self): + current = pd.DataFrame(self.current_data, columns=["A1", "A2", "A3"]) + voltage = pd.DataFrame(self.voltage_data, columns=["V1", "V2", "V3"]) + + P = power.characteristics.dc_power(voltage, current) + P_test = (self.current_data * self.voltage_data).sum() + self.assertEqual(P.sum()["Gross"], P_test) + + P = power.characteristics.dc_power(voltage["V1"], current["A1"]) + P_test = (self.current_data[:, 0] * self.voltage_data[:, 0]).sum() + self.assertEqual(P.sum()["Gross"], P_test) + + def test_dc_power_xarray(self): + current = pd.DataFrame(self.current_data, columns=["A1", "A2", "A3"]) + voltage = pd.DataFrame(self.voltage_data, columns=["V1", "V2", "V3"]) + current = current.to_xarray() + voltage = voltage.to_xarray() - def test_dc_power_DataFrame(self): - current = pd.DataFrame(self.current_data, columns=['A1', 'A2', 'A3']) - voltage = pd.DataFrame(self.voltage_data, columns=['V1', 'V2', 'V3']) P = power.characteristics.dc_power(voltage, current) - self.assertEqual(P.sum()['Gross'], (voltage.values * current.values).sum()) - - def test_dc_power_Series(self): - current = pd.DataFrame(self.current_data, columns=['A1', 'A2', 'A3']) - voltage = pd.DataFrame(self.voltage_data, 
columns=['V1', 'V2', 'V3']) - P = power.characteristics.dc_power(voltage['V1'], current['A1']) - self.assertEqual(P.sum()['Gross'], sum( voltage['V1'] * current['A1'])) - - def test_ac_power_three_phase(self): - current = pd.DataFrame(self.current_data, columns=['A1', 'A2', 'A3']) - voltage = pd.DataFrame(self.voltage_data, columns=['V1', 'V2', 'V3']) - - P1 = power.characteristics.ac_power_three_phase( voltage, current, 1, False) + P_test = (self.current_data * self.voltage_data).sum() + self.assertEqual(P.sum()["Gross"], P_test) + + P = power.characteristics.dc_power(voltage["V1"], current["A1"]) + P_test = (self.current_data[:, 0] * self.voltage_data[:, 0]).sum() + self.assertEqual(P.sum()["Gross"], P_test) + + def test_ac_power_three_phase_pandas(self): + current = pd.DataFrame(self.current_data, columns=["A1", "A2", "A3"]) + voltage = pd.DataFrame(self.voltage_data, columns=["V1", "V2", "V3"]) + + P1 = power.characteristics.ac_power_three_phase(voltage, current, 1, False) P1b = power.characteristics.ac_power_three_phase(voltage, current, 0.5, False) - P2 = power.characteristics.ac_power_three_phase( voltage, current,1, True) + P2 = power.characteristics.ac_power_three_phase(voltage, current, 1, True) P2b = power.characteristics.ac_power_three_phase(voltage, current, 0.5, True) - - self.assertEqual(P1.sum()[0], 584) - self.assertEqual(P1b.sum()[0], 584/2) - self.assertAlmostEqual(P2.sum()[0], 1011.518, 2) - self.assertAlmostEqual(P2b.sum()[0], 1011.518/2, 2) - -if __name__ == '__main__': - unittest.main() - + + P_test = (self.current_data * self.voltage_data).sum() + self.assertEqual(P1.sum().iloc[0], P_test) + self.assertEqual(P1b.sum().iloc[0], P_test / 2) + self.assertAlmostEqual(P2.sum().iloc[0], P_test * np.sqrt(3), 2) + self.assertAlmostEqual(P2b.sum().iloc[0], P_test * np.sqrt(3) / 2, 2) + + def test_ac_power_three_phase_xarray(self): + current = pd.DataFrame(self.current_data, columns=["A1", "A2", "A3"]) + voltage = pd.DataFrame(self.voltage_data, 
columns=["V1", "V2", "V3"]) + current = current.to_xarray() + voltage = voltage.to_xarray() + + P1 = power.characteristics.ac_power_three_phase(voltage, current, 1, False) + P1b = power.characteristics.ac_power_three_phase(voltage, current, 0.5, False) + P2 = power.characteristics.ac_power_three_phase(voltage, current, 1, True) + P2b = power.characteristics.ac_power_three_phase(voltage, current, 0.5, True) + + P_test = (self.current_data * self.voltage_data).sum() + self.assertEqual(P1.sum().iloc[0], P_test) + self.assertEqual(P1b.sum().iloc[0], P_test / 2) + self.assertAlmostEqual(P2.sum().iloc[0], P_test * np.sqrt(3), 2) + self.assertAlmostEqual(P2b.sum().iloc[0], P_test * np.sqrt(3) / 2, 2) + + +if __name__ == "__main__": + unittest.main() diff --git a/mhkit/tests/river/test_io.py b/mhkit/tests/river/test_io.py deleted file mode 100644 index 714711ff1..000000000 --- a/mhkit/tests/river/test_io.py +++ /dev/null @@ -1,227 +0,0 @@ -from os.path import abspath, dirname, join, isfile, normpath, relpath -from numpy.testing import assert_array_almost_equal -from pandas.testing import assert_frame_equal -import scipy.interpolate as interp -import matplotlib.pylab as plt -import mhkit.river as river -import pandas as pd -import numpy as np -import unittest -import netCDF4 -import os - - -testdir = dirname(abspath(__file__)) -plotdir = join(testdir, 'plots') -isdir = os.path.isdir(plotdir) -if not isdir: os.mkdir(plotdir) -datadir = normpath(join(testdir,'..','..','..','examples','data','river')) - - -class TestIO(unittest.TestCase): - - @classmethod - def setUpClass(self): - d3ddatadir = normpath(join(datadir,'d3d')) - - filename= 'turbineTest_map.nc' - self.d3d_flume_data = netCDF4.Dataset(join(d3ddatadir,filename)) - - @classmethod - def tearDownClass(self): - pass - - def test_load_usgs_data_instantaneous(self): - file_name = join(datadir, 'USGS_08313000_Jan2019_instantaneous.json') - data = river.io.usgs.read_usgs_file(file_name) - - self.assertEqual(data.columns, 
['Discharge, cubic feet per second']) - self.assertEqual(data.shape, (2972, 1)) # 4 data points are missing - - def test_load_usgs_data_daily(self): - file_name = join(datadir, 'USGS_08313000_Jan2019_daily.json') - data = river.io.usgs.read_usgs_file(file_name) - - expected_index = pd.date_range('2019-01-01', '2019-01-31', freq='D') - self.assertEqual(data.columns, ['Discharge, cubic feet per second']) - self.assertEqual((data.index == expected_index.tz_localize('UTC')).all(), True) - self.assertEqual(data.shape, (31, 1)) - - - def test_request_usgs_data_daily(self): - data=river.io.usgs.request_usgs_data(station="15515500", - parameter='00060', - start_date='2009-08-01', - end_date='2009-08-10', - data_type='Daily') - self.assertEqual(data.columns, ['Discharge, cubic feet per second']) - self.assertEqual(data.shape, (10, 1)) - - - def test_request_usgs_data_instant(self): - data=river.io.usgs.request_usgs_data(station="15515500", - parameter='00060', - start_date='2009-08-01', - end_date='2009-08-10', - data_type='Instantaneous') - self.assertEqual(data.columns, ['Discharge, cubic feet per second']) - # Every 15 minutes or 4 times per hour - self.assertEqual(data.shape, (10*24*4, 1)) - - def test_get_all_time(self): - data= self.d3d_flume_data - seconds_run = river.io.d3d.get_all_time(data) - seconds_run_expected= np.ndarray(shape=(5,), buffer= np.array([0, 60, 120, 180, 240]), dtype=int) - np.testing.assert_array_equal(seconds_run, seconds_run_expected) - - def test_convert_time(self): - data= self.d3d_flume_data - time_index = 2 - seconds_run = river.io.d3d.index_to_seconds(data, time_index = time_index) - seconds_run_expected = 120 - self.assertEqual(seconds_run, seconds_run_expected) - seconds_run = 60 - time_index= river.io.d3d.seconds_to_index(data, seconds_run = seconds_run) - time_index_expected = 1 - self.assertEqual(time_index, time_index_expected) - seconds_run = 62 - time_index= river.io.d3d.seconds_to_index(data, seconds_run = seconds_run) - 
time_index_expected = 1 - output_expected= f'ERROR: invalid seconds_run. Closest seconds_run found {time_index_expected}' - self.assertWarns(UserWarning) - - def test_layer_data(self): - data=self.d3d_flume_data - variable = ['ucx', 's1'] - for var in variable: - layer=2 - time_index= 3 - layer_data= river.io.d3d.get_layer_data(data, var, layer, time_index) - layer_compare = 2 - time_index_compare= 4 - layer_data_expected= river.io.d3d.get_layer_data(data, - var, layer_compare, - time_index_compare) - - assert_array_almost_equal(layer_data.x,layer_data_expected.x, decimal = 2) - assert_array_almost_equal(layer_data.y,layer_data_expected.y, decimal = 2) - assert_array_almost_equal(layer_data.v,layer_data_expected.v, decimal= 2) - - - - def test_create_points(self): - x=np.linspace(1, 3, num= 3) - y=np.linspace(1, 3, num= 3) - z=1 - points= river.io.d3d.create_points(x,y,z) - x=[1,2,3,1,2,3,1,2,3] - y=[1,1,1,2,2,2,3,3,3] - z=[1,1,1,1,1,1,1,1,1] - points_array= np.array([ [x_i, y_i, z_i] for x_i, y_i, z_i in zip(x, y, z)]) - points_expected= pd.DataFrame(points_array, columns=('x','y','z')) - assert_array_almost_equal(points, points_expected,decimal = 2) - - x=np.linspace(1, 3, num= 3) - y=2 - z=1 - points= river.io.d3d.create_points(x,y,z) - x=[1,2,3] - y=[2,2,2] - z=[1,1,1] - points_array= np.array([ [x_i, y_i, z_i] for x_i, y_i, z_i in zip(x, y, z)]) - points_expected= pd.DataFrame(points_array, columns=('x','y','z')) - assert_array_almost_equal(points, points_expected,decimal = 2) - - x=3 - y=2 - z=1 - points= river.io.d3d.create_points(x,y,z) - output_expected='Can provide at most two arrays' - self.assertWarns(UserWarning) - - def test_variable_interpolation(self): - data=self.d3d_flume_data - variables= ['ucx','turkin1'] - transformes_data= river.io.d3d.variable_interpolation(data, variables, points= 'faces', edges='nearest') - self.assertEqual(np.size(transformes_data['ucx']), np.size(transformes_data['turkin1'])) - transformes_data= 
river.io.d3d.variable_interpolation(data, variables, points= 'cells', edges='nearest') - self.assertEqual(np.size(transformes_data['ucx']), np.size(transformes_data['turkin1'])) - x=np.linspace(1, 3, num= 3) - y=np.linspace(1, 3, num= 3) - waterdepth=1 - points= river.io.d3d.create_points(x,y,waterdepth) - transformes_data= river.io.d3d.variable_interpolation(data, variables, points= points) - self.assertEqual(np.size(transformes_data['ucx']), np.size(transformes_data['turkin1'])) - - def test_get_all_data_points(self): - data=self.d3d_flume_data - variable= 'ucx' - time_step= 3 - output = river.io.d3d.get_all_data_points(data, variable, time_step) - size_output = np.size(output) - time_step_compair=4 - output_expected= river.io.d3d.get_all_data_points(data, variable, time_step_compair) - size_output_expected= np.size(output_expected) - self.assertEqual(size_output, size_output_expected) - - - def test_unorm(self): - x=np.linspace(1, 3, num= 3) - y=np.linspace(1, 3, num= 3) - z=np.linspace(1, 3, num= 3) - unorm = river.io.d3d.unorm(x,y,z) - unorm_expected= [np.sqrt(1**2+1**2+1**2),np.sqrt(2**2+2**2+2**2), np.sqrt(3**2+3**2+3**2)] - assert_array_almost_equal(unorm, unorm_expected, decimal = 2) - - def test_turbulent_intensity(self): - data=self.d3d_flume_data - time_index= -1 - x_test=np.linspace(1, 17, num= 10) - y_test=np.linspace(3, 3, num= 10) - waterdepth_test=np.linspace(1, 1, num= 10) - - test_points = np.array([ [x, y, waterdepth] for x, y, waterdepth in zip(x_test, y_test, waterdepth_test)]) - points= pd.DataFrame(test_points, columns=['x','y','waterdepth']) - - TI= river.io.d3d.turbulent_intensity(data, points, time_index) - - TI_vars= ['turkin1', 'ucx', 'ucy', 'ucz'] - TI_data_raw = {} - for var in TI_vars: - #get all data - var_data_df = river.io.d3d.get_all_data_points(data, var,time_index) - TI_data_raw[var] = var_data_df - TI_data= points.copy(deep=True) - - for var in TI_vars: - TI_data[var] = interp.griddata(TI_data_raw[var][['x','y','waterdepth']], 
- TI_data_raw[var][var], points[['x','y','waterdepth']]) - idx= np.where(np.isnan(TI_data[var])) - - if len(idx[0]): - for i in idx[0]: - TI_data[var][i]= interp.griddata(TI_data_raw[var][['x','y','waterdepth']], - TI_data_raw[var][var], - [points['x'][i],points['y'][i], points['waterdepth'][i]], - method='nearest') - - u_mag=river.io.d3d.unorm(TI_data['ucx'],TI_data['ucy'], TI_data['ucz']) - turbulent_intensity_expected= (np.sqrt(2/3*TI_data['turkin1'])/u_mag)*100 - - - assert_array_almost_equal(TI.turbulent_intensity, turbulent_intensity_expected, decimal = 2) - - TI = river.io.d3d.turbulent_intensity(data, points='faces') - TI_size = np.size(TI['turbulent_intensity']) - turkin1= river.io.d3d.get_all_data_points(data, 'turkin1',time_index) - turkin1_size= np.size(turkin1['turkin1']) - self.assertEqual(TI_size, turkin1_size) - - TI = river.io.d3d.turbulent_intensity(data, points='cells') - TI_size = np.size(TI['turbulent_intensity']) - ucx= river.io.d3d.get_all_data_points(data, 'ucx',time_index) - ucx_size= np.size(ucx['ucx']) - self.assertEqual(TI_size, ucx_size) -if __name__ == '__main__': - unittest.main() - diff --git a/mhkit/tests/river/test_io_d3d.py b/mhkit/tests/river/test_io_d3d.py new file mode 100644 index 000000000..f41ba4962 --- /dev/null +++ b/mhkit/tests/river/test_io_d3d.py @@ -0,0 +1,302 @@ +from os.path import abspath, dirname, join, normpath +from numpy.testing import assert_array_almost_equal +import scipy.interpolate as interp +import mhkit.river as river +import mhkit.tidal as tidal +import pandas as pd +import xarray as xr +import numpy as np +import unittest +import netCDF4 +import os + + +testdir = dirname(abspath(__file__)) +plotdir = join(testdir, "plots") +isdir = os.path.isdir(plotdir) +if not isdir: + os.mkdir(plotdir) +datadir = normpath(join(testdir, "..", "..", "..", "examples", "data", "river")) + + +class TestIO(unittest.TestCase): + @classmethod + def setUpClass(self): + d3ddatadir = normpath(join(datadir, "d3d")) + + filename 
= "turbineTest_map.nc" + self.d3d_flume_data = netCDF4.Dataset(join(d3ddatadir, filename)) + + @classmethod + def tearDownClass(self): + pass + + def test_get_all_time(self): + data = self.d3d_flume_data + seconds_run = river.io.d3d.get_all_time(data) + seconds_run_expected = np.ndarray( + shape=(5,), buffer=np.array([0, 60, 120, 180, 240]), dtype=int + ) + np.testing.assert_array_equal(seconds_run, seconds_run_expected) + + def test_convert_time(self): + data = self.d3d_flume_data + time_index = 2 + seconds_run = river.io.d3d.index_to_seconds(data, time_index=time_index) + seconds_run_expected = 120 + self.assertEqual(seconds_run, seconds_run_expected) + seconds_run = 60 + time_index = river.io.d3d.seconds_to_index(data, seconds_run=seconds_run) + time_index_expected = 1 + self.assertEqual(time_index, time_index_expected) + seconds_run = 62 + time_index = river.io.d3d.seconds_to_index(data, seconds_run=seconds_run) + time_index_expected = 1 + output_expected = f"ERROR: invalid seconds_run. 
Closest seconds_run found {time_index_expected}" + self.assertWarns(UserWarning) + + def test_convert_time_from_tidal(self): + """ + Test the conversion of time from using tidal import of d3d + """ + data = self.d3d_flume_data + time_index = 2 + seconds_run = tidal.io.d3d.index_to_seconds(data, time_index=time_index) + seconds_run_expected = 120 + self.assertEqual(seconds_run, seconds_run_expected) + + def test_layer_data(self): + data = self.d3d_flume_data + variable = ["ucx", "s1"] + for var in variable: + layer = 2 + time_index = 3 + layer_data = river.io.d3d.get_layer_data(data, var, layer, time_index) + layer_compare = 2 + time_index_compare = 4 + layer_data_expected = river.io.d3d.get_layer_data( + data, var, layer_compare, time_index_compare + ) + + assert_array_almost_equal(layer_data.x, layer_data_expected.x, decimal=2) + assert_array_almost_equal(layer_data.y, layer_data_expected.y, decimal=2) + assert_array_almost_equal(layer_data.v, layer_data_expected.v, decimal=2) + + def test_create_points_three_points(self): + """ + Test the scenario where all three inputs (x, y, z) are points. + """ + x, y, z = 1, 2, 3 + + expected = pd.DataFrame([[x, y, z]], columns=["x", "y", "waterdepth"]) + + points = river.io.d3d.create_points(x, y, z) + assert_array_almost_equal(points.values, expected.values, decimal=2) + + def test_create_points_invalid_input(self): + """ + Test scenarios where invalid inputs are provided to the function. + """ + with self.assertRaises(TypeError): + river.io.d3d.create_points("invalid", 2, 3) + + def test_create_points_two_arrays_one_point(self): + """ + Test with two arrays and one point. 
+ """ + result = river.io.d3d.create_points(np.array([1, 2]), np.array([3]), 4) + expected = pd.DataFrame({"x": [1, 2], "y": [3, 3], "waterdepth": [4, 4]}) + pd.testing.assert_frame_equal( + result, + expected, + check_dtype=False, + check_names=False, + check_index_type=False, + ) + + def test_create_points_user_made_two_arrays_one_point(self): + """ + Test the scenario where all three inputs (x, y, z) are created from + points. + """ + x, y, z = np.linspace(1, 3, num=3), np.linspace(1, 3, num=3), 1 + + # Adjust the order of the expected values + expected_data = [ + [i, j, 1] for j in y for i in x + ] # Notice the swapped loop order + expected = pd.DataFrame(expected_data, columns=["x", "y", "waterdepth"]) + + points = river.io.d3d.create_points(x, y, z) + assert_array_almost_equal(points.values, expected.values, decimal=2) + + def test_create_points_mismatched_array_lengths(self): + """ + Test the scenario where x and y are arrays of different lengths. + """ + with self.assertRaises(ValueError): + river.io.d3d.create_points( + np.array([1, 2, 3]), np.array([1, 2]), np.array([3, 4]) + ) + + def test_create_pointsempty_arrays(self): + """ + Test the scenario where provided arrays are empty. + """ + with self.assertRaises(ValueError): + river.io.d3d.create_points([], [], []) + + def test_create_points_mixed_data_types(self): + """ + Test a combination of np.ndarray, pd.Series, and xr.DataArray. + """ + x = np.array([1, 2]) + y = pd.Series([3, 4]) + z = xr.DataArray([5, 6]) + result = river.io.d3d.create_points(x, y, z) + expected = pd.DataFrame( + {"x": [1, 2, 1, 2], "y": [3, 4, 3, 4], "waterdepth": [5, 5, 6, 6]} + ) + + pd.testing.assert_frame_equal( + result, + expected, + check_dtype=False, + check_names=False, + check_index_type=False, + ) + + def test_create_points_array_like_inputs(self): + """ + Test array-like inputs such as lists. 
+ """ + result = river.io.d3d.create_points([1, 2], [3, 4], [5, 6]) + expected = pd.DataFrame( + {"x": [1, 2, 1, 2], "y": [3, 4, 3, 4], "waterdepth": [5, 5, 6, 6]} + ) + + pd.testing.assert_frame_equal( + result, + expected, + check_dtype=False, + check_names=False, + check_index_type=False, + ) + + def test_variable_interpolation(self): + data = self.d3d_flume_data + variables = ["ucx", "turkin1"] + transformes_data = river.io.d3d.variable_interpolation( + data, variables, points="faces", edges="nearest" + ) + self.assertEqual( + np.size(transformes_data["ucx"]), np.size(transformes_data["turkin1"]) + ) + transformes_data = river.io.d3d.variable_interpolation( + data, variables, points="cells", edges="nearest" + ) + self.assertEqual( + np.size(transformes_data["ucx"]), np.size(transformes_data["turkin1"]) + ) + x = np.linspace(1, 3, num=3) + y = np.linspace(1, 3, num=3) + waterdepth = 1 + points = river.io.d3d.create_points(x, y, waterdepth) + transformes_data = river.io.d3d.variable_interpolation( + data, variables, points=points + ) + self.assertEqual( + np.size(transformes_data["ucx"]), np.size(transformes_data["turkin1"]) + ) + + def test_get_all_data_points(self): + data = self.d3d_flume_data + variable = "ucx" + time_step = 3 + output = river.io.d3d.get_all_data_points(data, variable, time_step) + size_output = np.size(output) + time_step_compair = 4 + output_expected = river.io.d3d.get_all_data_points( + data, variable, time_step_compair + ) + size_output_expected = np.size(output_expected) + self.assertEqual(size_output, size_output_expected) + + def test_unorm(self): + x = np.linspace(1, 3, num=3) + y = np.linspace(1, 3, num=3) + z = np.linspace(1, 3, num=3) + unorm = river.io.d3d.unorm(x, y, z) + unorm_expected = [ + np.sqrt(1**2 + 1**2 + 1**2), + np.sqrt(2**2 + 2**2 + 2**2), + np.sqrt(3**2 + 3**2 + 3**2), + ] + assert_array_almost_equal(unorm, unorm_expected, decimal=2) + + def test_turbulent_intensity(self): + data = self.d3d_flume_data + time_index = 
-1 + x_test = np.linspace(1, 17, num=10) + y_test = np.linspace(3, 3, num=10) + waterdepth_test = np.linspace(1, 1, num=10) + + test_points = np.array( + [ + [x, y, waterdepth] + for x, y, waterdepth in zip(x_test, y_test, waterdepth_test) + ] + ) + points = pd.DataFrame(test_points, columns=["x", "y", "waterdepth"]) + + TI = river.io.d3d.turbulent_intensity(data, points, time_index) + + TI_vars = ["turkin1", "ucx", "ucy", "ucz"] + TI_data_raw = {} + for var in TI_vars: + # get all data + var_data_df = river.io.d3d.get_all_data_points(data, var, time_index) + TI_data_raw[var] = var_data_df + TI_data = points.copy(deep=True) + + for var in TI_vars: + TI_data[var] = interp.griddata( + TI_data_raw[var][["x", "y", "waterdepth"]], + TI_data_raw[var][var], + points[["x", "y", "waterdepth"]], + ) + idx = np.where(np.isnan(TI_data[var])) + + if len(idx[0]): + for i in idx[0]: + TI_data[var][i] = interp.griddata( + TI_data_raw[var][["x", "y", "waterdepth"]], + TI_data_raw[var][var], + [points["x"][i], points["y"][i], points["waterdepth"][i]], + method="nearest", + ) + + u_mag = river.io.d3d.unorm(TI_data["ucx"], TI_data["ucy"], TI_data["ucz"]) + turbulent_intensity_expected = ( + np.sqrt(2 / 3 * TI_data["turkin1"]) / u_mag + ) * 100 + + assert_array_almost_equal( + TI.turbulent_intensity, turbulent_intensity_expected, decimal=2 + ) + + TI = river.io.d3d.turbulent_intensity(data, points="faces") + TI_size = np.size(TI["turbulent_intensity"]) + turkin1 = river.io.d3d.get_all_data_points(data, "turkin1", time_index) + turkin1_size = np.size(turkin1["turkin1"]) + self.assertEqual(TI_size, turkin1_size) + + TI = river.io.d3d.turbulent_intensity(data, points="cells") + TI_size = np.size(TI["turbulent_intensity"]) + ucx = river.io.d3d.get_all_data_points(data, "ucx", time_index) + ucx_size = np.size(ucx["ucx"]) + self.assertEqual(TI_size, ucx_size) + + +if __name__ == "__main__": + unittest.main() diff --git a/mhkit/tests/river/test_io_usgs.py b/mhkit/tests/river/test_io_usgs.py 
new file mode 100644 index 000000000..b422bee2c --- /dev/null +++ b/mhkit/tests/river/test_io_usgs.py @@ -0,0 +1,66 @@ +from os.path import abspath, dirname, join, isfile, normpath, relpath +import mhkit.river as river +import pandas as pd +import unittest +import os + + +testdir = dirname(abspath(__file__)) +plotdir = join(testdir, "plots") +isdir = os.path.isdir(plotdir) +if not isdir: + os.mkdir(plotdir) +datadir = normpath(join(testdir, "..", "..", "..", "examples", "data", "river")) + + +class TestIO(unittest.TestCase): + @classmethod + def setUpClass(self): + pass + + @classmethod + def tearDownClass(self): + pass + + def test_load_usgs_data_instantaneous(self): + file_name = join(datadir, "USGS_08313000_Jan2019_instantaneous.json") + data = river.io.usgs.read_usgs_file(file_name) + + self.assertEqual(data.columns, ["Discharge, cubic feet per second"]) + self.assertEqual(data.shape, (2972, 1)) # 4 data points are missing + + def test_load_usgs_data_daily(self): + file_name = join(datadir, "USGS_08313000_Jan2019_daily.json") + data = river.io.usgs.read_usgs_file(file_name) + + expected_index = pd.date_range("2019-01-01", "2019-01-31", freq="D") + self.assertEqual(data.columns, ["Discharge, cubic feet per second"]) + self.assertEqual((data.index == expected_index.tz_localize("UTC")).all(), True) + self.assertEqual(data.shape, (31, 1)) + + def test_request_usgs_data_daily(self): + data = river.io.usgs.request_usgs_data( + station="15515500", + parameter="00060", + start_date="2009-08-01", + end_date="2009-08-10", + data_type="Daily", + ) + self.assertEqual(data.columns, ["Discharge, cubic feet per second"]) + self.assertEqual(data.shape, (10, 1)) + + def test_request_usgs_data_instant(self): + data = river.io.usgs.request_usgs_data( + station="15515500", + parameter="00060", + start_date="2009-08-01", + end_date="2009-08-10", + data_type="Instantaneous", + ) + self.assertEqual(data.columns, ["Discharge, cubic feet per second"]) + # Every 15 minutes or 4 times 
per hour + self.assertEqual(data.shape, (10 * 24 * 4, 1)) + + +if __name__ == "__main__": + unittest.main() diff --git a/mhkit/tests/river/test_performance.py b/mhkit/tests/river/test_performance.py index d1ef596a0..34c1d6147 100644 --- a/mhkit/tests/river/test_performance.py +++ b/mhkit/tests/river/test_performance.py @@ -12,10 +12,11 @@ testdir = dirname(abspath(__file__)) -plotdir = join(testdir, 'plots') +plotdir = join(testdir, "plots") isdir = os.path.isdir(plotdir) -if not isdir: os.mkdir(plotdir) -datadir = normpath(join(testdir,'..','..','..','examples','data','river')) +if not isdir: + os.mkdir(plotdir) +datadir = normpath(join(testdir, "..", "..", "..", "examples", "data", "river")) class TestPerformance(unittest.TestCase): @@ -24,26 +25,26 @@ def setUpClass(self): self.diameter = 1 self.height = 2 self.width = 3 - self.diameters = [1,2,3,4] + self.diameters = [1, 2, 3, 4] @classmethod def tearDownClass(self): pass - + def test_circular(self): - eq, ca = river.performance.circular(self.diameter) + eq, ca = river.performance.circular(self.diameter) self.assertEqual(eq, self.diameter) - self.assertEqual(ca, 0.25*np.pi*self.diameter**2.) + self.assertEqual(ca, 0.25 * np.pi * self.diameter**2.0) def test_ducted(self): - eq, ca =river.performance.ducted(self.diameter) + eq, ca = river.performance.ducted(self.diameter) self.assertEqual(eq, self.diameter) - self.assertEqual(ca, 0.25*np.pi*self.diameter**2.) 
- + self.assertEqual(ca, 0.25 * np.pi * self.diameter**2.0) + def test_rectangular(self): eq, ca = river.performance.rectangular(self.height, self.width) self.assertAlmostEqual(eq, 2.76, places=2) - self.assertAlmostEqual(ca, self.height*self.width, places=2) + self.assertAlmostEqual(ca, self.height * self.width, places=2) def test_multiple_circular(self): eq, ca = river.performance.multiple_circular(self.diameters) @@ -51,30 +52,33 @@ def test_multiple_circular(self): self.assertAlmostEqual(ca, 23.56, places=2) def test_tip_speed_ratio(self): - rotor_speed = [15,16,17,18] # create array of rotor speeds - rotor_diameter = 77 # diameter of rotor for GE 1.5 - inflow_speed = [13,13,13,13] # array of wind speeds - TSR_answer = [4.7,5.0,5.3,5.6] - - TSR = river.performance.tip_speed_ratio(np.asarray(rotor_speed)/60,rotor_diameter,inflow_speed) + rotor_speed = [15, 16, 17, 18] # create array of rotor speeds + rotor_diameter = 77 # diameter of rotor for GE 1.5 + inflow_speed = [13, 13, 13, 13] # array of wind speeds + TSR_answer = [4.7, 5.0, 5.3, 5.6] - for i,j in zip(TSR,TSR_answer): - self.assertAlmostEqual(i,j,delta=0.05) + TSR = river.performance.tip_speed_ratio( + np.asarray(rotor_speed) / 60, rotor_diameter, inflow_speed + ) + + for i, j in zip(TSR, TSR_answer): + self.assertAlmostEqual(i, j, delta=0.05) def test_power_coefficient(self): # data obtained from power performance report of wind turbine - inflow_speed = [4,6,8,10,12,14,16,18,20] - power_out = np.asarray([59,304,742,1200,1400,1482,1497,1497,1511]) + inflow_speed = [4, 6, 8, 10, 12, 14, 16, 18, 20] + power_out = np.asarray([59, 304, 742, 1200, 1400, 1482, 1497, 1497, 1511]) capture_area = 4656.63 rho = 1.225 - Cp_answer = [0.320,0.493,0.508,0.421,0.284,0.189,0.128,0.090,0.066] - - Cp = river.performance.power_coefficient(power_out*1000,inflow_speed,capture_area,rho) + Cp_answer = [0.320, 0.493, 0.508, 0.421, 0.284, 0.189, 0.128, 0.090, 0.066] + + Cp = river.performance.power_coefficient( + power_out * 
1000, inflow_speed, capture_area, rho + ) - for i,j in zip(Cp,Cp_answer): - self.assertAlmostEqual(i,j,places=2) + for i, j in zip(Cp, Cp_answer): + self.assertAlmostEqual(i, j, places=2) - -if __name__ == '__main__': - unittest.main() +if __name__ == "__main__": + unittest.main() diff --git a/mhkit/tests/river/test_resource.py b/mhkit/tests/river/test_resource.py index 5ef4a402a..8b3a73023 100644 --- a/mhkit/tests/river/test_resource.py +++ b/mhkit/tests/river/test_resource.py @@ -1,195 +1,355 @@ -from os.path import abspath, dirname, join, isfile, normpath, relpath -from numpy.testing import assert_array_almost_equal -from pandas.testing import assert_frame_equal -import scipy.interpolate as interp +from os.path import abspath, dirname, join, isfile, normpath import matplotlib.pylab as plt import mhkit.river as river import pandas as pd +import xarray as xr import numpy as np import unittest -import netCDF4 import os testdir = dirname(abspath(__file__)) -plotdir = join(testdir, 'plots') +plotdir = join(testdir, "plots") isdir = os.path.isdir(plotdir) -if not isdir: os.mkdir(plotdir) -datadir = normpath(join(testdir,'..','..','..','examples','data','river')) +if not isdir: + os.mkdir(plotdir) +datadir = normpath(join(testdir, "..", "..", "..", "examples", "data", "river")) class TestResource(unittest.TestCase): - @classmethod def setUpClass(self): - self.data = pd.read_csv(join(datadir, 'tanana_discharge_data.csv'), index_col=0, - parse_dates=True) - self.data.columns = ['Q'] - - self.results = pd.read_csv(join(datadir, 'tanana_test_results.csv'), index_col=0, - parse_dates=True) + self.data = pd.read_csv( + join(datadir, "tanana_discharge_data.csv"), index_col=0, parse_dates=True + ) + self.data.columns = ["Q"] + + self.results = pd.read_csv( + join(datadir, "tanana_test_results.csv"), index_col=0, parse_dates=True + ) @classmethod def tearDownClass(self): pass - def test_Froude_number(self): v = 2 h = 5 Fr = river.resource.Froude_number(v, h) 
self.assertAlmostEqual(Fr, 0.286, places=3) - + + def test_froude_number_v_type_error(self): + v = "invalid_type" # String instead of int/float + h = 5 + with self.assertRaises(TypeError): + river.resource.Froude_number(v, h) + + def test_froude_number_h_type_error(self): + v = 2 + h = "invalid_type" # String instead of int/float + with self.assertRaises(TypeError): + river.resource.Froude_number(v, h) + + def test_froude_number_g_type_error(self): + v = 2 + h = 5 + g = "invalid_type" # String instead of int/float + with self.assertRaises(TypeError): + river.resource.Froude_number(v, h, g) def test_exceedance_probability(self): # Create arbitrary discharge between 0 and 8(N=9) Q = pd.Series(np.arange(9)) # Rank order for non-repeating elements simply adds 1 to each element - #if N=9, max F = 100((max(Q)+1)/10) = 90% - #if N=9, min F = 100((min(Q)+1)/10) = 10% + # if N=9, max F = 100((max(Q)+1)/10) = 90% + # if N=9, min F = 100((min(Q)+1)/10) = 10% + f = river.resource.exceedance_probability(Q) + self.assertEqual(f.min().values, 10.0) + self.assertEqual(f.max().values, 90.0) + + def test_exceedance_probability_xarray(self): + # Create arbitrary discharge between 0 and 8(N=9) + Q = xr.DataArray( + data=np.arange(9), dims="index", coords={"index": np.arange(9)} + ) + # if N=9, max F = 100((max(Q)+1)/10) = 90% + # if N=9, min F = 100((min(Q)+1)/10) = 10% f = river.resource.exceedance_probability(Q) - self.assertEqual(f.min().values , 10. ) - self.assertEqual(f.max().values , 90. 
) + self.assertEqual(f.min().values, 10.0) + self.assertEqual(f.max().values, 90.0) + def test_exceedance_probability_type_error(self): + D = "invalid_type" # String instead of pd.Series or pd.DataFrame + with self.assertRaises(TypeError): + river.resource.exceedance_probability(D) def test_polynomial_fit(self): # Calculate a first order polynomial on an x=y line - p, r2 = river.resource.polynomial_fit(np.arange(8), np.arange(8),1) + p, r2 = river.resource.polynomial_fit(np.arange(8), np.arange(8), 1) # intercept should be 0 - self.assertAlmostEqual(p[0], 0.0, places=2 ) + self.assertAlmostEqual(p[0], 0.0, places=2) # slope should be 1 - self.assertAlmostEqual(p[1], 1.0, places=2 ) + self.assertAlmostEqual(p[1], 1.0, places=2) # r-squared should be perfect - self.assertAlmostEqual(r2, 1.0, places=2 ) + self.assertAlmostEqual(r2, 1.0, places=2) + def test_polynomial_fit_x_type_error(self): + x = "invalid_type" # String instead of numpy array + y = np.array([1, 2, 3]) + n = 1 + with self.assertRaises(TypeError): + river.resource.polynomial_fit(x, y, n) + + def test_polynomial_fit_y_type_error(self): + x = np.array([1, 2, 3]) + y = "invalid_type" # String instead of numpy array + n = 1 + with self.assertRaises(TypeError): + river.resource.polynomial_fit(x, y, n) + + def test_polynomial_fit_n_type_error(self): + x = np.array([1, 2, 3]) + y = np.array([1, 2, 3]) + n = "invalid_type" # String instead of int + with self.assertRaises(TypeError): + river.resource.polynomial_fit(x, y, n) def test_discharge_to_velocity(self): # Create arbitrary discharge between 0 and 8(N=9) Q = pd.Series(np.arange(9)) # Calculate a first order polynomial on an DV_Curve x=y line 10 times greater than the Q values - p, r2 = river.resource.polynomial_fit(np.arange(9), 10*np.arange(9),1) - # Becuase the polynomial line fits perfect we should expect the V to equal 10*Q + p, r2 = river.resource.polynomial_fit(np.arange(9), 10 * np.arange(9), 1) + # Because the polynomial line fits perfect we 
should expect the V to equal 10*Q V = river.resource.discharge_to_velocity(Q, p) - self.assertAlmostEqual(np.sum(10*Q - V['V']), 0.00, places=2 ) - + self.assertAlmostEqual(np.sum(10 * Q - V["V"]), 0.00, places=2) + + def test_discharge_to_velocity_xarray(self): + # Create arbitrary discharge between 0 and 8(N=9) + Q = xr.DataArray( + data=np.arange(9), dims="index", coords={"index": np.arange(9)} + ) + # Calculate a first order polynomial on an DV_Curve x=y line 10 times greater than the Q values + p, r2 = river.resource.polynomial_fit(np.arange(9), 10 * np.arange(9), 1) + # Because the polynomial line fits perfect we should expect the V to equal 10*Q + V = river.resource.discharge_to_velocity(Q, p, to_pandas=False) + self.assertAlmostEqual(np.sum(10 * Q - V["V"]).values, 0.00, places=2) + + def test_discharge_to_velocity_D_type_error(self): + D = "invalid_type" # String instead of pd.Series or pd.DataFrame + polynomial_coefficients = np.poly1d([1, 2]) + with self.assertRaises(TypeError): + river.resource.discharge_to_velocity(D, polynomial_coefficients) + + def test_discharge_to_velocity_polynomial_coefficients_type_error(self): + D = pd.Series([1, 2, 3]) + polynomial_coefficients = "invalid_type" # String instead of np.poly1d + with self.assertRaises(TypeError): + river.resource.discharge_to_velocity(D, polynomial_coefficients) def test_velocity_to_power(self): # Calculate a first order polynomial on an DV_Curve x=y line 10 times greater than the Q values - p, r2 = river.resource.polynomial_fit(np.arange(9), 10*np.arange(9),1) - # Becuase the polynomial line fits perfect we should expect the V to equal 10*Q + p, r2 = river.resource.polynomial_fit(np.arange(9), 10 * np.arange(9), 1) + # Because the polynomial line fits perfect we should expect the V to equal 10*Q V = river.resource.discharge_to_velocity(pd.Series(np.arange(9)), p) # Calculate a first order polynomial on an VP_Curve x=y line 10 times greater than the V values - p2, r22 = 
river.resource.polynomial_fit(np.arange(9), 10*np.arange(9),1) + p2, r22 = river.resource.polynomial_fit(np.arange(9), 10 * np.arange(9), 1) + # Set cut in/out to exclude 1 bin on either end of V range + cut_in = V["V"][1] + cut_out = V["V"].iloc[-2] + # Power should be 10x greater and exclude the ends of V + P = river.resource.velocity_to_power(V["V"], p2, cut_in, cut_out) + # Cut in power zero + self.assertAlmostEqual(P["P"][0], 0.00, places=2) + # Cut out power zero + self.assertAlmostEqual(P["P"].iloc[-1], 0.00, places=2) + # Middle 10x greater than velocity + self.assertAlmostEqual((P["P"][1:-1] - 10 * V["V"][1:-1]).sum(), 0.00, places=2) + + def test_velocity_to_power_xarray(self): + # Calculate a first order polynomial on an DV_Curve x=y line 10 times greater than the Q values + p, r2 = river.resource.polynomial_fit(np.arange(9), 10 * np.arange(9), 1) + # Because the polynomial line fits perfect we should expect the V to equal 10*Q + V = river.resource.discharge_to_velocity( + pd.Series(np.arange(9)), p, dimension="", to_pandas=False + ) + # Calculate a first order polynomial on an VP_Curve x=y line 10 times greater than the V values + p2, r22 = river.resource.polynomial_fit(np.arange(9), 10 * np.arange(9), 1) # Set cut in/out to exclude 1 bin on either end of V range - cut_in = V['V'][1] - cut_out = V['V'].iloc[-2] + cut_in = V["V"].values[1] + cut_out = V["V"].values[-2] # Power should be 10x greater and exclude the ends of V - P = river.resource.velocity_to_power(V['V'], p2, cut_in, cut_out) - #Cut in power zero - self.assertAlmostEqual(P['P'][0], 0.00, places=2 ) - #Cut out power zero - self.assertAlmostEqual(P['P'].iloc[-1], 0.00, places=2 ) + P = river.resource.velocity_to_power( + V["V"], p2, cut_in, cut_out, to_pandas=False + ) + # Cut in power zero + self.assertAlmostEqual(P["P"][0], 0.00, places=2) + # Cut out power zero + self.assertAlmostEqual(P["P"][-1], 0.00, places=2) # Middle 10x greater than velocity - self.assertAlmostEqual((P['P'][1:-1] - 
10*V['V'][1:-1] ).sum(), 0.00, places=2 ) + self.assertAlmostEqual( + (P["P"][1:-1] - 10 * V["V"][1:-1]).sum().values, 0.00, places=2 + ) + + def test_velocity_to_power_V_type_error(self): + V = "invalid_type" # String instead of pd.Series or pd.DataFrame + polynomial_coefficients = np.poly1d([1, 2]) + cut_in = 1 + cut_out = 5 + with self.assertRaises(TypeError): + river.resource.velocity_to_power( + V, polynomial_coefficients, cut_in, cut_out + ) + + def test_velocity_to_power_polynomial_coefficients_type_error(self): + V = pd.Series([1, 2, 3]) + polynomial_coefficients = "invalid_type" # String instead of np.poly1d + cut_in = 1 + cut_out = 5 + with self.assertRaises(TypeError): + river.resource.velocity_to_power( + V, polynomial_coefficients, cut_in, cut_out + ) + def test_velocity_to_power_cut_in_type_error(self): + V = pd.Series([1, 2, 3]) + polynomial_coefficients = np.poly1d([1, 2]) + cut_in = "invalid_type" # String instead of int/float + cut_out = 5 + with self.assertRaises(TypeError): + river.resource.velocity_to_power( + V, polynomial_coefficients, cut_in, cut_out + ) + + def test_velocity_to_power_cut_out_type_error(self): + V = pd.Series([1, 2, 3]) + polynomial_coefficients = np.poly1d([1, 2]) + cut_in = 1 + cut_out = "invalid_type" # String instead of int/float + with self.assertRaises(TypeError): + river.resource.velocity_to_power( + V, polynomial_coefficients, cut_in, cut_out + ) def test_energy_produced(self): - # If power is always X then energy produced with be x*seconds - X=1 - seconds=1 - P = pd.Series(X*np.ones(10) ) + # If power is always X then energy produced with be x*seconds + X = 1 + seconds = 1 + P = pd.Series(X * np.ones(10)) EP = river.resource.energy_produced(P, seconds) - self.assertAlmostEqual(EP, X*seconds, places=1 ) + self.assertAlmostEqual(EP, X * seconds, places=1) # for a normal distribution of Power EP = mean *seconds - mu=5 - sigma=1 + mu = 5 + sigma = 1 power_dist = pd.Series(np.random.normal(mu, sigma, 10000)) EP2 = 
river.resource.energy_produced(power_dist, seconds) -# import ipdb; ipdb.set_trace() - self.assertAlmostEqual(EP2, mu*seconds, places=1 ) + self.assertAlmostEqual(EP2, mu * seconds, places=1) + + def test_energy_produced_xarray(self): + # If power is always X then energy produced with be x*seconds + X = 1 + seconds = 1 + P = xr.DataArray(data=X * np.ones(10)) + EP = river.resource.energy_produced(P, seconds) + self.assertAlmostEqual(EP, X * seconds, places=1) + + # for a normal distribution of Power EP = mean *seconds + mu = 5 + sigma = 1 + power_dist = xr.DataArray(data=np.random.normal(mu, sigma, 10000)) + EP2 = river.resource.energy_produced(power_dist, seconds) + self.assertAlmostEqual(EP2, mu * seconds, places=1) + def test_energy_produced_P_type_error(self): + P = "invalid_type" # String instead of pd.Series or pd.DataFrame + seconds = 3600 + with self.assertRaises(TypeError): + river.resource.energy_produced(P, seconds) + + def test_energy_produced_seconds_type_error(self): + P = pd.Series([100, 200, 300]) + seconds = "invalid_type" # String instead of int/float + with self.assertRaises(TypeError): + river.resource.energy_produced(P, seconds) def test_plot_flow_duration_curve(self): - filename = abspath(join(plotdir, 'river_plot_flow_duration_curve.png')) + filename = abspath(join(plotdir, "river_plot_flow_duration_curve.png")) if isfile(filename): os.remove(filename) - + f = river.resource.exceedance_probability(self.data.Q) plt.figure() - river.graphics.plot_flow_duration_curve(self.data['Q'], f['F']) - plt.savefig(filename, format='png') + river.graphics.plot_flow_duration_curve(self.data["Q"], f["F"]) + plt.savefig(filename, format="png") plt.close() - + self.assertTrue(isfile(filename)) - def test_plot_power_duration_curve(self): - filename = abspath(join(plotdir, 'river_plot_power_duration_curve.png')) + filename = abspath(join(plotdir, "river_plot_power_duration_curve.png")) if isfile(filename): os.remove(filename) - + f = 
river.resource.exceedance_probability(self.data.Q) plt.figure() - river.graphics.plot_flow_duration_curve(self.results['P_control'], f['F']) - plt.savefig(filename, format='png') + river.graphics.plot_flow_duration_curve(self.results["P_control"], f["F"]) + plt.savefig(filename, format="png") plt.close() - + self.assertTrue(isfile(filename)) - def test_plot_velocity_duration_curve(self): - filename = abspath(join(plotdir, 'river_plot_velocity_duration_curve.png')) + filename = abspath(join(plotdir, "river_plot_velocity_duration_curve.png")) if isfile(filename): os.remove(filename) - + f = river.resource.exceedance_probability(self.data.Q) plt.figure() - river.graphics.plot_velocity_duration_curve(self.results['V_control'], f['F']) - plt.savefig(filename, format='png') + river.graphics.plot_velocity_duration_curve(self.results["V_control"], f["F"]) + plt.savefig(filename, format="png") plt.close() - + self.assertTrue(isfile(filename)) - def test_plot_discharge_timeseries(self): - filename = abspath(join(plotdir, 'river_plot_discharge_timeseries.png')) - if isfile(filename): os.remove(filename) - + filename = abspath(join(plotdir, "river_plot_discharge_timeseries.png")) + if isfile(filename): + os.remove(filename) + plt.figure() - river.graphics.plot_discharge_timeseries(self.data['Q']) - plt.savefig(filename, format='png') + river.graphics.plot_discharge_timeseries(self.data["Q"]) + plt.savefig(filename, format="png") plt.close() - + self.assertTrue(isfile(filename)) - def test_plot_discharge_vs_velocity(self): - filename = abspath(join(plotdir, 'river_plot_discharge_vs_velocity.png')) + filename = abspath(join(plotdir, "river_plot_discharge_vs_velocity.png")) if isfile(filename): os.remove(filename) - + plt.figure() - river.graphics.plot_discharge_vs_velocity(self.data['Q'], self.results['V_control']) - plt.savefig(filename, format='png') + river.graphics.plot_discharge_vs_velocity( + self.data["Q"], self.results["V_control"] + ) + plt.savefig(filename, 
format="png") plt.close() - + self.assertTrue(isfile(filename)) - def test_plot_velocity_vs_power(self): - filename = abspath(join(plotdir, 'river_plot_velocity_vs_power.png')) + filename = abspath(join(plotdir, "river_plot_velocity_vs_power.png")) if isfile(filename): os.remove(filename) - + plt.figure() - river.graphics.plot_velocity_vs_power(self.results['V_control'], self.results['P_control']) - plt.savefig(filename, format='png') + river.graphics.plot_velocity_vs_power( + self.results["V_control"], self.results["P_control"] + ) + plt.savefig(filename, format="png") plt.close() - + self.assertTrue(isfile(filename)) - - -if __name__ == '__main__': - unittest.main() +if __name__ == "__main__": + unittest.main() diff --git a/mhkit/tests/tidal/test_io.py b/mhkit/tests/tidal/test_io.py index fa09db656..6993be815 100644 --- a/mhkit/tests/tidal/test_io.py +++ b/mhkit/tests/tidal/test_io.py @@ -12,6 +12,7 @@ - Requesting NOAA data with invalid date format - Requesting NOAA data with the end date before the start date """ + from os.path import abspath, dirname, join, normpath, relpath import unittest import os @@ -22,15 +23,14 @@ testdir = dirname(abspath(__file__)) -plotdir = join(testdir, 'plots') +plotdir = join(testdir, "plots") isdir = os.path.isdir(plotdir) if not isdir: os.mkdir(plotdir) -datadir = normpath(join(testdir, relpath('../../../examples/data/tidal'))) +datadir = normpath(join(testdir, relpath("../../../examples/data/tidal"))) class TestIO(unittest.TestCase): - @classmethod def setUpClass(self): pass @@ -41,46 +41,79 @@ def tearDownClass(self): def test_load_noaa_data(self): """ - Test that the read_noaa_json function reads data from a + Test that the read_noaa_json function reads data from a JSON file and returns a DataFrame and metadata with the correct shape and columns. 
""" - file_name = join(datadir, 's08010.json') + file_name = join(datadir, "s08010.json") data, metadata = tidal.io.noaa.read_noaa_json(file_name) - self.assertTrue(np.all(data.columns == ['s', 'd', 'b'])) + self.assertTrue(np.all(data.columns == ["s", "d", "b"])) self.assertEqual(data.shape, (18890, 3)) + self.assertEqual(metadata["id"], "s08010") + + def test_load_noaa_data_xarray(self): + """ + Test that the read_noaa_json function reads data from a + JSON file and returns a DataFrame and metadata with the + correct shape and columns. + """ + file_name = join(datadir, "s08010.json") + data = tidal.io.noaa.read_noaa_json(file_name, to_pandas=False) + self.assertTrue(np.all(list(data.variables) == ["index", "s", "d", "b"])) + self.assertEqual(len(data["index"]), 18890) + self.assertEqual(data.attrs["id"], "s08010") def test_request_noaa_data_basic(self): """ Test the request_noaa_data function with basic input parameters - and verify that the returned DataFrame and metadata have the + and verify that the returned DataFrame and metadata have the correct shape and columns. """ data, metadata = tidal.io.noaa.request_noaa_data( - station='s08010', - parameter='currents', - start_date='20180101', - end_date='20180102', + station="s08010", + parameter="currents", + start_date="20180101", + end_date="20180102", proxy=None, - write_json=None + write_json=None, ) - self.assertTrue(np.all(data.columns == ['s', 'd', 'b'])) + self.assertTrue(np.all(data.columns == ["s", "d", "b"])) self.assertEqual(data.shape, (183, 3)) + self.assertEqual(metadata["id"], "s08010") + + def test_request_noaa_data_basic_xarray(self): + """ + Test the request_noaa_data function with basic input parameters + and verify that the returned DataFrame and metadata have the + correct shape and columns. 
+ """ + data = tidal.io.noaa.request_noaa_data( + station="s08010", + parameter="currents", + start_date="20180101", + end_date="20180102", + proxy=None, + write_json=None, + to_pandas=False, + ) + self.assertTrue(np.all(list(data.variables) == ["index", "s", "d", "b"])) + self.assertEqual(len(data["index"]), 183) + self.assertEqual(data.attrs["id"], "s08010") def test_request_noaa_data_write_json(self): """ Test the request_noaa_data function with the write_json parameter - and verify that the returned JSON file has the correct structure + and verify that the returned JSON file has the correct structure and can be loaded back into a dictionary. """ - test_json_file = 'test_noaa_data.json' - data, metadata = tidal.io.noaa.request_noaa_data( - station='s08010', - parameter='currents', - start_date='20180101', - end_date='20180102', + test_json_file = "test_noaa_data.json" + _, _ = tidal.io.noaa.request_noaa_data( + station="s08010", + parameter="currents", + start_date="20180101", + end_date="20180102", proxy=None, - write_json=test_json_file + write_json=test_json_file, ) self.assertTrue(os.path.isfile(test_json_file)) @@ -89,10 +122,10 @@ def test_request_noaa_data_write_json(self): os.remove(test_json_file) # Clean up the test JSON file - self.assertIn('metadata', loaded_data) - self.assertIn('s', loaded_data) - self.assertIn('d', loaded_data) - self.assertIn('b', loaded_data) + self.assertIn("metadata", loaded_data) + self.assertIn("s", loaded_data["columns"]) + self.assertIn("d", loaded_data["columns"]) + self.assertIn("b", loaded_data["columns"]) def test_request_noaa_data_invalid_dates(self): """ @@ -101,29 +134,29 @@ def test_request_noaa_data_invalid_dates(self): """ with self.assertRaises(ValueError): tidal.io.noaa.request_noaa_data( - station='s08010', - parameter='currents', - start_date='2018-01-01', # Invalid date format - end_date='20180102', + station="s08010", + parameter="currents", + start_date="2018-01-01", # Invalid date format + 
end_date="20180102", proxy=None, - write_json=None + write_json=None, ) def test_request_noaa_data_end_before_start(self): """ - Test the request_noaa_data function with the end date before + Test the request_noaa_data function with the end date before the start date and verify that it raises a ValueError. """ with self.assertRaises(ValueError): tidal.io.noaa.request_noaa_data( - station='s08010', - parameter='currents', - start_date='20180102', - end_date='20180101', # End date before start date + station="s08010", + parameter="currents", + start_date="20180102", + end_date="20180101", # End date before start date proxy=None, - write_json=None + write_json=None, ) -if __name__ == '__main__': +if __name__ == "__main__": unittest.main() diff --git a/mhkit/tests/tidal/test_performance.py b/mhkit/tests/tidal/test_performance.py index b06984e59..43c13b473 100644 --- a/mhkit/tests/tidal/test_performance.py +++ b/mhkit/tests/tidal/test_performance.py @@ -8,110 +8,205 @@ from mhkit.dolfyn import load testdir = dirname(abspath(__file__)) -plotdir = join(testdir, 'plots') +plotdir = join(testdir, "plots") isdir = os.path.isdir(plotdir) -if not isdir: os.mkdir(plotdir) -datadir = normpath(join(testdir,relpath('../../../examples/data/tidal'))) +if not isdir: + os.mkdir(plotdir) +datadir = normpath(join(testdir, relpath("../../../examples/data/tidal"))) class TestResource(unittest.TestCase): - @classmethod def setUpClass(self): - filename = join(datadir, 'adcp.principal.a1.20200815.nc') + filename = join(datadir, "adcp.principal.a1.20200815.nc") self.ds = load(filename) # Emulate power data - self.power = abs(self.ds['vel'][0,10]**3 * 1e5) + self.power = abs(self.ds["vel"][0, 10] ** 3 * 1e5) @classmethod def tearDownClass(self): pass - def test_power_curve(self,): + def test_power_curve(self): df93_circ = performance.power_curve( power=self.power, - velocity=self.ds['vel'].sel(dir='streamwise'), + velocity=self.ds["vel"].sel(dir="streamwise"), hub_height=4.2, - 
doppler_cell_size=0.5, - sampling_frequency=1, + doppler_cell_size=0.5, + sampling_frequency=1, window_avg_time=600, - turbine_profile='circular', + turbine_profile="circular", diameter=3, height=None, - width=None) - test_circ = np.array([1.26250990e+00, - 1.09230978e+00, - 1.89122103e+05, - 1.03223668e+04, - 2.04261423e+05, - 1.72095731e+05]) + width=None, + ) + test_circ = np.array( + [ + 1.26250990e00, + 1.09230978e00, + 1.89122103e05, + 1.03223668e04, + 2.04261423e05, + 1.72095731e05, + ] + ) df93_rect = performance.power_curve( power=self.power, - velocity=self.ds['vel'].sel(dir='streamwise'), + velocity=self.ds["vel"].sel(dir="streamwise"), hub_height=4.2, - doppler_cell_size=0.5, - sampling_frequency=1, + doppler_cell_size=0.5, + sampling_frequency=1, window_avg_time=600, - turbine_profile='rectangular', + turbine_profile="rectangular", diameter=None, height=1, - width=3) - test_rect = np.array([1.15032239e+00, - 3.75747621e-01, - 1.73098627e+05, - 3.04090212e+04, - 2.09073742e+05, - 1.27430552e+05]) - + width=3, + ) + test_rect = np.array( + [ + 1.15032239e00, + 3.75747621e-01, + 1.73098627e05, + 3.04090212e04, + 2.09073742e05, + 1.27430552e05, + ] + ) + assert_allclose(df93_circ.values[-2], test_circ, atol=1e-5) assert_allclose(df93_rect.values[-3], test_rect, atol=1e-5) + def test_power_curve_xarray(self): + df93_circ = performance.power_curve( + power=self.power, + velocity=self.ds["vel"].sel(dir="streamwise"), + hub_height=4.2, + doppler_cell_size=0.5, + sampling_frequency=1, + window_avg_time=600, + turbine_profile="circular", + diameter=3, + height=None, + width=None, + to_pandas=False, + ) + test_circ = np.array( + [ + 1.26250990e00, + 1.09230978e00, + 1.89122103e05, + 1.03223668e04, + 2.04261423e05, + 1.72095731e05, + ] + ) + + df93_rect = performance.power_curve( + power=self.power, + velocity=self.ds["vel"].sel(dir="streamwise"), + hub_height=4.2, + doppler_cell_size=0.5, + sampling_frequency=1, + window_avg_time=600, + 
turbine_profile="rectangular", + diameter=None, + height=1, + width=3, + to_pandas=False, + ) + test_rect = np.array( + [ + 1.15032239e00, + 3.75747621e-01, + 1.73098627e05, + 3.04090212e04, + 2.09073742e05, + 1.27430552e05, + ] + ) + + assert_allclose(df93_circ.isel(U_bins=-2).to_array(), test_circ, atol=1e-5) + assert_allclose(df93_rect.isel(U_bins=-3).to_array(), test_rect, atol=1e-5) + def test_velocity_profiles(self): df94 = performance.velocity_profiles( - velocity=self.ds['vel'].sel(dir='streamwise'), + velocity=self.ds["vel"].sel(dir="streamwise"), hub_height=4.2, water_depth=10, - sampling_frequency=1, + sampling_frequency=1, window_avg_time=600, - function='mean') + function="mean", + ) df95a = performance.velocity_profiles( - velocity=self.ds['vel'].sel(dir='streamwise'), + velocity=self.ds["vel"].sel(dir="streamwise"), hub_height=4.2, water_depth=10, sampling_frequency=1, window_avg_time=600, - function='rms') + function="rms", + ) df95b = performance.velocity_profiles( - velocity=self.ds['vel'].sel(dir='streamwise'), - hub_height=4.2, + velocity=self.ds["vel"].sel(dir="streamwise"), + hub_height=4.2, water_depth=10, - sampling_frequency=1, + sampling_frequency=1, window_avg_time=600, - function='std') - + function="std", + ) + test_df94 = np.array([0.32782955, 0.69326691, 1.00948623]) - test_df95a = np.array([0.3329345 , 0.69936798, 1.01762123]) + test_df95a = np.array([0.3329345, 0.69936798, 1.01762123]) test_df95b = np.array([0.05635571, 0.08671777, 0.12735139]) assert_allclose(df94.values[1], test_df94, atol=1e-5) assert_allclose(df95a.values[1], test_df95a, atol=1e-5) assert_allclose(df95b.values[1], test_df95b, atol=1e-5) - + + def test_velocity_profiles_xarray(self): + df94 = performance.velocity_profiles( + velocity=self.ds["vel"].sel(dir="streamwise"), + hub_height=4.2, + water_depth=10, + sampling_frequency=1, + window_avg_time=600, + function="mean", + to_pandas=False, + ) + + test_df94 = np.array([0.32782955, 0.69326691, 1.00948623]) + + 
assert_allclose(df94[1], test_df94, atol=1e-5) def test_power_efficiency(self): df97 = performance.device_efficiency( self.power, - velocity=self.ds['vel'].sel(dir='streamwise'), - water_density=self.ds['water_density'], - capture_area=np.pi*1.5**2, + velocity=self.ds["vel"].sel(dir="streamwise"), + water_density=self.ds["water_density"], + capture_area=np.pi * 1.5**2, hub_height=4.2, sampling_frequency=1, - window_avg_time=600) - + window_avg_time=600, + ) + + test_df97 = np.array(24.79197) + assert_allclose(df97.values[-1, -1], test_df97, atol=1e-5) + + def test_power_efficiency_xarray(self): + df97 = performance.device_efficiency( + self.power, + velocity=self.ds["vel"].sel(dir="streamwise"), + water_density=self.ds["water_density"], + capture_area=np.pi * 1.5**2, + hub_height=4.2, + sampling_frequency=1, + window_avg_time=600, + to_pandas=False, + ) + test_df97 = np.array(24.79197) - assert_allclose(df97.values[-1,-1], test_df97, atol=1e-5) + assert_allclose(df97["Efficiency"][-1], test_df97, atol=1e-5) -if __name__ == '__main__': - unittest.main() +if __name__ == "__main__": + unittest.main() diff --git a/mhkit/tests/tidal/test_resource.py b/mhkit/tests/tidal/test_resource.py index a7adc996c..7b5b6ad11 100644 --- a/mhkit/tests/tidal/test_resource.py +++ b/mhkit/tests/tidal/test_resource.py @@ -7,103 +7,108 @@ import mhkit.tidal as tidal testdir = dirname(abspath(__file__)) -plotdir = join(testdir, 'plots') +plotdir = join(testdir, "plots") isdir = os.path.isdir(plotdir) -if not isdir: os.mkdir(plotdir) -datadir = normpath(join(testdir,relpath('../../../examples/data/tidal'))) +if not isdir: + os.mkdir(plotdir) +datadir = normpath(join(testdir, relpath("../../../examples/data/tidal"))) class TestResource(unittest.TestCase): - @classmethod def setUpClass(self): - file_name = join(datadir, 's08010.json') + file_name = join(datadir, "s08010.json") self.data, self.metadata = tidal.io.noaa.read_noaa_json(file_name) - self.data.s = self.data.s / 100. 
# convert to m/s + self.data.s = self.data.s / 100.0 # convert to m/s self.flood = 171.5 self.ebb = 354.5 - @classmethod def tearDownClass(self): pass - + def test_exceedance_probability(self): - df = pd.DataFrame.from_records( {'vals': np.array([ 1, 2, 3, 4, 5, 6, 7, 8, 9])} ) - df['F'] = tidal.resource.exceedance_probability(df.vals) - self.assertEqual(df['F'].min(), 10) - self.assertEqual(df['F'].max(), 90) - - - def test_principal_flow_directions(self): - width_direction=10 - direction1, direction2 = tidal.resource.principal_flow_directions(self.data.d, width_direction) - self.assertEqual(direction1,172.0) - self.assertEqual(round(direction2,1),round(352.3,1)) - + df = pd.DataFrame.from_records({"vals": np.array([1, 2, 3, 4, 5, 6, 7, 8, 9])}) + df["F"] = tidal.resource.exceedance_probability(df.vals) + self.assertEqual(df["F"].min(), 10) + self.assertEqual(df["F"].max(), 90) + + def test_principal_flow_directions(self): + width_direction = 10 + direction1, direction2 = tidal.resource.principal_flow_directions( + self.data.d, width_direction + ) + self.assertEqual(direction1, 172.0) + self.assertEqual(round(direction2, 1), round(352.3, 1)) + def test_plot_current_timeseries(self): - filename = abspath(join(plotdir, 'tidal_plot_current_timeseries.png')) + filename = abspath(join(plotdir, "tidal_plot_current_timeseries.png")) if isfile(filename): os.remove(filename) - + plt.figure() tidal.graphics.plot_current_timeseries(self.data.d, self.data.s, 172) - plt.savefig(filename, format='png') + plt.savefig(filename, format="png") plt.close() - + self.assertTrue(isfile(filename)) - + def test_plot_joint_probability_distribution(self): - filename = abspath(join(plotdir, 'tidal_plot_joint_probability_distribution.png')) + filename = abspath( + join(plotdir, "tidal_plot_joint_probability_distribution.png") + ) if isfile(filename): os.remove(filename) - + plt.figure() - tidal.graphics.plot_joint_probability_distribution(self.data.d, self.data.s, 1, 0.1) - 
plt.savefig(f'{filename}') + tidal.graphics.plot_joint_probability_distribution( + self.data.d, self.data.s, 1, 0.1 + ) + plt.savefig(f"{filename}") plt.close() - + self.assertTrue(isfile(filename)) - + def test_plot_rose(self): - filename = abspath(join(plotdir, 'tidal_plot_rose.png')) + filename = abspath(join(plotdir, "tidal_plot_rose.png")) if isfile(filename): os.remove(filename) - + plt.figure() tidal.graphics.plot_rose(self.data.d, self.data.s, 1, 0.1) - plt.savefig(f'{filename}') + plt.savefig(f"{filename}") plt.close() - + self.assertTrue(isfile(filename)) def test_tidal_phase_probability(self): - filename = abspath(join(plotdir, 'tidal_plot_tidal_phase_probability.png')) + filename = abspath(join(plotdir, "tidal_plot_tidal_phase_probability.png")) if isfile(filename): os.remove(filename) - + plt.figure() - tidal.graphics.tidal_phase_probability(self.data.d, self.data.s, - self.flood, self.ebb) - plt.savefig(f'{filename}') + tidal.graphics.tidal_phase_probability( + self.data.d, self.data.s, self.flood, self.ebb + ) + plt.savefig(f"{filename}") plt.close() - + self.assertTrue(isfile(filename)) - + def test_tidal_phase_exceedance(self): - filename = abspath(join(plotdir, 'tidal_plot_tidal_phase_exceedance.png')) + filename = abspath(join(plotdir, "tidal_plot_tidal_phase_exceedance.png")) if isfile(filename): os.remove(filename) - + plt.figure() - tidal.graphics.tidal_phase_exceedance(self.data.d, self.data.s, - self.flood, self.ebb) - plt.savefig(f'{filename}') + tidal.graphics.tidal_phase_exceedance( + self.data.d, self.data.s, self.flood, self.ebb + ) + plt.savefig(f"{filename}") plt.close() - - self.assertTrue(isfile(filename)) + self.assertTrue(isfile(filename)) -if __name__ == '__main__': - unittest.main() +if __name__ == "__main__": + unittest.main() diff --git a/mhkit/tests/utils/test_cache.py b/mhkit/tests/utils/test_cache.py new file mode 100644 index 000000000..14aae0802 --- /dev/null +++ b/mhkit/tests/utils/test_cache.py @@ -0,0 +1,177 @@ +""" 
+Unit Testing for MHKiT Cache Utilities + +This module provides unit tests for the caching utilities present in the MHKiT library. +These utilities help in caching and retrieving data, ensuring efficient and repeatable +data access without redundant computations or network requests. + +The tests cover: +1. Creation of cache files with the correct file naming based on provided parameters. +2. Proper retrieval of data from the cache, ensuring data integrity. +3. Usage of appropriate file extensions based on the type of data being cached. +4. Clearing of cache directories as specified. + +By running these tests, one can validate that the caching utilities of MHKiT are functioning +as expected, ensuring that users can rely on cached data and metadata when using the MHKiT library. + +Usage: + python -m unittest test_cache.py + +Requirements: + - pandas + - hashlib + - tempfile + - shutil + - os + - unittest + - MHKiT library functions (from mhkit.utils.cache) + +Author: ssolson +Date: 2023-08-18 +""" + +import unittest +import hashlib +import tempfile +import shutil +import os +import pandas as pd +from mhkit.utils.cache import handle_caching, clear_cache + + +class TestCacheUtils(unittest.TestCase): + """ + Unit tests for cache utility functions. + + This test class provides a suite of tests to validate the functionality of caching utilities, + ensuring data is correctly cached, retrieved, and cleared. It specifically tests: + + 1. The creation of cache files by the `handle_caching` function. + 2. The correct retrieval of data from the cache. + 3. The appropriate file extension used when caching CDIP data. + 4. The effective clearing of specified cache directories. + + During the setup phase, a test cache directory is created, and sample data is prepared. + Upon completion of tests, the teardown phase ensures the test cache directory is removed, + leaving the environment clean. 
+ + Attributes: + ----------- + cache_dir : str + Directory path where the test cache files will be stored. + hash_params : str + Sample parameters to be hashed for cache file naming. + data : pandas DataFrame + Sample data to be used for caching in tests. + """ + + @classmethod + def setUpClass(cls): + cls.cache_dir = os.path.join( + os.path.expanduser("~"), ".cache", "mhkit", "test_cache" + ) + cls.hash_params = "test_params" + cls.data = pd.DataFrame( + {"A": [1, 2, 3], "B": [4, 5, 6]}, index=pd.date_range("20220101", periods=3) + ) + + @classmethod + def tearDownClass(cls): + # Remove the test_cache directory + if os.path.exists(cls.cache_dir): + shutil.rmtree(cls.cache_dir) + + def test_handle_caching_creates_cache(self): + """ + Test if the `handle_caching` function correctly creates a cache file. + + The method tests the following scenario: + 1. Invokes the `handle_caching` function to cache a sample DataFrame. + 2. Constructs the expected cache file path based on provided `hash_params`. + 3. Checks if the cache file exists at the expected location. + + Asserts: + - The cache file is successfully created at the expected file path. + """ + handle_caching(self.hash_params, self.cache_dir, data=self.data) + + cache_filename = ( + hashlib.md5(self.hash_params.encode("utf-8")).hexdigest() + ".json" + ) + cache_filepath = os.path.join(self.cache_dir, cache_filename) + + assert os.path.isfile(cache_filepath) + + def test_handle_caching_retrieves_data(self): + """ + Test if the `handle_caching` function retrieves the correct data from cache. + + The method tests the following scenario: + 1. Invokes the `handle_caching` function to cache a sample DataFrame. + 2. Retrieves the data from the cache using the `handle_caching` function. + 3. Compares the retrieved data to the original sample DataFrame. + + Asserts: + - The retrieved data matches the original sample DataFrame. 
+ """ + handle_caching(self.hash_params, self.cache_dir, data=self.data) + retrieved_data, _, _ = handle_caching(self.hash_params, self.cache_dir) + pd.testing.assert_frame_equal(self.data, retrieved_data, check_freq=False) + + def test_handle_caching_cdip_file_extension(self): + """ + Test if the `handle_caching` function uses the correct file extension for CDIP caching. + + The method tests the following scenario: + 1. Specifies the cache directory to include "cdip", signaling CDIP-related caching. + 2. Invokes the `handle_caching` function to cache a sample DataFrame in the CDIP directory. + 3. Constructs the expected cache file path using a ".pkl" extension based on provided `hash_params`. + 4. Checks if the cache file with the ".pkl" extension exists at the expected location. + + Asserts: + - The cache file with a ".pkl" extension is successfully created at the expected file path. + """ + cache_dir = os.path.join(self.cache_dir, "cdip") + handle_caching(self.hash_params, cache_dir, data=self.data) + + cache_filename = ( + hashlib.md5(self.hash_params.encode("utf-8")).hexdigest() + ".pkl" + ) + cache_filepath = os.path.join(cache_dir, cache_filename) + + assert os.path.isfile(cache_filepath) + + def test_clear_cache(self): + """ + Test if the `clear_cache` function correctly clears the specified cache directory. + + The method tests the following scenario: + 1. Moves the contents of the directory to be cleared to a temporary location. + 2. Invokes the `clear_cache` function to clear the specified directory. + 3. Checks if the directory has been cleared. + 4. Restores the original contents of the directory from the temporary location. + + Asserts: + - The specified directory is successfully cleared by the `clear_cache` function. 
+ """ + specific_dir = "wave" + cache_dir = os.path.join(os.path.expanduser("~"), ".cache", "mhkit") + path_to_clear = os.path.join(cache_dir, specific_dir) + + # Step 1: Move contents to temporary directory + temp_dir = tempfile.mkdtemp() + if os.path.exists(path_to_clear): + shutil.move(path_to_clear, temp_dir) + + # Step 2: Run clear_cache and test + clear_cache(specific_dir) + assert not os.path.exists(path_to_clear) + + # Step 3: Move contents back to original location, if they exist in the temporary directory + if os.path.exists(os.path.join(temp_dir, specific_dir)): + shutil.move(os.path.join(temp_dir, specific_dir), cache_dir) + shutil.rmtree(temp_dir) # Clean up temporary directory + + +if __name__ == "__main__": + unittest.main() diff --git a/mhkit/tests/utils/test_upcrossing.py b/mhkit/tests/utils/test_upcrossing.py new file mode 100644 index 000000000..e389fc39a --- /dev/null +++ b/mhkit/tests/utils/test_upcrossing.py @@ -0,0 +1,144 @@ +from mhkit.utils import upcrossing, peaks, troughs, heights, periods, custom +import unittest +from numpy.testing import assert_allclose +import numpy as np +from scipy.optimize import fsolve + + +class TestUpcrossing(unittest.TestCase): + @classmethod + def setUpClass(self): + self.t = np.linspace(0, 4, 1000) + + self.signal = self._example_waveform(self, self.t) + + # Approximate points for the zero crossing, + # used as starting points in numerical + # solution. + self.zero_cross_approx = [0, 2.1, 3, 3.8] + + def _example_waveform(self, t): + # Create simple wave form to analyse. + # This has been created to perform + # a simple independent calculation that + # the mhkit functions can be tested against. + + A = np.array([0.5, 0.6, 0.3]) + T = np.array([3, 2, 1]) + w = 2 * np.pi / T + + signal = np.zeros(t.size) + for i in range(A.size): + signal += A[i] * np.sin(w[i] * t) + + return signal + + def _example_analysis(self, t, signal): + # NB: This only works due to the construction + # of our test signal.
It is not suitable as + # a general approach. + grad = np.diff(signal) + + # +1 to get the index at turning point + turning_points = np.flatnonzero(grad[1:] * grad[:-1] < 0) + 1 + + crest_inds = turning_points[signal[turning_points] > 0] + trough_inds = turning_points[signal[turning_points] < 0] + + crests = signal[crest_inds] + troughs = signal[trough_inds] + + heights = crests - troughs + + zero_cross = fsolve(self._example_waveform, self.zero_cross_approx) + periods = np.diff(zero_cross) + + return crests, troughs, heights, periods + + def test_peaks(self): + want, _, _, _ = self._example_analysis(self.t, self.signal) + + got = peaks(self.t, self.signal) + + assert_allclose(got, want) + + def test_troughs(self): + _, want, _, _ = self._example_analysis(self.t, self.signal) + + got = troughs(self.t, self.signal) + + assert_allclose(got, want) + + def test_heights(self): + _, _, want, _ = self._example_analysis(self.t, self.signal) + + got = heights(self.t, self.signal) + + assert_allclose(got, want) + + def test_periods(self): + _, _, _, want = self._example_analysis(self.t, self.signal) + + got = periods(self.t, self.signal) + + assert_allclose(got, want, rtol=1e-3, atol=1e-3) + + def test_custom(self): + want, _, _, _ = self._example_analysis(self.t, self.signal) + + # create a similar function to finding the peaks + def f(ind1, ind2): + return np.max(self.signal[ind1:ind2]) + + got = custom(self.t, self.signal, f) + + assert_allclose(got, want) + + def test_peaks_with_inds(self): + want, _, _, _ = self._example_analysis(self.t, self.signal) + + inds = upcrossing(self.t, self.signal) + + got = peaks(self.t, self.signal, inds) + + assert_allclose(got, want) + + def test_trough_with_inds(self): + _, want, _, _ = self._example_analysis(self.t, self.signal) + + inds = upcrossing(self.t, self.signal) + + got = troughs(self.t, self.signal, inds) + + assert_allclose(got, want) + + def test_heights_with_inds(self): + _, _, want, _ = self._example_analysis(self.t, 
self.signal) + + inds = upcrossing(self.t, self.signal) + + got = heights(self.t, self.signal, inds) + + assert_allclose(got, want) + + def test_periods_with_inds(self): + _, _, _, want = self._example_analysis(self.t, self.signal) + + inds = upcrossing(self.t, self.signal) + + got = periods(self.t, self.signal, inds) + + assert_allclose(got, want, rtol=1e-3, atol=1e-3) + + def test_custom_with_inds(self): + want, _, _, _ = self._example_analysis(self.t, self.signal) + + inds = upcrossing(self.t, self.signal) + + # create a similar function to finding the peaks + def f(ind1, ind2): + return np.max(self.signal[ind1:ind2]) + + got = custom(self.t, self.signal, f, inds) + + assert_allclose(got, want) diff --git a/mhkit/tests/utils/test_utils.py b/mhkit/tests/utils/test_utils.py index 07e1ed029..315d0de19 100644 --- a/mhkit/tests/utils/test_utils.py +++ b/mhkit/tests/utils/test_utils.py @@ -5,149 +5,287 @@ import numpy as np import unittest import json +import xarray as xr testdir = dirname(abspath(__file__)) -loads_datadir = normpath(join(testdir,relpath('../../../examples/data/loads'))) +loads_datadir = normpath(join(testdir, relpath("../../../examples/data/loads"))) -class TestGenUtils(unittest.TestCase): +class TestGenUtils(unittest.TestCase): @classmethod def setUpClass(self): loads_data_file = join(loads_datadir, "loads_data_dict.json") - with open(loads_data_file, 'r') as fp: + with open(loads_data_file, "r") as fp: data_dict = json.load(fp) # convert dictionaries into dataframes - data = { - key: pd.DataFrame(data_dict[key]) - for key in data_dict - } + data = {key: pd.DataFrame(data_dict[key]) for key in data_dict} self.data = data - self.freq = 50 # Hz - self.period = 600 # seconds - + self.freq = 50 # Hz + self.period = 600 # seconds def test_get_statistics(self): # load in file - df = self.data['loads'] + df = self.data["loads"] df.Timestamp = pd.to_datetime(df.Timestamp) - df.set_index('Timestamp',inplace=True) + df.set_index("Timestamp", inplace=True) # 
run function - means,maxs,mins,stdevs = utils.get_statistics(df,self.freq,period=self.period,vector_channels=['WD_Nacelle','WD_NacelleMod']) + means, maxs, mins, stdevs = utils.get_statistics( + df, + self.freq, + period=self.period, + vector_channels=["WD_Nacelle", "WD_NacelleMod"], + ) # check statistics - self.assertAlmostEqual(means.reset_index().loc[0,'uWind_80m'],7.773,2) # mean - self.assertAlmostEqual(maxs.reset_index().loc[0,'uWind_80m'],13.271,2) # max - self.assertAlmostEqual(mins.reset_index().loc[0,'uWind_80m'],3.221,2) # min - self.assertAlmostEqual(stdevs.reset_index().loc[0,'uWind_80m'],1.551,2) # standard deviation - self.assertAlmostEqual(means.reset_index().loc[0,'WD_Nacelle'],178.1796,2) # mean - vector - self.assertAlmostEqual(stdevs.reset_index().loc[0,'WD_Nacelle'],36.093,2) # standard devaition - vector + self.assertAlmostEqual( + means.reset_index().loc[0, "uWind_80m"], 7.773, 2 + ) # mean + self.assertAlmostEqual(maxs.reset_index().loc[0, "uWind_80m"], 13.271, 2) # max + self.assertAlmostEqual(mins.reset_index().loc[0, "uWind_80m"], 3.221, 2) # min + self.assertAlmostEqual( + stdevs.reset_index().loc[0, "uWind_80m"], 1.551, 2 + ) # standard deviation + self.assertAlmostEqual( + means.reset_index().loc[0, "WD_Nacelle"], 178.1796, 2 + ) # mean - vector + self.assertAlmostEqual( + stdevs.reset_index().loc[0, "WD_Nacelle"], 36.093, 2 + ) # standard deviation - vector # check timestamp - string_time = '2017-03-01 01:28:41' + string_time = "2017-03-01 01:28:41" time = pd.to_datetime(string_time) - self.assertTrue(means.index[0]==time) - + self.assertTrue(means.index[0] == time) + def test_vector_statistics(self): # load in vector variable - df = self.data['loads'] - vector_data = df['WD_Nacelle'] + df = self.data["loads"] + vector_data = df["WD_Nacelle"] vector_avg, vector_std = utils.vector_statistics(vector_data) # check answers - self.assertAlmostEqual(vector_avg,178.1796,2) # mean - vector - self.assertAlmostEqual(vector_std,36.093,2) #
standard devaition - vector + self.assertAlmostEqual(vector_avg, 178.1796, 2) # mean - vector + self.assertAlmostEqual(vector_std, 36.093, 2) # standard deviation - vector def test_unwrap_vector(self): # create array of test values and corresponding expected answers - test = [-740,-400,-50,0,50,400,740] - correct = [340,320,310,0,50,40,20] + test = [-740, -400, -50, 0, 50, 400, 740] + correct = [340, 320, 310, 0, 50, 40, 20] # get answers from function answer = utils.unwrap_vector(test) - + # check if answer is correct - assert_frame_equal(pd.DataFrame(answer,dtype='int32'),pd.DataFrame(correct,dtype='int32')) + assert_frame_equal( + pd.DataFrame(answer, dtype="int32"), pd.DataFrame(correct, dtype="int32") + ) def test_matlab_to_datetime(self): # store matlab timestamp - mat_time = 7.367554921296296e+05 + mat_time = 7.367554921296296e05 # corresponding datetime - string_time = '2017-03-01 11:48:40' + string_time = "2017-03-01 11:48:40" time = pd.to_datetime(string_time) # test function answer = utils.matlab_to_datetime(mat_time) - answer2 = answer.round('s') # round to nearest second for comparison - + answer2 = answer.round("s") # round to nearest second for comparison + # check if answer is correct self.assertTrue(answer2 == time) def test_excel_to_datetime(self): # store excel timestamp - excel_time = 4.279549212962963e+04 + excel_time = 4.279549212962963e04 # corresponding datetime - string_time = '2017-03-01 11:48:40' + string_time = "2017-03-01 11:48:40" time = pd.to_datetime(string_time) # test function answer = utils.excel_to_datetime(excel_time) - answer2 = answer.round('s') # round to nearest second for comparison - + answer2 = answer.round("s") # round to nearest second for comparison + # check if answer is correct - self.assertTrue(answer2 == time) + self.assertTrue(answer2 == time) def test_magnitude_phase_2D(self): # float - magnitude=9 - x=y = np.sqrt(1/2*magnitude**2) + magnitude = 9 + x = y = np.sqrt(1 / 2 * magnitude**2) phase = np.arctan2(y, x) -
mag, theta = utils.magnitude_phase(x,y) - + mag, theta = utils.magnitude_phase(x, y) + self.assertAlmostEqual(magnitude, mag) self.assertAlmostEqual(phase, theta) - - #list - xx = [x,x] - yy = [y,y] - mag, theta = utils.magnitude_phase(xx,yy) - self.assertTrue(all(mag==magnitude)) - self.assertTrue(all(theta==phase)) - - #series - xs = pd.Series(xx,index=range(len(xx))) - ys = pd.Series(yy,index=range(len(yy))) - - mag, theta = utils.magnitude_phase(xs,ys) - self.assertTrue(all(mag==magnitude)) - self.assertTrue(all(theta==phase)) - + + # list + xx = [x, x] + yy = [y, y] + mag, theta = utils.magnitude_phase(xx, yy) + self.assertTrue(all(mag == magnitude)) + self.assertTrue(all(theta == phase)) + + # series + xs = pd.Series(xx, index=range(len(xx))) + ys = pd.Series(yy, index=range(len(yy))) + + mag, theta = utils.magnitude_phase(xs, ys) + self.assertTrue(all(mag == magnitude)) + self.assertTrue(all(theta == phase)) + def test_magnitude_phase_3D(self): # float - magnitude=9 - x=y=z = np.sqrt(1/3*magnitude**2) + magnitude = 9 + x = y = z = np.sqrt(1 / 3 * magnitude**2) phase1 = np.arctan2(y, x) - phase2 = np.arctan2(np.sqrt(x**2+y**2),z) - mag, theta, phi = utils.magnitude_phase(x,y,z) - + phase2 = np.arctan2(np.sqrt(x**2 + y**2), z) + mag, theta, phi = utils.magnitude_phase(x, y, z) + self.assertAlmostEqual(magnitude, mag) self.assertAlmostEqual(phase1, theta) self.assertAlmostEqual(phase2, phi) - - #list - xx = [x,x] - yy = [y,y] - zz = [z,z] - mag, theta, phi = utils.magnitude_phase(xx,yy,zz) - self.assertTrue(all(mag==magnitude)) - self.assertTrue(all(theta==phase1)) - self.assertTrue(all(phi==phase2)) - - #series - xs = pd.Series(xx,index=range(len(xx))) - ys = pd.Series(yy,index=range(len(yy))) - zs = pd.Series(zz,index=range(len(zz))) - - mag, theta, phi = utils.magnitude_phase(xs,ys,zs) - self.assertTrue(all(mag==magnitude)) - self.assertTrue(all(theta==phase1)) - self.assertTrue(all(phi==phase2)) - - -if __name__ == '__main__': + + # list + xx = [x, x] + yy 
= [y, y] + zz = [z, z] + mag, theta, phi = utils.magnitude_phase(xx, yy, zz) + self.assertTrue(all(mag == magnitude)) + self.assertTrue(all(theta == phase1)) + self.assertTrue(all(phi == phase2)) + + # series + xs = pd.Series(xx, index=range(len(xx))) + ys = pd.Series(yy, index=range(len(yy))) + zs = pd.Series(zz, index=range(len(zz))) + + mag, theta, phi = utils.magnitude_phase(xs, ys, zs) + self.assertTrue(all(mag == magnitude)) + self.assertTrue(all(theta == phase1)) + self.assertTrue(all(phi == phase2)) + + def test_convert_to_dataarray(self): + # test data + a = 5 + t = np.arange(0.0, 5.0, 0.5) + i = np.arange(0.0, 10.0, 1) + d1 = i**2 / 5.0 + d2 = -d1 + + # test data formats + test_n = d1 + test_s = pd.Series(d1, t) + test_df = pd.DataFrame({"d1": d1}, index=t) + test_df2 = pd.DataFrame({"d1": d1, "d1_duplicate": d1}, index=t) + test_da = xr.DataArray( + data=d1, + dims="time", + coords=dict(time=t), + ) + test_ds = xr.Dataset( + data_vars={"d1": (["time"], d1)}, coords={"time": t, "index": i} + ) + test_ds2 = xr.Dataset( + data_vars={ + "d1": (["time"], d1), + "d2": (["ind"], d2), + }, + coords={"time": t, "index": i}, + ) + + # numpy + n = utils.convert_to_dataarray(test_n, "test_data") + self.assertIsInstance(n, xr.DataArray) + self.assertTrue(all(n.data == d1)) + self.assertEqual(n.name, "test_data") + + # Series + s = utils.convert_to_dataarray(test_s) + self.assertIsInstance(s, xr.DataArray) + self.assertTrue(all(s.data == d1)) + + # DataArray + da = utils.convert_to_dataarray(test_da) + self.assertIsInstance(da, xr.DataArray) + self.assertTrue(all(da.data == d1)) + + # Dataframe + df = utils.convert_to_dataarray(test_df) + self.assertIsInstance(df, xr.DataArray) + self.assertTrue(all(df.data == d1)) + + # Dataset + ds = utils.convert_to_dataarray(test_ds) + self.assertIsInstance(ds, xr.DataArray) + self.assertTrue(all(ds.data == d1)) + + # int (error) + with self.assertRaises(TypeError): + utils.convert_to_dataarray(a) + + # non-string name (error) + 
with self.assertRaises(TypeError): + utils.convert_to_dataarray(test_n, 5) + + # Multivariate Dataframe (error) + with self.assertRaises(ValueError): + utils.convert_to_dataarray(test_df2) + + # Multivariate Dataset (error) + with self.assertRaises(ValueError): + utils.convert_to_dataarray(test_ds2) + + def test_convert_to_dataset(self): + # test data + a = 5 + t = np.arange(0, 5, 0.5) + i = np.arange(0, 10, 1) + d1 = i**2 / 5.0 + d2 = -d1 + + # test data formats + test_n = d1 + test_s = pd.Series(d1, t) + test_df2 = pd.DataFrame({"d1": d1, "d2": d2}, index=t) + test_da = xr.DataArray( + data=d1, + dims="time", + coords=dict(time=t), + ) + test_ds2 = xr.Dataset( + data_vars={ + "d1": (["time"], d1), + "d2": (["ind"], d2), + }, + coords={"time": t, "index": i}, + ) + + # Series + s = utils.convert_to_dataset(test_s) + self.assertIsInstance(s, xr.Dataset) + self.assertTrue(all(s["data"].data == d1)) + + # DataArray with custom name + da = utils.convert_to_dataset(test_da, "test_name") + self.assertIsInstance(da, xr.Dataset) + self.assertTrue(all(da["test_name"].data == d1)) + + # Dataframe + df = utils.convert_to_dataset(test_df2) + self.assertIsInstance(df, xr.Dataset) + self.assertTrue(all(df["d1"].data == d1)) + self.assertTrue(all(df["d2"].data == d2)) + + # Dataset + ds = utils.convert_to_dataset(test_ds2) + self.assertIsInstance(ds, xr.Dataset) + self.assertTrue(all(ds["d1"].data == d1)) + self.assertTrue(all(ds["d2"].data == d2)) + + # int (error) + with self.assertRaises(TypeError): + utils.convert_to_dataset(a) + + # non-string name (error) + with self.assertRaises(TypeError): + utils.convert_to_dataset(test_n, 5) + + +if __name__ == "__main__": unittest.main() diff --git a/mhkit/tests/wave/io/hindcast/test_hindcast.py b/mhkit/tests/wave/io/hindcast/test_hindcast.py index 08333e6c9..379eeeee4 100644 --- a/mhkit/tests/wave/io/hindcast/test_hindcast.py +++ b/mhkit/tests/wave/io/hindcast/test_hindcast.py @@ -22,6 +22,7 @@ Run the script directly as a standalone 
program, or import the TestWPTOhindcast class in another test suite. """ + import unittest from os.path import abspath, dirname, join, normpath from pandas.testing import assert_frame_equal @@ -31,220 +32,207 @@ import xarray as xr testdir = dirname(abspath(__file__)) -datadir = normpath(join(testdir,'..','..','..','..','..','examples','data','wave')) +datadir = normpath( + join(testdir, "..", "..", "..", "..", "..", "examples", "data", "wave") +) class TestWPTOhindcast(unittest.TestCase): - ''' + """ A test call designed to check the WPTO hindcast retrival - ''' + """ @classmethod def setUpClass(cls): - ''' + """ Intitialize the WPTO hindcast test with expected data - ''' + """ cls.my_swh = pd.read_csv( - join(datadir,'hindcast/multi_year_hindcast.csv'), - index_col = 'time_index', - names = ['time_index','significant_wave_height_0'], - header = 0, - dtype = {'significant_wave_height_0':'float32'} + join(datadir, "hindcast/multi_year_hindcast.csv"), + index_col="time_index", + names=["time_index", "significant_wave_height_0"], + header=0, + dtype={"significant_wave_height_0": "float32"}, ) cls.my_swh.index = pd.to_datetime(cls.my_swh.index) cls.ml = pd.read_csv( - join(datadir,'hindcast/single_year_hindcast_multiloc.csv'), - index_col = 'time_index', - names = [ - 'time_index', - 'mean_absolute_period_0', - 'mean_absolute_period_1' - ], - header = 0, - dtype = { - 'mean_absolute_period_0':'float32', - 'mean_absolute_period_1':'float32' - } + join(datadir, "hindcast/single_year_hindcast_multiloc.csv"), + index_col="time_index", + names=["time_index", "mean_absolute_period_0", "mean_absolute_period_1"], + header=0, + dtype={ + "mean_absolute_period_0": "float32", + "mean_absolute_period_1": "float32", + }, ) cls.ml.index = pd.to_datetime(cls.ml.index) cls.mp = pd.read_csv( - join(datadir,'hindcast/multiparm.csv'), - index_col = 'time_index', - names = [ - 'time_index', - 'energy_period_87', - 'mean_zero-crossing_period_87' - ], - header = 0, - dtype = { - 
'energy_period_87':'float32', - 'mean_zero-crossing_period_87':'float32' - } + join(datadir, "hindcast/multiparm.csv"), + index_col="time_index", + names=["time_index", "energy_period_87", "mean_zero-crossing_period_87"], + header=0, + dtype={ + "energy_period_87": "float32", + "mean_zero-crossing_period_87": "float32", + }, ) cls.mp.index = pd.to_datetime(cls.mp.index) cls.ml_meta = pd.read_csv( - join(datadir,'hindcast/multiloc_meta.csv'), - index_col = 0, - names = [ + join(datadir, "hindcast/multiloc_meta.csv"), + index_col=0, + names=[ None, - 'water_depth', - 'latitude', - 'longitude', - 'distance_to_shore', - 'timezone', - 'jurisdiction', - 'gid', + "water_depth", + "latitude", + "longitude", + "distance_to_shore", + "timezone", + "jurisdiction", + "gid", ], - header = 0, - dtype = { - 'water_depth':'float32', - 'latitude':'float32', - 'longitude':'float32', - 'distance_to_shore':'float32', - 'timezone':'int16', - 'gid': 'int64', - } + header=0, + dtype={ + "water_depth": "float32", + "latitude": "float32", + "longitude": "float32", + "distance_to_shore": "float32", + "timezone": "int16", + "gid": "int64", + }, ) cls.my_meta = pd.read_csv( - join(datadir,'hindcast/multi_year_meta.csv'), - names = [ - 'water_depth', - 'latitude', - 'longitude', - 'distance_to_shore', - 'timezone', - 'jurisdiction', - 'gid' + join(datadir, "hindcast/multi_year_meta.csv"), + names=[ + "water_depth", + "latitude", + "longitude", + "distance_to_shore", + "timezone", + "jurisdiction", + "gid", ], - header = 0, - dtype = { - 'water_depth':'float32', - 'latitude':'float32', - 'longitude':'float32', - 'distance_to_shore':'float32', - 'timezone':'int16', - 'gid':'int64' - } + header=0, + dtype={ + "water_depth": "float32", + "latitude": "float32", + "longitude": "float32", + "distance_to_shore": "float32", + "timezone": "int16", + "gid": "int64", + }, ) cls.mp_meta = pd.read_csv( - join(datadir,'hindcast/multiparm_meta.csv'), - index_col = 0, - names = [ + join(datadir, 
"hindcast/multiparm_meta.csv"), + index_col=0, + names=[ None, - 'water_depth', - 'latitude', - 'longitude', - 'distance_to_shore', - 'timezone', - 'jurisdiction', - 'gid', + "water_depth", + "latitude", + "longitude", + "distance_to_shore", + "timezone", + "jurisdiction", + "gid", ], - header = 0, - dtype = { - 'water_depth':'float32', - 'latitude':'float32', - 'longitude':'float32', - 'distance_to_shore':'float32', - 'timezone':'int16', - 'gid':'int64', - } + header=0, + dtype={ + "water_depth": "float32", + "latitude": "float32", + "longitude": "float32", + "distance_to_shore": "float32", + "timezone": "int16", + "gid": "int64", + }, ) - cls.multi_year_dir_spectra = xr.open_dataset(join(datadir, 'hindcast/multi_year_dir_spectra.nc')) + cls.multi_year_dir_spectra = xr.open_dataset( + join(datadir, "hindcast/multi_year_dir_spectra.nc") + ) cls.multi_year_dir_spectra_meta = pd.read_csv( - join(datadir, 'hindcast/multi_year_dir_spectra_meta.csv'), - dtype = { - 'water_depth':'float32', - 'latitude':'float32', - 'longitude':'float32', - 'distance_to_shore':'float32', - 'timezone':'int16', - 'gid':'int64' - }) + join(datadir, "hindcast/multi_year_dir_spectra_meta.csv"), + dtype={ + "water_depth": "float32", + "latitude": "float32", + "longitude": "float32", + "distance_to_shore": "float32", + "timezone": "int16", + "gid": "int64", + }, + ) def test_multi_year(self): - ''' + """ Test multiple years on a single data_type, lat_lon, and parameter - ''' - data_type = '3-hour' - years = [1990,1992] - lat_lon = (44.624076,-124.280097) - parameters = 'significant_wave_height' - - wave_multiyear, meta = (wave.io.hindcast.hindcast - .request_wpto_point_data( - data_type, - parameters, - lat_lon, - years, - as_xarray=True - ) + """ + data_type = "3-hour" + years = [1990, 1992] + lat_lon = (44.624076, -124.280097) + parameters = "significant_wave_height" + + wave_multiyear, meta = wave.io.hindcast.hindcast.request_wpto_point_data( + data_type, parameters, lat_lon, years, 
to_pandas=False ) wave_multiyear_df = ( - wave_multiyear['significant_wave_height_0'] + wave_multiyear["significant_wave_height_0"] .to_dataframe() - .tz_localize('UTC') - ) + .tz_localize("UTC") + ) assert_frame_equal(self.my_swh, wave_multiyear_df) assert_frame_equal(self.my_meta, meta) - def test_multi_parm(self): - ''' + """ Test multiple parameters on a single data_type, year, and lat_lon - ''' - data_type = '1-hour' + """ + data_type = "1-hour" years = [1996] - lat_lon = (44.624076,-124.280097) - parameters = ['energy_period','mean_zero-crossing_period'] - wave_multiparm, meta= (wave.io.hindcast.hindcast - .request_wpto_point_data( - data_type, - parameters, - lat_lon, - years - ) + lat_lon = (44.624076, -124.280097) + parameters = ["energy_period", "mean_zero-crossing_period"] + wave_multiparm, meta = wave.io.hindcast.hindcast.request_wpto_point_data( + data_type, parameters, lat_lon, years ) - assert_frame_equal(self.mp,wave_multiparm) - assert_frame_equal(self.mp_meta,meta) - + assert_frame_equal(self.mp, wave_multiparm) + assert_frame_equal(self.mp_meta, meta) def test_multi_loc(self): - ''' + """ Test mutiple locations on point data and directional spectrum at a single data_type, year, and parameter. 
- ''' - data_type = '3-hour' + """ + data_type = "3-hour" years = [1995] - lat_lon = ((44.624076,-124.280097),(43.489171,-125.152137)) - parameters = 'mean_absolute_period' - wave_multiloc, meta=wave.io.hindcast.hindcast.request_wpto_point_data( - data_type, - parameters, - lat_lon, - years + lat_lon = ((44.624076, -124.280097), (43.489171, -125.152137)) + parameters = "mean_absolute_period" + wave_multiloc, meta = wave.io.hindcast.hindcast.request_wpto_point_data( + data_type, parameters, lat_lon, years ) - dir_multiyear, meta_dir = (wave.io.hindcast.hindcast - .request_wpto_directional_spectrum(lat_lon,year=str(years[0])) + ( + dir_multiyear, + meta_dir, + ) = wave.io.hindcast.hindcast.request_wpto_directional_spectrum( + lat_lon, year=str(years[0]) ) + dir_multiyear = dir_multiyear.sel( - time_index=slice( - dir_multiyear.time_index[0], - dir_multiyear.time_index[99] - ) + time_index=slice(dir_multiyear.time_index[0], dir_multiyear.time_index[99]) ) - + # Convert to effcient range index + meta_dir.index = pd.RangeIndex(start=0, stop=len(meta_dir.index)) + assert_frame_equal(self.ml, wave_multiloc) assert_frame_equal(self.ml_meta, meta) xrt.assert_allclose(self.multi_year_dir_spectra, dir_multiyear) - assert_frame_equal(self.multi_year_dir_spectra_meta, meta_dir) + assert_frame_equal( + self.multi_year_dir_spectra_meta, meta_dir, check_dtype=False + ) + -if __name__ == '__main__': +if __name__ == "__main__": unittest.main() diff --git a/mhkit/tests/wave/io/hindcast/test_wind_toolkit.py b/mhkit/tests/wave/io/hindcast/test_wind_toolkit.py index ad5e2ba96..6544f8b52 100644 --- a/mhkit/tests/wave/io/hindcast/test_wind_toolkit.py +++ b/mhkit/tests/wave/io/hindcast/test_wind_toolkit.py @@ -1,180 +1,364 @@ from os.path import abspath, dirname, join, isfile, normpath, relpath from pandas.testing import assert_frame_equal -from numpy.testing import assert_allclose -from scipy.interpolate import interp1d -from random import seed, randint import matplotlib.pylab as plt 
-from datetime import datetime -import xarray.testing as xrt import mhkit.wave.io.hindcast.wind_toolkit as wtk -from io import StringIO import pandas as pd -import numpy as np -import contextlib import unittest -import netCDF4 -import inspect -import pickle -import time -import json -import sys -import os +import pytest testdir = dirname(abspath(__file__)) -datadir = normpath(join(testdir,'..','..','..','..','..','examples','data','wave','wind_toolkit')) +datadir = normpath( + join( + testdir, + "..", + "..", + "..", + "..", + "..", + "examples", + "data", + "wave", + "wind_toolkit", + ) +) class TestWINDToolkit(unittest.TestCase): - @classmethod def setUpClass(self): - - self.my = pd.read_csv(join(datadir,'wtk_multiyear.csv'), - index_col = 'time_index', - names = ['time_index','pressure_200m_0'], - header = 0, - dtype = {'pressure_200m_0':'float32'}) + self.my = pd.read_csv( + join(datadir, "wtk_multiyear.csv"), + index_col="time_index", + names=["time_index", "pressure_200m_0"], + header=0, + dtype={"pressure_200m_0": "float32"}, + ) self.my.index = pd.to_datetime(self.my.index) - self.ml = pd.read_csv(join(datadir,'wtk_multiloc.csv'), - index_col = 'time_index', - names = ['time_index','windspeed_10m_0','windspeed_10m_1'], - header = 0, - dtype = {'windspeed_10m_0':'float32', - 'windspeed_10m_1':'float32'}) + self.ml = pd.read_csv( + join(datadir, "wtk_multiloc.csv"), + index_col="time_index", + names=["time_index", "windspeed_10m_0", "windspeed_10m_1"], + header=0, + dtype={"windspeed_10m_0": "float32", "windspeed_10m_1": "float32"}, + ) self.ml.index = pd.to_datetime(self.ml.index) - self.mp = pd.read_csv(join(datadir,'wtk_multiparm.csv'), - index_col = 'time_index', - names = ['time_index','temperature_20m_0','temperature_40m_0'], - header = 0, - dtype = {'temperature_20m_0':'float32', - 'temperature_40m_0':'float32'}) + self.mp = pd.read_csv( + join(datadir, "wtk_multiparm.csv"), + index_col="time_index", + names=["time_index", "temperature_20m_0", 
"temperature_40m_0"], + header=0, + dtype={"temperature_20m_0": "float32", "temperature_40m_0": "float32"}, + ) self.mp.index = pd.to_datetime(self.mp.index) - self.my_meta = pd.read_csv(join(datadir,'wtk_multiyear_meta.csv'), - index_col = 0, - names = ['latitude','longitude','country','state','county','timezone','elevation','offshore'], - header = 0, - dtype = {'latitude':'float32','longitude':'float32', - 'country':'str','state':'str','county':'str', - 'timezone':'int16','elevation':'float32','offshore':'int16'}) - - self.ml_meta = pd.read_csv(join(datadir,'wtk_multiloc_meta.csv'), - index_col = 0, - names = ['latitude','longitude','country','state','county','timezone','elevation','offshore'], - header = 0, - dtype = {'latitude':'float32','longitude':'float32', - 'country':'str','state':'str','county':'str', - 'timezone':'int16','elevation':'float32','offshore':'int16'}) - - self.mp_meta = pd.read_csv(join(datadir,'wtk_multiparm_meta.csv'), - index_col = 0, - names = ['latitude','longitude','country','state','county','timezone','elevation','offshore'], - header = 0, - dtype = {'latitude':'float32','longitude':'float32', - 'country':'str','state':'str','county':'str', - 'timezone':'int16','elevation':'float32','offshore':'int16'}) + self.my_meta = pd.read_csv( + join(datadir, "wtk_multiyear_meta.csv"), + index_col=0, + names=[ + "latitude", + "longitude", + "country", + "state", + "county", + "timezone", + "elevation", + "offshore", + ], + header=0, + dtype={ + "latitude": "float32", + "longitude": "float32", + "country": "str", + "state": "str", + "county": "str", + "timezone": "int16", + "elevation": "float32", + "offshore": "int16", + }, + ) + + # Replace NaN values in 'state' and 'county' with the string "None" + self.my_meta["state"] = self.my_meta["state"].fillna("None") + self.my_meta["county"] = self.my_meta["county"].fillna("None") + + self.ml_meta = pd.read_csv( + join(datadir, "wtk_multiloc_meta.csv"), + index_col=0, + names=[ + "latitude", + 
"longitude", + "country", + "state", + "county", + "timezone", + "elevation", + "offshore", + ], + header=0, + dtype={ + "latitude": "float32", + "longitude": "float32", + "country": "str", + "state": "str", + "county": "str", + "timezone": "int16", + "elevation": "float32", + "offshore": "int16", + }, + ) + # Replace NaN values in 'state' and 'county' with the string "None" + self.ml_meta["state"] = self.ml_meta["state"].fillna("None") + self.ml_meta["county"] = self.ml_meta["county"].fillna("None") + + self.mp_meta = pd.read_csv( + join(datadir, "wtk_multiparm_meta.csv"), + index_col=0, + names=[ + "latitude", + "longitude", + "country", + "state", + "county", + "timezone", + "elevation", + "offshore", + ], + header=0, + dtype={ + "latitude": "float32", + "longitude": "float32", + "country": "str", + "state": "str", + "county": "str", + "timezone": "int16", + "elevation": "float32", + "offshore": "int16", + }, + ) + # Replace NaN values in 'state' and 'county' with the string "None" + self.mp_meta["state"] = self.mp_meta["state"].fillna("None") + self.mp_meta["county"] = self.mp_meta["county"].fillna("None") @classmethod def tearDownClass(self): pass - ## WIND Toolkit data + # WIND Toolkit data def test_multi_year(self): - data_type = '1-hour' - years = [2018,2019] - lat_lon = (44.624076,-124.280097) # NW_Pacific - parameters = 'pressure_200m' + data_type = "1-hour" + years = [2018, 2019] + lat_lon = (44.624076, -124.280097) # NW_Pacific + parameters = "pressure_200m" wtk_multiyear, meta = wtk.request_wtk_point_data( - data_type, parameters, - lat_lon, years) - assert_frame_equal(self.my,wtk_multiyear) - assert_frame_equal(self.my_meta,meta) - + data_type, parameters, lat_lon, years + ) + assert_frame_equal(self.my, wtk_multiyear) + assert_frame_equal(self.my_meta, meta) def test_multi_loc(self): - data_type = '1-hour' + data_type = "1-hour" years = [2001] - lat_lon = ((39.33,-67.21),(41.3,-75.9)) # Mid-Atlantic - parameters = 'windspeed_10m' + lat_lon = ((39.33, 
-67.21), (41.3, -75.9)) # Mid-Atlantic + parameters = "windspeed_10m" wtk_multiloc, meta = wtk.request_wtk_point_data( - data_type, parameters, - lat_lon, years) - assert_frame_equal(self.ml,wtk_multiloc) - assert_frame_equal(self.ml_meta,meta) - + data_type, parameters, lat_lon, years + ) + assert_frame_equal(self.ml, wtk_multiloc) + assert_frame_equal(self.ml_meta, meta) def test_multi_parm(self): - data_type = '1-hour' + data_type = "1-hour" years = [2012] - lat_lon = (17.2,-156.5) # Hawaii - parameters = ['temperature_20m','temperature_40m'] + lat_lon = (17.2, -156.5) # Hawaii + + parameters = ["temperature_20m", "temperature_40m"] wtk_multiparm, meta = wtk.request_wtk_point_data( - data_type, parameters, - lat_lon, years) - assert_frame_equal(self.mp,wtk_multiparm) - assert_frame_equal(self.mp_meta,meta) - + data_type, parameters, lat_lon, years + ) + + assert_frame_equal(self.mp, wtk_multiparm) + assert_frame_equal(self.mp_meta, meta) + + def test_invalid_parameter_type(self): + with pytest.raises(TypeError): + wtk.request_wtk_point_data( + time_interval="1-hour", + parameter=123, # Invalid type, should be a string or list of strings + lat_lon=(17.2, -156.5), + years=[2012], + ) + + def test_invalid_lat_lon_type(self): + with pytest.raises(TypeError): + wtk.request_wtk_point_data( + time_interval="1-hour", + parameter="temperature_20m", + lat_lon="17.2, -156.5", # Invalid type, should be a tuple or list of tuples + years=[2012], + ) + + def test_invalid_time_interval_type(self): + with pytest.raises(TypeError): + wtk.request_wtk_point_data( + time_interval=123, # Invalid type, should be a string + parameter="temperature_20m", + lat_lon=(17.2, -156.5), + years=[2012], + ) + + def test_invalid_years_type(self): + with pytest.raises(TypeError): + wtk.request_wtk_point_data( + time_interval="1-hour", + parameter="temperature_20m", + lat_lon=(17.2, -156.5), + years="2012", # Invalid type, should be a list + ) + + def test_invalid_preferred_region_type(self): + 
with pytest.raises(TypeError): + wtk.request_wtk_point_data( + time_interval="1-hour", + parameter="temperature_20m", + lat_lon=(17.2, -156.5), + years=[2012], + preferred_region=123, # Invalid type, should be a string + ) + + def test_invalid_tree_type(self): + with pytest.raises(TypeError): + wtk.request_wtk_point_data( + time_interval="1-hour", + parameter="temperature_20m", + lat_lon=(17.2, -156.5), + years=[2012], + preferred_region="", + tree=123, # Invalid type, should be a string or None + ) + + def test_invalid_unscale_type(self): + with pytest.raises(TypeError): + wtk.request_wtk_point_data( + time_interval="1-hour", + parameter="temperature_20m", + lat_lon=(17.2, -156.5), + years=[2012], + preferred_region="", + tree=None, + unscale="True", # Invalid type, should be bool + ) + + def test_invalid_str_decode_type(self): + with pytest.raises(TypeError): + wtk.request_wtk_point_data( + time_interval="1-hour", + parameter="temperature_20m", + lat_lon=(17.2, -156.5), + years=[2012], + preferred_region="", + tree=None, + unscale=True, + str_decode=123, # Invalid type, should be bool + ) + + def test_invalid_hsds_type(self): + with pytest.raises(TypeError): + wtk.request_wtk_point_data( + time_interval="1-hour", + parameter="temperature_20m", + lat_lon=(17.2, -156.5), + years=[2012], + preferred_region="", + tree=None, + unscale=True, + str_decode=True, + hsds="True", # Invalid type, should be bool + ) + + def test_invalid_clear_cache_type(self): + with pytest.raises(TypeError): + wtk.request_wtk_point_data( + time_interval="1-hour", + parameter="temperature_20m", + lat_lon=(17.2, -156.5), + years=[2012], + preferred_region="", + tree=None, + unscale=True, + str_decode=True, + hsds=True, + clear_cache="False", # Invalid type, should be bool + ) + # test region_selection function and catch for the preferred region def test_region(self): - region = wtk.region_selection((41.9,-125.3), preferred_region='Offshore_CA') - assert region=='Offshore_CA' - - region = 
wtk.region_selection((41.9,-125.3), preferred_region='NW_Pacific') - assert region=='NW_Pacific' - + region = wtk.region_selection((41.9, -125.3), preferred_region="Offshore_CA") + assert region == "Offshore_CA" + + region = wtk.region_selection((41.9, -125.3), preferred_region="NW_Pacific") + assert region == "NW_Pacific" + try: - region = wtk.region_selection((41.9,-125.3)) + region = wtk.region_selection((41.9, -125.3)) except TypeError: pass else: - assert False, 'Check wind_toolkit.region_selection() method for catching regional overlap' - - region = wtk.region_selection((36.3,-122.3), preferred_region='') - assert region=='Offshore_CA' - - region = wtk.region_selection((16.3,-155.3), preferred_region='') - assert region=='Hawaii' - - region = wtk.region_selection((45.3,-126.3), preferred_region='') - assert region=='NW_Pacific' - - region = wtk.region_selection((39.3,-70.3), preferred_region='') - assert region=='Mid_Atlantic' - + assert ( + False + ), "Check wind_toolkit.region_selection() method for catching regional overlap" + + region = wtk.region_selection((36.3, -122.3), preferred_region="") + assert region == "Offshore_CA" + + region = wtk.region_selection((16.3, -155.3), preferred_region="") + assert region == "Hawaii" + + region = wtk.region_selection((45.3, -126.3), preferred_region="") + assert region == "NW_Pacific" + + region = wtk.region_selection((39.3, -70.3), preferred_region="") + assert region == "Mid_Atlantic" + # test the check for multiple region def test_multi_region(self): - data_type = '1-hour' + data_type = "1-hour" years = [2012] - lat_lon = ((17.2,-156.5),(45.3,-126.3)) - parameters = ['temperature_20m'] + lat_lon = ((17.2, -156.5), (45.3, -126.3)) + parameters = ["temperature_20m"] try: data, meta = wtk.request_wtk_point_data( - data_type, parameters, - lat_lon, years) + data_type, parameters, lat_lon, years + ) except TypeError: pass else: - assert False, 'Check wind_toolkit.region_selection() method for catching requests over 
multiple regions' + assert ( + False + ), "Check wind_toolkit.region_selection() method for catching requests over multiple regions" # test plot_region() def test_plot_region(self): fig, ax1 = plt.subplots() - ax1 = wtk.plot_region('Mid_Atlantic',ax=ax1) - - ax2 = wtk.plot_region('NW_Pacific') - + ax1 = wtk.plot_region("Mid_Atlantic", ax=ax1) + + ax2 = wtk.plot_region("NW_Pacific") + # test elevation_to_string() def test_elevation_to_string(self): - - parameter = 'windspeed' + parameter = "windspeed" elevations = [20, 40, 60, 120, 180] parameter_list = wtk.elevation_to_string(parameter, elevations) - assert parameter_list==['windspeed_20m','windspeed_40m','windspeed_60m', - 'windspeed_120m','windspeed_180m'] - + assert parameter_list == [ + "windspeed_20m", + "windspeed_40m", + "windspeed_60m", + "windspeed_120m", + "windspeed_180m", + ] + -if __name__ == '__main__': +if __name__ == "__main__": unittest.main() diff --git a/mhkit/tests/wave/io/test_cdip.py b/mhkit/tests/wave/io/test_cdip.py index f42227329..b77958df6 100644 --- a/mhkit/tests/wave/io/test_cdip.py +++ b/mhkit/tests/wave/io/test_cdip.py @@ -1,66 +1,61 @@ -from os.path import abspath, dirname, join, isfile, normpath, relpath -from pandas.testing import assert_frame_equal -from numpy.testing import assert_allclose -from scipy.interpolate import interp1d -from random import seed, randint +from os.path import abspath, dirname, join, isfile, normpath import matplotlib.pylab as plt from datetime import datetime -import xarray.testing as xrt import mhkit.wave as wave -from io import StringIO -import pandas as pd -import numpy as np -import contextlib import unittest import netCDF4 -import inspect -import pickle -import time -import json -import sys +import pytz import os testdir = dirname(abspath(__file__)) -datadir = normpath(join(testdir,'..','..','..','..','examples','data','wave')) +datadir = normpath(join(testdir, "..", "..", "..", "..", "examples", "data", "wave")) class TestIOcdip(unittest.TestCase): - 
@classmethod def setUpClass(self): - b067_1996='http://thredds.cdip.ucsd.edu/thredds/dodsC/cdip/' + \ - 'archive/067p1/067p1_d04.nc' + b067_1996 = ( + "http://thredds.cdip.ucsd.edu/thredds/dodsC/cdip/" + + "archive/067p1/067p1_d04.nc" + ) self.test_nc = netCDF4.Dataset(b067_1996) - self.vars2D = [ 'waveEnergyDensity', 'waveMeanDirection', - 'waveA1Value', 'waveB1Value', 'waveA2Value', - 'waveB2Value', 'waveCheckFactor', 'waveSpread', - 'waveM2Value', 'waveN2Value'] + self.vars2D = [ + "waveEnergyDensity", + "waveMeanDirection", + "waveA1Value", + "waveB1Value", + "waveA2Value", + "waveB2Value", + "waveCheckFactor", + "waveSpread", + "waveM2Value", + "waveN2Value", + ] @classmethod def tearDownClass(self): pass def test_validate_date(self): - date='2013-11-12' + date = "2013-11-12" start_date = wave.io.cdip._validate_date(date) assert isinstance(start_date, datetime) - date='11-12-2012' + date = "11-12-2012" self.assertRaises(ValueError, wave.io.cdip._validate_date, date) def test_request_netCDF_historic(self): - station_number='067' - nc = wave.io.cdip.request_netCDF(station_number, 'historic') + station_number = "067" + nc = wave.io.cdip.request_netCDF(station_number, "historic") isinstance(nc, netCDF4.Dataset) def test_request_netCDF_realtime(self): - station_number='067' - nc = wave.io.cdip.request_netCDF(station_number, 'realtime') + station_number = "067" + nc = wave.io.cdip.request_netCDF(station_number, "realtime") isinstance(nc, netCDF4.Dataset) - def test_start_and_end_of_year(self): year = 2020 start_day, end_day = wave.io.cdip._start_and_end_of_year(year) @@ -68,121 +63,135 @@ def test_start_and_end_of_year(self): assert isinstance(start_day, datetime) assert isinstance(end_day, datetime) - expected_start = datetime(year,1,1) - expected_end = datetime(year,12,31) + expected_start = datetime(year, 1, 1) + expected_end = datetime(year, 12, 31) self.assertEqual(start_day, expected_start) self.assertEqual(end_day, expected_end) def 
test_dates_to_timestamp(self): + start_date = datetime(1996, 10, 2, tzinfo=pytz.UTC) + end_date = datetime(1996, 10, 20, tzinfo=pytz.UTC) - start_date='1996-10-02' - end_date='1996-10-20' + start_stamp, end_stamp = wave.io.cdip._dates_to_timestamp( + self.test_nc, start_date=start_date, end_date=end_date + ) - start_stamp, end_stamp = wave.io.cdip._dates_to_timestamp(self.test_nc, - start_date=start_date, end_date=end_date) + start_dt = datetime.utcfromtimestamp(start_stamp).replace(tzinfo=pytz.UTC) + end_dt = datetime.utcfromtimestamp(end_stamp).replace(tzinfo=pytz.UTC) - start_dt = datetime.utcfromtimestamp(start_stamp) - end_dt = datetime.utcfromtimestamp(end_stamp) - - self.assertTrue(start_dt.strftime('%Y-%m-%d') == start_date) - self.assertTrue(end_dt.strftime('%Y-%m-%d') == end_date) + self.assertEqual(start_dt, start_date) + self.assertEqual(end_dt, end_date) def test_get_netcdf_variables_all2Dvars(self): - data = wave.io.cdip.get_netcdf_variables(self.test_nc, - all_2D_variables=True) - returned_keys = [key for key in data['data']['wave2D'].keys()] - self.assertTrue( returned_keys == self.vars2D) + data = wave.io.cdip.get_netcdf_variables( + self.test_nc, all_2D_variables=True, to_pandas=False + ) + returned_keys = [key for key in data["data"]["wave2D"].keys()] + self.assertTrue(set(returned_keys) == set(self.vars2D)) def test_get_netcdf_variables_params(self): - parameters =['waveHs', 'waveTp','notParam', 'waveMeanDirection'] - data = wave.io.cdip.get_netcdf_variables(self.test_nc, - parameters=parameters) - - returned_keys_1D = [key for key in data['data']['wave'].keys()] - returned_keys_2D = [key for key in data['data']['wave2D'].keys()] - returned_keys_metadata = [key for key in data['metadata']['wave']] + parameters = ["waveHs", "waveTp", "notParam", "waveMeanDirection"] + data = wave.io.cdip.get_netcdf_variables(self.test_nc, parameters=parameters) - self.assertTrue( returned_keys_1D == ['waveHs', 'waveTp']) - self.assertTrue( returned_keys_2D == 
['waveMeanDirection']) - self.assertTrue( returned_keys_metadata == ['waveFrequency']) + returned_keys_1D = set([key for key in data["data"]["wave"].keys()]) + returned_keys_2D = [key for key in data["data"]["wave2D"].keys()] + returned_keys_metadata = [key for key in data["metadata"]["wave"]] + self.assertTrue(returned_keys_1D == set(["waveHs", "waveTp"])) + self.assertTrue(returned_keys_2D == ["waveMeanDirection"]) + self.assertTrue(returned_keys_metadata == ["waveFrequency"]) def test_get_netcdf_variables_time_slice(self): - start_date='1996-10-01' - end_date='1996-10-31' + start_date = "1996-10-01" + end_date = "1996-10-31" - data = wave.io.cdip.get_netcdf_variables(self.test_nc, - start_date=start_date, end_date=end_date, - parameters='waveHs') + data = wave.io.cdip.get_netcdf_variables( + self.test_nc, start_date=start_date, end_date=end_date, parameters="waveHs" + ) - start_dt = datetime.strptime(start_date, '%Y-%m-%d') - end_dt = datetime.strptime(end_date, '%Y-%m-%d') - - self.assertTrue(data['data']['wave'].index[-1] < end_dt) - self.assertTrue(data['data']['wave'].index[0] > start_dt) + start_dt = datetime.strptime(start_date, "%Y-%m-%d") + end_dt = datetime.strptime(end_date, "%Y-%m-%d") + self.assertTrue(data["data"]["wave"].index[-1] < end_dt) + self.assertTrue(data["data"]["wave"].index[0] > start_dt) def test_request_parse_workflow_multiyear(self): - station_number = '067' - year1=2011 - year2=2013 + station_number = "067" + year1 = 2011 + year2 = 2013 years = [year1, year2] - parameters =['waveHs', 'waveMeanDirection', 'waveA1Value'] - data = wave.io.cdip.request_parse_workflow(station_number=station_number, - years=years, parameters =parameters ) - - expected_index0 = datetime(year1,1,1) - expected_index_final = datetime(year2,12,31) + parameters = ["waveHs", "waveMeanDirection", "waveA1Value"] + data = wave.io.cdip.request_parse_workflow( + station_number=station_number, years=years, parameters=parameters + ) - wave1D = data['data']['wave'] - 
self.assertEqual(wave1D.index[0].floor('d').to_pydatetime(), expected_index0) + expected_index0 = datetime(year1, 1, 1) + expected_index_final = datetime(year2, 12, 31) - self.assertEqual(wave1D.index[-1].floor('d').to_pydatetime(), expected_index_final) + wave1D = data["data"]["wave"] + self.assertEqual(wave1D.index[0].floor("d").to_pydatetime(), expected_index0) - for key,wave2D in data['data']['wave2D'].items(): - self.assertEqual(wave2D.index[0].floor('d').to_pydatetime(), expected_index0) - self.assertEqual(wave2D.index[-1].floor('d').to_pydatetime(), expected_index_final) + self.assertEqual( + wave1D.index[-1].floor("d").to_pydatetime(), expected_index_final + ) + for key, wave2D in data["data"]["wave2D"].items(): + self.assertEqual( + wave2D.index[0].floor("d").to_pydatetime(), expected_index0 + ) + self.assertEqual( + wave2D.index[-1].floor("d").to_pydatetime(), expected_index_final + ) def test_plot_boxplot(self): - filename = abspath(join(testdir, 'wave_plot_boxplot.png')) + filename = abspath(join(testdir, "wave_plot_boxplot.png")) if isfile(filename): os.remove(filename) - station_number = '067' + station_number = "067" year = 2011 - data = wave.io.cdip.request_parse_workflow(station_number=station_number,years=year, - parameters =['waveHs'], - all_2D_variables=False) + data = wave.io.cdip.request_parse_workflow( + station_number=station_number, + years=year, + parameters=["waveHs"], + all_2D_variables=False, + ) plt.figure() - wave.graphics.plot_boxplot(data['data']['wave']['waveHs']) - plt.savefig(filename, format='png') + wave.graphics.plot_boxplot(data["data"]["wave"]["waveHs"]) + plt.savefig(filename, format="png") plt.close() self.assertTrue(isfile(filename)) - + os.remove(filename) def test_plot_compendium(self): - filename = abspath(join(testdir, 'wave_plot_boxplot.png')) + filename = abspath(join(testdir, "wave_plot_boxplot.png")) if isfile(filename): os.remove(filename) - station_number = '067' + station_number = "067" year = 2011 - data = 
wave.io.cdip.request_parse_workflow(station_number=station_number,years=year, - parameters =['waveHs', 'waveTp', 'waveDp'], - all_2D_variables=False) + data = wave.io.cdip.request_parse_workflow( + station_number=station_number, + years=year, + parameters=["waveHs", "waveTp", "waveDp"], + all_2D_variables=False, + ) plt.figure() - wave.graphics.plot_compendium(data['data']['wave']['waveHs'], - data['data']['wave']['waveTp'], data['data']['wave']['waveDp'] ) - plt.savefig(filename, format='png') + wave.graphics.plot_compendium( + data["data"]["wave"]["waveHs"], + data["data"]["wave"]["waveTp"], + data["data"]["wave"]["waveDp"], + ) + plt.savefig(filename, format="png") plt.close() self.assertTrue(isfile(filename)) + os.remove(filename) -if __name__ == '__main__': +if __name__ == "__main__": unittest.main() diff --git a/mhkit/tests/wave/io/test_ndbc.py b/mhkit/tests/wave/io/test_ndbc.py index 444734824..aa5b86a96 100644 --- a/mhkit/tests/wave/io/test_ndbc.py +++ b/mhkit/tests/wave/io/test_ndbc.py @@ -5,6 +5,7 @@ import mhkit.wave as wave from io import StringIO import pandas as pd +import xarray as xr import numpy as np import contextlib import unittest @@ -12,38 +13,84 @@ testdir = dirname(abspath(__file__)) -datadir = normpath(join(testdir, '..', '..', '..', - '..', 'examples', 'data', 'wave')) +datadir = normpath(join(testdir, "..", "..", "..", "..", "examples", "data", "wave")) class TestIOndbc(unittest.TestCase): - @classmethod def setUpClass(self): - self.expected_columns_metRT = ['WDIR', 'WSPD', 'GST', 'WVHT', 'DPD', - 'APD', 'MWD', 'PRES', 'ATMP', 'WTMP', 'DEWP', 'VIS', 'PTDY', 'TIDE'] - self.expected_units_metRT = {'WDIR': 'degT', 'WSPD': 'm/s', 'GST': 'm/s', - 'WVHT': 'm', 'DPD': 'sec', 'APD': 'sec', 'MWD': 'degT', 'PRES': 'hPa', - 'ATMP': 'degC', 'WTMP': 'degC', 'DEWP': 'degC', 'VIS': 'nmi', - 'PTDY': 'hPa', 'TIDE': 'ft'} - - self.expected_columns_metH = ['WDIR', 'WSPD', 'GST', 'WVHT', 'DPD', - 'APD', 'MWD', 'PRES', 'ATMP', 'WTMP', 'DEWP', 'VIS', 'TIDE'] - 
self.expected_units_metH = {'WDIR': 'degT', 'WSPD': 'm/s', 'GST': 'm/s', - 'WVHT': 'm', 'DPD': 'sec', 'APD': 'sec', 'MWD': 'deg', 'PRES': 'hPa', - 'ATMP': 'degC', 'WTMP': 'degC', 'DEWP': 'degC', 'VIS': 'nmi', - 'TIDE': 'ft'} - self.filenames = ['46042w1996.txt.gz', - '46029w1997.txt.gz', - '46029w1998.txt.gz'] - self.swden = pd.read_csv(join(datadir, self.filenames[0]), sep=r'\s+', - compression='gzip') - - buoy = '42012' + self.expected_columns_metRT = [ + "WDIR", + "WSPD", + "GST", + "WVHT", + "DPD", + "APD", + "MWD", + "PRES", + "ATMP", + "WTMP", + "DEWP", + "VIS", + "PTDY", + "TIDE", + ] + self.expected_units_metRT = { + "WDIR": "degT", + "WSPD": "m/s", + "GST": "m/s", + "WVHT": "m", + "DPD": "sec", + "APD": "sec", + "MWD": "degT", + "PRES": "hPa", + "ATMP": "degC", + "WTMP": "degC", + "DEWP": "degC", + "VIS": "nmi", + "PTDY": "hPa", + "TIDE": "ft", + } + + self.expected_columns_metH = [ + "WDIR", + "WSPD", + "GST", + "WVHT", + "DPD", + "APD", + "MWD", + "PRES", + "ATMP", + "WTMP", + "DEWP", + "VIS", + "TIDE", + ] + self.expected_units_metH = { + "WDIR": "degT", + "WSPD": "m/s", + "GST": "m/s", + "WVHT": "m", + "DPD": "sec", + "APD": "sec", + "MWD": "deg", + "PRES": "hPa", + "ATMP": "degC", + "WTMP": "degC", + "DEWP": "degC", + "VIS": "nmi", + "TIDE": "ft", + } + self.filenames = ["46042w1996.txt.gz", "46029w1997.txt.gz", "46029w1998.txt.gz"] + self.swden = pd.read_csv( + join(datadir, self.filenames[0]), sep=r"\s+", compression="gzip" + ) + + buoy = "42012" year = 2021 - date = np.datetime64('2021-02-21T12:40:00') - directional_data_all = wave.io.ndbc.request_directional_data( - buoy, year) + date = np.datetime64("2021-02-21T12:40:00") + directional_data_all = wave.io.ndbc.request_directional_data(buoy, year) self.directional_data = directional_data_all.sel(date=date) @classmethod @@ -52,10 +99,9 @@ def tearDownClass(self): # Realtime data def test_ndbc_read_realtime_met(self): - data, units = wave.io.ndbc.read_file(join(datadir, '46097.txt')) + data, units = 
wave.io.ndbc.read_file(join(datadir, "46097.txt")) expected_index0 = datetime(2019, 4, 2, 13, 50) - self.assertSetEqual(set(data.columns), set( - self.expected_columns_metRT)) + self.assertSetEqual(set(data.columns), set(self.expected_columns_metRT)) self.assertEqual(data.index[0], expected_index0) self.assertEqual(data.shape, (6490, 14)) self.assertEqual(units, self.expected_units_metRT) @@ -63,8 +109,7 @@ def test_ndbc_read_realtime_met(self): # Historical data def test_ndbnc_read_historical_met(self): # QC'd monthly data, Aug 2019 - data, units = wave.io.ndbc.read_file( - join(datadir, '46097h201908qc.txt')) + data, units = wave.io.ndbc.read_file(join(datadir, "46097h201908qc.txt")) expected_index0 = datetime(2019, 8, 1, 0, 0) self.assertSetEqual(set(data.columns), set(self.expected_columns_metH)) self.assertEqual(data.index[0], expected_index0) @@ -73,86 +118,90 @@ def test_ndbnc_read_historical_met(self): # Spectral data def test_ndbc_read_spectral(self): - data, units = wave.io.ndbc.read_file(join(datadir, 'data.txt')) - self.assertEqual(data.shape, (743, 47)) + data, units = wave.io.ndbc.read_file(join(datadir, "data.txt"), to_pandas=False) + self.assertEqual(len(data.data_vars), 47) + self.assertEqual(len(data["dim_0"]), 743) self.assertEqual(units, None) # Continuous wind data def test_ndbc_read_cwind_no_units(self): - data, units = wave.io.ndbc.read_file(join(datadir, '42a01c2003.txt')) + data, units = wave.io.ndbc.read_file(join(datadir, "42a01c2003.txt")) self.assertEqual(data.shape, (4320, 5)) self.assertEqual(units, None) def test_ndbc_read_cwind_units(self): - data, units = wave.io.ndbc.read_file(join(datadir, '46002c2016.txt')) + data, units = wave.io.ndbc.read_file(join(datadir, "46002c2016.txt")) self.assertEqual(data.shape, (28468, 5)) - self.assertEqual(units, wave.io.ndbc.parameter_units('cwind')) + self.assertEqual(units, wave.io.ndbc.parameter_units("cwind")) def test_ndbc_available_data(self): - data = wave.io.ndbc.available_data('swden', 
buoy_number='46029') + data = wave.io.ndbc.available_data("swden", buoy_number="46029") cols = data.columns.tolist() - exp_cols = ['id', 'year', 'filename'] + exp_cols = ["id", "year", "filename"] self.assertEqual(cols, exp_cols) years = [int(year) for year in data.year.tolist()] - exp_years = [*range(1996, 1996+len(years))] + exp_years = [*range(1996, 1996 + len(years))] self.assertEqual(years, exp_years) self.assertEqual(data.shape, (len(data), 3)) def test__ndbc_parse_filenames(self): filenames = pd.Series(self.filenames) - buoys = wave.io.ndbc._parse_filenames('swden', filenames) + buoys = wave.io.ndbc._parse_filenames("swden", filenames) years = buoys.year.tolist() numbers = buoys.id.tolist() fnames = buoys.filename.tolist() self.assertEqual(buoys.shape, (len(filenames), 3)) - self.assertListEqual(years, ['1996', '1997', '1998']) - self.assertListEqual(numbers, ['46042', '46029', '46029']) + self.assertListEqual(years, ["1996", "1997", "1998"]) + self.assertListEqual(numbers, ["46042", "46029", "46029"]) self.assertListEqual(fnames, self.filenames) def test_ndbc_request_data(self): filenames = pd.Series(self.filenames[0]) - ndbc_data = wave.io.ndbc.request_data('swden', filenames) - self.assertTrue(self.swden.equals(ndbc_data['1996'])) + ndbc_data = wave.io.ndbc.request_data("swden", filenames, to_pandas=False) + self.assertTrue(xr.Dataset(self.swden).equals(ndbc_data["1996"])) def test_ndbc_request_data_from_dataframe(self): filenames = pd.DataFrame(pd.Series(data=self.filenames[0])) - ndbc_data = wave.io.ndbc.request_data('swden', filenames) - assert_frame_equal(self.swden, ndbc_data['1996']) + ndbc_data = wave.io.ndbc.request_data("swden", filenames) + assert_frame_equal(self.swden, ndbc_data["1996"]) def test_ndbc_request_data_filenames_length(self): - with self.assertRaises(AssertionError): - wave.io.ndbc.request_data('swden', pd.Series(dtype=float)) + with self.assertRaises(ValueError): + wave.io.ndbc.request_data("swden", pd.Series(dtype=float)) def 
test_ndbc_to_datetime_index(self): - dt = wave.io.ndbc.to_datetime_index('swden', self.swden) + dt = wave.io.ndbc.to_datetime_index("swden", self.swden) self.assertEqual(type(dt.index), pd.DatetimeIndex) - self.assertFalse({'YY', 'MM', 'DD', 'hh'}.issubset(dt.columns)) + self.assertFalse({"YY", "MM", "DD", "hh"}.issubset(dt.columns)) def test_ndbc_request_data_empty_file(self): temp_stdout = StringIO() # known empty file. If NDBC replaces, this test may fail. filename = "42008h1984.txt.gz" - buoy_id = '42008' - year = '1984' + buoy_id = "42008" + year = "1984" with contextlib.redirect_stdout(temp_stdout): - wave.io.ndbc.request_data('stdmet', pd.Series(filename)) + wave.io.ndbc.request_data("stdmet", pd.Series(filename)) output = temp_stdout.getvalue().strip() - msg = (f'The NDBC buoy {buoy_id} for year {year} with ' - f'filename {filename} is empty or missing ' - 'data. Please omit this file from your data ' - 'request in the future.') + msg = ( + f"The NDBC buoy {buoy_id} for year {year} with " + f"filename {filename} is empty or missing " + "data. Please omit this file from your data " + "request in the future." + ) self.assertEqual(output, msg) def test_ndbc_request_multiple_files_with_empty_file(self): temp_stdout = StringIO() # known empty file. If NDBC replaces, this test may fail. 
- empty_file = '42008h1984.txt.gz' - working_file = '46042h1996.txt.gz' + empty_file = "42008h1984.txt.gz" + working_file = "46042h1996.txt.gz" filenames = pd.Series([empty_file, working_file]) + with contextlib.redirect_stdout(temp_stdout): - ndbc_data = wave.io.ndbc.request_data('stdmet', filenames) + ndbc_data = wave.io.ndbc.request_data("stdmet", filenames) self.assertEqual(1, len(ndbc_data)) def test_ndbc_dates_to_datetime(self): @@ -161,19 +210,18 @@ def test_ndbc_dates_to_datetime(self): def test_ndbc_date_string_to_datetime(self): swden = self.swden.copy(deep=True) - swden['mm'] = np.zeros(len(swden)).astype(int).astype(str) - year_string = 'YY' - year_fmt = '%y' - parse_columns = [year_string, 'MM', 'DD', 'hh', 'mm'] - df = wave.io.ndbc._date_string_to_datetime(swden, parse_columns, - year_fmt) - dt = df['date'] + swden["mm"] = np.zeros(len(swden)).astype(int).astype(str) + year_string = "YY" + year_fmt = "%y" + parse_columns = [year_string, "MM", "DD", "hh", "mm"] + df = wave.io.ndbc._date_string_to_datetime(swden, parse_columns, year_fmt) + dt = df["date"] self.assertEqual(datetime(1996, 1, 1, 1, 0), dt[1]) def test_ndbc_parameter_units(self): - parameter = 'swden' + parameter = "swden" units = wave.io.ndbc.parameter_units(parameter) - self.assertEqual(units[parameter], '(m*m)/Hz') + self.assertEqual(units[parameter], "(m*m)/Hz") def test_ndbc_request_directional_data(self): data = self.directional_data @@ -189,31 +237,33 @@ def test_ndbc_request_directional_data(self): def test_ndbc_create_spread_function(self): directions = np.arange(0, 360, 2.0) - spread = wave.io.ndbc.create_spread_function( - self.directional_data, directions) + spread = wave.io.ndbc.create_spread_function(self.directional_data, directions) self.assertEqual(spread.shape, (47, 180)) - self.assertEqual(spread.units, '1/Hz/deg') + self.assertEqual(spread.units, "1/Hz/deg") def test_ndbc_create_directional_spectrum(self): directions = np.arange(0, 360, 2.0) spectrum = 
wave.io.ndbc.create_directional_spectrum( - self.directional_data, directions) + self.directional_data, directions + ) self.assertEqual(spectrum.shape, (47, 180)) - self.assertEqual(spectrum.units, 'm^2/Hz/deg') + self.assertEqual(spectrum.units, "m^2/Hz/deg") def test_plot_directional_spectrum(self): directions = np.arange(0, 360, 2.0) spectrum = wave.io.ndbc.create_spread_function( - self.directional_data, directions) + self.directional_data, directions + ) wave.graphics.plot_directional_spectrum( spectrum, - min=0.0, + color_level_min=0.0, fill=True, nlevels=6, name="Elevation Variance", - units="m^2") + units="m^2", + ) - filename = abspath(join(testdir, 'wave_plot_directional_spectrum.png')) + filename = abspath(join(testdir, "wave_plot_directional_spectrum.png")) if isfile(filename): os.remove(filename) plt.savefig(filename) @@ -224,27 +274,28 @@ def test_plot_directional_spectrum(self): def test_get_buoy_metadata(self): metadata = wave.io.ndbc.get_buoy_metadata("46042") expected_keys = { - 'buoy', - 'provider', - 'type', - 'SCOOP payload', - 'lat', - 'lon', - 'Site elevation', - 'Air temp height', - 'Anemometer height', - 'Barometer elevation', - 'Sea temp depth', - 'Water depth', - 'Watch circle radius' + "buoy", + "provider", + "type", + "SCOOP payload", + "lat", + "lon", + "Site elevation", + "Air temp height", + "Anemometer height", + "Barometer elevation", + "Sea temp depth", + "Water depth", + "Watch circle radius", } self.assertSetEqual(set(metadata.keys()), expected_keys) self.assertEqual( - metadata['provider'], 'Owned and maintained by National Data Buoy Center') - self.assertEqual(metadata['type'], '3-meter foam buoy w/ seal cage') - self.assertAlmostEqual(float(metadata['lat']), 36.785) - self.assertAlmostEqual(float(metadata['lon']), 122.396) - self.assertEqual(metadata['Site elevation'], 'sea level') + metadata["provider"], "Owned and maintained by National Data Buoy Center" + ) + self.assertEqual(metadata["type"], "3-meter foam buoy w/ seal 
cage") + self.assertAlmostEqual(float(metadata["lat"]), 36.785) + self.assertAlmostEqual(float(metadata["lon"]), 122.396) + self.assertEqual(metadata["Site elevation"], "sea level") def test_get_buoy_metadata_invalid_station(self): with self.assertRaises(ValueError): @@ -255,5 +306,5 @@ def test_get_buoy_metadata_nonexistent_station(self): wave.io.ndbc.get_buoy_metadata("99999") -if __name__ == '__main__': +if __name__ == "__main__": unittest.main() diff --git a/mhkit/tests/wave/io/test_swan.py b/mhkit/tests/wave/io/test_swan.py index c3e113d81..6388bac2b 100644 --- a/mhkit/tests/wave/io/test_swan.py +++ b/mhkit/tests/wave/io/test_swan.py @@ -9,6 +9,7 @@ import mhkit.wave as wave from io import StringIO import pandas as pd +import xarray as xr import numpy as np import contextlib import unittest @@ -22,19 +23,22 @@ testdir = dirname(abspath(__file__)) -datadir = normpath(join(testdir,'..','..','..','..','examples','data','wave')) +datadir = normpath(join(testdir, "..", "..", "..", "..", "examples", "data", "wave")) class TestSWAN(unittest.TestCase): - @classmethod def setUpClass(self): - swan_datadir = join(datadir,'swan') - self.table_file = join(swan_datadir,'SWANOUT.DAT') - self.swan_block_mat_file = join(swan_datadir,'SWANOUT.MAT') - self.swan_block_txt_file = join(swan_datadir,'SWANOUTBlock.DAT') - self.expected_table = pd.read_csv(self.table_file, sep='\s+', comment='%', - names=['Xp', 'Yp', 'Hsig', 'Dir', 'RTpeak', 'TDir']) + swan_datadir = join(datadir, "swan") + self.table_file = join(swan_datadir, "SWANOUT.DAT") + self.swan_block_mat_file = join(swan_datadir, "SWANOUT.MAT") + self.swan_block_txt_file = join(swan_datadir, "SWANOUTBlock.DAT") + self.expected_table = pd.read_csv( + self.table_file, + sep="\s+", + comment="%", + names=["Xp", "Yp", "Hsig", "Dir", "RTpeak", "TDir"], + ) @classmethod def tearDownClass(self): @@ -45,39 +49,49 @@ def test_read_table(self): assert_frame_equal(self.expected_table, swan_table) def test_read_block_mat(self): - 
swanBlockMat, metaDataMat = wave.io.swan.read_block(self.swan_block_mat_file ) + swanBlockMat, metaDataMat = wave.io.swan.read_block(self.swan_block_mat_file) self.assertEqual(len(swanBlockMat), 4) - self.assertAlmostEqual(self.expected_table['Hsig'].sum(), - swanBlockMat['Hsig'].sum().sum(), places=1) + self.assertAlmostEqual( + self.expected_table["Hsig"].sum(), + swanBlockMat["Hsig"].sum().sum(), + places=1, + ) def test_read_block_txt(self): swanBlockTxt, metaData = wave.io.swan.read_block(self.swan_block_txt_file) self.assertEqual(len(swanBlockTxt), 4) - sumSum = swanBlockTxt['Significant wave height'].sum().sum() - self.assertAlmostEqual(self.expected_table['Hsig'].sum(), - sumSum, places=-2) + sumSum = swanBlockTxt["Significant wave height"].sum().sum() + self.assertAlmostEqual(self.expected_table["Hsig"].sum(), sumSum, places=-2) + + def test_read_block_txt_xarray(self): + swanBlockTxt, metaData = wave.io.swan.read_block( + self.swan_block_txt_file, to_pandas=False + ) + self.assertEqual(len(swanBlockTxt), 4) + sumSum = swanBlockTxt["Significant wave height"].sum().sum() + self.assertAlmostEqual(self.expected_table["Hsig"].sum(), sumSum, places=-2) def test_block_to_table(self): - x=np.arange(5) - y=np.arange(5,10) - df = pd.DataFrame(np.random.rand(5,5), columns=x, index=y) + x = np.arange(5) + y = np.arange(5, 10) + df = pd.DataFrame(np.random.rand(5, 5), columns=x, index=y) dff = wave.io.swan.block_to_table(df) - self.assertEqual(dff.shape, (len(x)*len(y), 3)) + self.assertEqual(dff.shape, (len(x) * len(y), 3)) self.assertTrue(all(dff.x.unique() == np.unique(x))) def test_dictionary_of_block_to_table(self): - x=np.arange(5) - y=np.arange(5,10) - df = pd.DataFrame(np.random.rand(5,5), columns=x, index=y) - keys = ['data1', 'data2'] + x = np.arange(5) + y = np.arange(5, 10) + df = pd.DataFrame(np.random.rand(5, 5), columns=x, index=y) + keys = ["data1", "data2"] data = [df, df] - dict_of_dfs = dict(zip(keys,data)) + dict_of_dfs = dict(zip(keys, data)) dff 
= wave.io.swan.dictionary_of_block_to_table(dict_of_dfs) - self.assertEqual(dff.shape, (len(x)*len(y), 2+len(keys))) + self.assertEqual(dff.shape, (len(x) * len(y), 2 + len(keys))) self.assertTrue(all(dff.x.unique() == np.unique(x))) for key in keys: self.assertTrue(key in dff.keys()) -if __name__ == '__main__': +if __name__ == "__main__": unittest.main() diff --git a/mhkit/tests/wave/io/test_wecsim.py b/mhkit/tests/wave/io/test_wecsim.py index 3c070458c..52df214b9 100644 --- a/mhkit/tests/wave/io/test_wecsim.py +++ b/mhkit/tests/wave/io/test_wecsim.py @@ -22,11 +22,10 @@ testdir = dirname(abspath(__file__)) -datadir = normpath(join(testdir,'..','..','..','..','examples','data','wave')) +datadir = normpath(join(testdir, "..", "..", "..", "..", "examples", "data", "wave")) class TestWECSim(unittest.TestCase): - @classmethod def setUpClass(self): pass @@ -37,52 +36,61 @@ def tearDownClass(self): ### WEC-Sim data, no mooring def test_read_wecSim_no_mooring(self): - ws_output = wave.io.wecsim.read_output(join(datadir, 'RM3_matlabWorkspace_structure.mat')) - self.assertEqual(ws_output['wave'].elevation.name,'elevation') - self.assertEqual(ws_output['bodies']['body1'].name,'float') - self.assertEqual(ws_output['ptos'].name,'PTO1') - self.assertEqual(ws_output['constraints'].name,'Constraint1') - self.assertEqual(len(ws_output['mooring']),0) - self.assertEqual(len(ws_output['moorDyn']),0) - self.assertEqual(len(ws_output['ptosim']),0) - self.assertEqual(len(ws_output['cables']),0) - + ws_output = wave.io.wecsim.read_output( + join(datadir, "RM3_matlabWorkspace_structure.mat") + ) + self.assertEqual(ws_output["wave"].elevation.name, "elevation") + self.assertEqual(ws_output["bodies"]["body1"].name, "float") + self.assertEqual(ws_output["ptos"].name, "PTO1") + self.assertEqual(ws_output["constraints"].name, "Constraint1") + self.assertEqual(len(ws_output["mooring"]), 0) + self.assertEqual(len(ws_output["moorDyn"]), 0) + self.assertEqual(len(ws_output["ptosim"]), 0) + 
self.assertEqual(len(ws_output["cables"]), 0) + ### WEC-Sim data, with cable def test_read_wecSim_cable(self): - ws_output = wave.io.wecsim.read_output(join(datadir, 'Cable_matlabWorkspace_structure.mat')) - self.assertEqual(ws_output['wave'].elevation.name,'elevation') - self.assertEqual(ws_output['bodies']['body1'].name,'BuoyDraft5cm') - self.assertEqual(ws_output['cables'].name,'Cable') - self.assertEqual(ws_output['constraints']['constraint1'].name,'Mooring') - self.assertEqual(len(ws_output['mooring']),0) - self.assertEqual(len(ws_output['moorDyn']),0) - self.assertEqual(len(ws_output['ptosim']),0) - self.assertEqual(len(ws_output['ptos']),0) + ws_output = wave.io.wecsim.read_output( + join(datadir, "Cable_matlabWorkspace_structure.mat"), + to_pandas=False, + ) + self.assertEqual(ws_output["wave"]["elevation"].name, "elevation") + self.assertEqual( + ws_output["bodies"]["body1"]["position_dof1"].name, "position_dof1" + ) + self.assertEqual(len(ws_output["mooring"]), 0) + self.assertEqual(len(ws_output["moorDyn"]), 0) + self.assertEqual(len(ws_output["ptosim"]), 0) + self.assertEqual(len(ws_output["ptos"]), 0) ### WEC-Sim data, with mooring def test_read_wecSim_with_mooring(self): - ws_output = wave.io.wecsim.read_output(join(datadir, 'RM3MooringMatrix_matlabWorkspace_structure.mat')) - self.assertEqual(ws_output['wave'].elevation.name,'elevation') - self.assertEqual(ws_output['bodies']['body1'].name,'float') - self.assertEqual(ws_output['ptos'].name,'PTO1') - self.assertEqual(ws_output['constraints'].name,'Constraint1') - self.assertEqual(len(ws_output['mooring']),40001) - self.assertEqual(len(ws_output['moorDyn']),0) - self.assertEqual(len(ws_output['ptosim']),0) - self.assertEqual(len(ws_output['cables']),0) + ws_output = wave.io.wecsim.read_output( + join(datadir, "RM3MooringMatrix_matlabWorkspace_structure.mat") + ) + self.assertEqual(ws_output["wave"].elevation.name, "elevation") + self.assertEqual(ws_output["bodies"]["body1"].name, "float") + 
self.assertEqual(ws_output["ptos"].name, "PTO1") + self.assertEqual(ws_output["constraints"].name, "Constraint1") + self.assertEqual(len(ws_output["mooring"]), 40001) + self.assertEqual(len(ws_output["moorDyn"]), 0) + self.assertEqual(len(ws_output["ptosim"]), 0) + self.assertEqual(len(ws_output["cables"]), 0) ### WEC-Sim data, with moorDyn def test_read_wecSim_with_moorDyn(self): - ws_output = wave.io.wecsim.read_output(join(datadir, 'RM3MoorDyn_matlabWorkspace_structure.mat')) - self.assertEqual(ws_output['wave'].elevation.name,'elevation') - self.assertEqual(ws_output['bodies']['body1'].name,'float') - self.assertEqual(ws_output['ptos'].name,'PTO1') - self.assertEqual(ws_output['constraints'].name,'Constraint1') - self.assertEqual(len(ws_output['mooring']),40001) - self.assertEqual(len(ws_output['moorDyn']),7) - self.assertEqual(len(ws_output['ptosim']),0) - self.assertEqual(len(ws_output['cables']),0) + ws_output = wave.io.wecsim.read_output( + join(datadir, "RM3MoorDyn_matlabWorkspace_structure.mat") + ) + self.assertEqual(ws_output["wave"].elevation.name, "elevation") + self.assertEqual(ws_output["bodies"]["body1"].name, "float") + self.assertEqual(ws_output["ptos"].name, "PTO1") + self.assertEqual(ws_output["constraints"].name, "Constraint1") + self.assertEqual(len(ws_output["mooring"]), 40001) + self.assertEqual(len(ws_output["moorDyn"]), 7) + self.assertEqual(len(ws_output["ptosim"]), 0) + self.assertEqual(len(ws_output["cables"]), 0) -if __name__ == '__main__': +if __name__ == "__main__": unittest.main() diff --git a/mhkit/tests/wave/test_contours.py b/mhkit/tests/wave/test_contours.py index fab2f828a..b0281665d 100644 --- a/mhkit/tests/wave/test_contours.py +++ b/mhkit/tests/wave/test_contours.py @@ -1,241 +1,545 @@ from os.path import abspath, dirname, join, isfile, normpath, relpath -from pandas.testing import assert_frame_equal from numpy.testing import assert_allclose -from scipy.interpolate import interp1d -from random import seed, randint import 
matplotlib.pylab as plt -from datetime import datetime -import xarray.testing as xrt import mhkit.wave as wave -from io import StringIO import pandas as pd import numpy as np -import contextlib +import warnings import unittest -import netCDF4 -import inspect import pickle -import time import json -import sys import os testdir = dirname(abspath(__file__)) -plotdir = join(testdir, 'plots') +plotdir = join(testdir, "plots") isdir = os.path.isdir(plotdir) -if not isdir: os.mkdir(plotdir) -datadir = normpath(join(testdir,relpath('../../../examples/data/wave'))) +if not isdir: + os.mkdir(plotdir) +datadir = normpath(join(testdir, relpath("../../../examples/data/wave"))) class TestContours(unittest.TestCase): - @classmethod def setUpClass(self): + f_name = "Hm0_Te_46022.json" + self.Hm0Te = pd.read_json(join(datadir, f_name)) - f_name= 'Hm0_Te_46022.json' - self.Hm0Te = pd.read_json(join(datadir,f_name)) - - file_loc=join(datadir, 'principal_component_analysis.pkl') - with open(file_loc, 'rb') as f: + file_loc = join(datadir, "principal_component_analysis.pkl") + with open(file_loc, "rb") as f: self.pca = pickle.load(f) f.close() - file_loc=join(datadir,'WDRT_caluculated_countours.json') + file_loc = join(datadir, "WDRT_caluculated_countours.json") with open(file_loc) as f: self.wdrt_copulas = json.load(f) f.close() - ndbc_46050=pd.read_csv(join(datadir,'NDBC46050.csv')) - self.wdrt_Hm0 = ndbc_46050['Hm0'] - self.wdrt_Te = ndbc_46050['Te'] + ndbc_46050 = pd.read_csv(join(datadir, "NDBC46050.csv")) + self.wdrt_Hm0 = ndbc_46050["Hm0"] + self.wdrt_Te = ndbc_46050["Te"] - self.wdrt_dt=3600 - self.wdrt_period= 50 + self.wdrt_dt = 3600 + self.wdrt_period = 50 @classmethod def tearDownClass(self): pass def test_environmental_contour(self): - Hm0Te = self.Hm0Te - df = Hm0Te[Hm0Te['Hm0'] < 20] + df = Hm0Te[Hm0Te["Hm0"] < 20] Hm0 = df.Hm0.values Te = df.Te.values - dt_ss = (Hm0Te.index[2]-Hm0Te.index[1]).seconds + dt_ss = (Hm0Te.index[2] - Hm0Te.index[1]).seconds period = 100 - 
copula = wave.contours.environmental_contours(Hm0, - Te, dt_ss, period, 'PCA') + copula = wave.contours.environmental_contours(Hm0, Te, dt_ss, period, "PCA") - Hm0_contour=copula['PCA_x1'] - Te_contour=copula['PCA_x2'] + Hm0_contour = copula["PCA_x1"] + Te_contour = copula["PCA_x2"] - file_loc=join(datadir,'Hm0_Te_contours_46022.csv') + file_loc = join(datadir, "Hm0_Te_contours_46022.csv") expected_contours = pd.read_csv(file_loc) - assert_allclose(expected_contours.Hm0_contour.values, - Hm0_contour, rtol=1e-3) + assert_allclose(expected_contours.Hm0_contour.values, Hm0_contour, rtol=1e-3) + + def test_environmental_contours_invalid_inputs(self): + # Invalid x1 tests + x1_non_numeric = "not an array" + with self.assertRaises(TypeError): + wave.contours.environmental_contours( + x1_non_numeric, self.wdrt_Te, 3600, 50, "PCA" + ) + + x1_scalar = 5 + with self.assertRaises(TypeError): + wave.contours.environmental_contours( + x1_scalar, self.wdrt_Te, 3600, 50, "PCA" + ) + + # Invalid x2 tests + x2_non_numeric = "not an array" + with self.assertRaises(TypeError): + wave.contours.environmental_contours( + self.wdrt_Hm0, x2_non_numeric, 3600, 50, "PCA" + ) + + x2_scalar = 10 + with self.assertRaises(TypeError): + wave.contours.environmental_contours( + self.wdrt_Hm0, x2_scalar, 3600, 50, "PCA" + ) + + # Unequal lengths of x1 and x2 + x2_unequal_length = self.wdrt_Te[:-1] + with self.assertRaises(ValueError): + wave.contours.environmental_contours( + self.wdrt_Hm0, x2_unequal_length, 3600, 50, "PCA" + ) + + # Invalid sea_state_duration tests + invalid_sea_state_duration_string = "one hour" + with self.assertRaises(TypeError): + wave.contours.environmental_contours( + self.wdrt_Hm0, + self.wdrt_Te, + invalid_sea_state_duration_string, + 50, + "PCA", + ) + + invalid_sea_state_duration_list = [3600] + with self.assertRaises(TypeError): + wave.contours.environmental_contours( + self.wdrt_Hm0, self.wdrt_Te, invalid_sea_state_duration_list, 50, "PCA" + ) + + # Invalid 
return_period tests + invalid_return_period_string = "fifty years" + with self.assertRaises(TypeError): + wave.contours.environmental_contours( + self.wdrt_Hm0, self.wdrt_Te, 3600, invalid_return_period_string, "PCA" + ) + + invalid_return_period_list = [50] + with self.assertRaises(TypeError): + wave.contours.environmental_contours( + self.wdrt_Hm0, self.wdrt_Te, 3600, invalid_return_period_list, "PCA" + ) + + # Invalid method tests + invalid_method = 123 + with self.assertRaises(TypeError): + wave.contours.environmental_contours( + self.wdrt_Hm0, self.wdrt_Te, 3600, 50, invalid_method + ) + + invalid_bin_val_size = "not a number" + with self.assertRaises(TypeError): + wave.contours.environmental_contours( + self.wdrt_Hm0, + self.wdrt_Te, + 3600, + 50, + "PCA", + bin_val_size=invalid_bin_val_size, + ) + + invalid_nb_steps = 100.5 + with self.assertRaises(TypeError): + wave.contours.environmental_contours( + self.wdrt_Hm0, self.wdrt_Te, 3600, 50, "PCA", nb_steps=invalid_nb_steps + ) + + invalid_initial_bin_max_val = "not a number" + with self.assertRaises(TypeError): + wave.contours.environmental_contours( + self.wdrt_Hm0, + self.wdrt_Te, + 3600, + 50, + "PCA", + initial_bin_max_val=invalid_initial_bin_max_val, + ) + + invalid_min_bin_count = 40.5 + with self.assertRaises(TypeError): + wave.contours.environmental_contours( + self.wdrt_Hm0, + self.wdrt_Te, + 3600, + 50, + "PCA", + min_bin_count=invalid_min_bin_count, + ) + + with self.assertRaises(TypeError): + wave.contours.environmental_contours( + self.wdrt_Hm0, self.wdrt_Te, 3600, 50, "bivariate_KDE" + ) + + invalid_PCA = "not a dict" + with self.assertRaises(TypeError): + wave.contours.environmental_contours( + self.wdrt_Hm0, self.wdrt_Te, 3600, 50, "PCA", PCA=invalid_PCA + ) + + invalid_PCA_bin_size = "not an int" + with self.assertRaises(TypeError): + wave.contours.environmental_contours( + self.wdrt_Hm0, + self.wdrt_Te, + 3600, + 50, + "PCA", + PCA_bin_size=invalid_PCA_bin_size, + ) + + invalid_return_fit = 
"not a boolean" + with self.assertRaises(TypeError): + wave.contours.environmental_contours( + self.wdrt_Hm0, + self.wdrt_Te, + 3600, + 50, + "PCA", + return_fit=invalid_return_fit, + ) + + invalid_Ndata_bivariate_KDE = "not a number" + with self.assertRaises(TypeError): + wave.contours.environmental_contours( + self.wdrt_Hm0, + self.wdrt_Te, + 3600, + 50, + "bivariate_KDE", + Ndata_bivariate_KDE=invalid_Ndata_bivariate_KDE, + ) + + invalid_max_x1 = "not a number" + with self.assertRaises(TypeError): + wave.contours.environmental_contours( + self.wdrt_Hm0, self.wdrt_Te, 3600, 50, "PCA", max_x1=invalid_max_x1 + ) + + invalid_max_x2 = "not a number" + with self.assertRaises(TypeError): + wave.contours.environmental_contours( + self.wdrt_Hm0, self.wdrt_Te, 3600, 50, "PCA", max_x2=invalid_max_x2 + ) + + invalid_bandwidth = "not a number" + with self.assertRaises(TypeError): + wave.contours.environmental_contours( + self.wdrt_Hm0, + self.wdrt_Te, + 3600, + 50, + "bivariate_KDE", + bandwidth=invalid_bandwidth, + ) + + def test_PCA_contours_invalid_inputs(self): + Hm0Te = self.Hm0Te + df = Hm0Te[Hm0Te["Hm0"] < 20] + + Hm0 = df.Hm0.values + Te = df.Te.values + + dt_ss = (Hm0Te.index[2] - Hm0Te.index[1]).seconds + period = 100 + + copula = wave.contours.environmental_contours( + Hm0, Te, dt_ss, period, "PCA", return_fit=True + ) + + PCA_args = { + "nb_steps": 1000, + "return_fit": False, + "bin_size": 250, + } + + # Invalid x1 tests + x1_non_numeric = "not an array" + with self.assertRaises(TypeError): + wave.contours.PCA_contour( + x1_non_numeric, self.wdrt_Te, copula["PCA_fit"], PCA_args + ) + + x1_scalar = 5 + with self.assertRaises(TypeError): + wave.contours.PCA_contour( + x1_scalar, self.wdrt_Te, copula["PCA_fit"], PCA_args + ) + + # Invalid x2 tests + x2_non_numeric = "not an array" + with self.assertRaises(TypeError): + wave.contours.PCA_contour( + self.wdrt_Hm0, x2_non_numeric, copula["PCA_fit"], PCA_args + ) + + x2_scalar = 10 + with self.assertRaises(TypeError): 
+ wave.contours.PCA_contour( + self.wdrt_Hm0, x2_scalar, copula["PCA_fit"], PCA_args + ) + + # Unequal lengths of x1 and x2 + x2_unequal_length = self.wdrt_Te[:-1] + with self.assertRaises(ValueError): + wave.contours.PCA_contour( + self.wdrt_Hm0, x2_unequal_length, copula["PCA_fit"], PCA_args + ) def test__principal_component_analysis(self): Hm0Te = self.Hm0Te - df = Hm0Te[Hm0Te['Hm0'] < 20] + df = Hm0Te[Hm0Te["Hm0"] < 20] + + Hm0 = df.Hm0.values + Te = df.Te.values + PCA = wave.contours._principal_component_analysis(Hm0, Te, bin_size=250) + + assert_allclose(PCA["principal_axes"], self.pca["principal_axes"]) + self.assertAlmostEqual(PCA["shift"], self.pca["shift"]) + self.assertAlmostEqual(PCA["x1_fit"]["mu"], self.pca["x1_fit"]["mu"]) + self.assertAlmostEqual(PCA["mu_fit"].slope, self.pca["mu_fit"].slope) + self.assertAlmostEqual(PCA["mu_fit"].intercept, self.pca["mu_fit"].intercept) + assert_allclose(PCA["sigma_fit"]["x"], self.pca["sigma_fit"]["x"]) + + def test__principal_component_analysis_invalid_inputs(self): + x1_valid = np.array([1, 2, 3]) + x2_valid = np.array([1, 2, 3]) + + # Test invalid x1 (non-array input) + x1_non_array = "not an array" + with self.assertRaises(TypeError): + wave.contours._principal_component_analysis(x1_non_array, x2_valid) + + # Test invalid x2 (non-array input) + x2_non_array = "not an array" + with self.assertRaises(TypeError): + wave.contours._principal_component_analysis(x1_valid, x2_non_array) + + # Test invalid bin_size (non-integer input) + invalid_bin_size = "not an integer" + with self.assertRaises(TypeError): + wave.contours._principal_component_analysis( + x1_valid, x2_valid, bin_size=invalid_bin_size + ) + + def test_principal_component_analysis_bin_size_adjustment_warning(self): + Hm0Te = self.Hm0Te + df = Hm0Te[Hm0Te["Hm0"] < 20] Hm0 = df.Hm0.values Te = df.Te.values - PCA = (wave.contours - ._principal_component_analysis(Hm0,Te, bin_size=250)) - - assert_allclose(PCA['principal_axes'], - self.pca['principal_axes']) 
- self.assertAlmostEqual(PCA['shift'], self.pca['shift']) - self.assertAlmostEqual(PCA['x1_fit']['mu'], - self.pca['x1_fit']['mu']) - self.assertAlmostEqual(PCA['mu_fit'].slope, - self.pca['mu_fit'].slope) - self.assertAlmostEqual(PCA['mu_fit'].intercept, - self.pca['mu_fit'].intercept) - assert_allclose(PCA['sigma_fit']['x'], - self.pca['sigma_fit']['x']) + + large_bin_size = 1000000 + + with warnings.catch_warnings(record=True) as w: + warnings.simplefilter("always") # Cause all warnings to always be triggered + wave.contours._principal_component_analysis( + Hm0, Te, bin_size=large_bin_size + ) + + self.assertTrue(len(w) == 1) # Check that exactly one warning was raised + self.assertTrue( + issubclass(w[-1].category, UserWarning) + ) # Check the warning category + self.assertIn( + "To allow for a minimum of 4 bins, the bin size has been set to", + str(w[-1].message), + ) def test_plot_environmental_contour(self): - file_loc= join(plotdir, 'wave_plot_environmental_contour.png') + file_loc = join(plotdir, "wave_plot_environmental_contour.png") filename = abspath(file_loc) if isfile(filename): os.remove(filename) Hm0Te = self.Hm0Te - df = Hm0Te[Hm0Te['Hm0'] < 20] + df = Hm0Te[Hm0Te["Hm0"] < 20] Hm0 = df.Hm0.values Te = df.Te.values - dt_ss = (Hm0Te.index[2]-Hm0Te.index[1]).seconds + dt_ss = (Hm0Te.index[2] - Hm0Te.index[1]).seconds time_R = 100 - copulas = wave.contours.environmental_contours(Hm0, Te, dt_ss, - time_R, 'PCA') + copulas = wave.contours.environmental_contours(Hm0, Te, dt_ss, time_R, "PCA") - Hm0_contour=copulas['PCA_x1'] - Te_contour=copulas['PCA_x2'] + Hm0_contour = copulas["PCA_x1"] + Te_contour = copulas["PCA_x2"] - dt_ss = (Hm0Te.index[2]-Hm0Te.index[1]).seconds + dt_ss = (Hm0Te.index[2] - Hm0Te.index[1]).seconds time_R = 100 plt.figure() - (wave.graphics - .plot_environmental_contour(Te, Hm0, - Te_contour, Hm0_contour, - data_label='NDBC 46022', - contour_label='100-year Contour', - x_label = 'Te [s]', - y_label = 'Hm0 [m]') + ( + 
wave.graphics.plot_environmental_contour( + Te, + Hm0, + Te_contour, + Hm0_contour, + data_label="NDBC 46022", + contour_label="100-year Contour", + x_label="Te [s]", + y_label="Hm0 [m]", + ) ) - plt.savefig(filename, format='png') + plt.savefig(filename, format="png") plt.close() self.assertTrue(isfile(filename)) def test_plot_environmental_contour_multiyear(self): - filename = abspath(join(plotdir, - 'wave_plot_environmental_contour_multiyear.png')) + filename = abspath( + join(plotdir, "wave_plot_environmental_contour_multiyear.png") + ) if isfile(filename): os.remove(filename) Hm0Te = self.Hm0Te - df = Hm0Te[Hm0Te['Hm0'] < 20] + df = Hm0Te[Hm0Te["Hm0"] < 20] Hm0 = df.Hm0.values Te = df.Te.values - dt_ss = (Hm0Te.index[2]-Hm0Te.index[1]).seconds + dt_ss = (Hm0Te.index[2] - Hm0Te.index[1]).seconds time_R = [100, 105, 110, 120, 150] - Hm0s=[] - Tes=[] + Hm0s = [] + Tes = [] for period in time_R: - copulas = (wave.contours - .environmental_contours(Hm0,Te,dt_ss,period,'PCA')) + copulas = wave.contours.environmental_contours( + Hm0, Te, dt_ss, period, "PCA" + ) - Hm0s.append(copulas['PCA_x1']) - Tes.append(copulas['PCA_x2']) + Hm0s.append(copulas["PCA_x1"]) + Tes.append(copulas["PCA_x2"]) - contour_label = [f'{year}-year Contour' for year in time_R] + contour_label = [f"{year}-year Contour" for year in time_R] plt.figure() - (wave.graphics - .plot_environmental_contour(Te, Hm0, - Tes, Hm0s, - data_label='NDBC 46022', - contour_label=contour_label, - x_label = 'Te [s]', - y_label = 'Hm0 [m]') - ) - plt.savefig(filename, format='png') + ( + wave.graphics.plot_environmental_contour( + Te, + Hm0, + Tes, + Hm0s, + data_label="NDBC 46022", + contour_label=contour_label, + x_label="Te [s]", + y_label="Hm0 [m]", + ) + ) + plt.savefig(filename, format="png") plt.close() self.assertTrue(isfile(filename)) def test_standard_copulas(self): - copulas = (wave.contours - .environmental_contours(self.wdrt_Hm0, self.wdrt_Te, - self.wdrt_dt, self.wdrt_period, - method=['gaussian', 
'gumbel', 'clayton']) - ) + copulas = wave.contours.environmental_contours( + self.wdrt_Hm0, + self.wdrt_Te, + self.wdrt_dt, + self.wdrt_period, + method=["gaussian", "gumbel", "clayton"], + ) # WDRT slightly vaires Rosenblatt copula parameters from # the other copula default parameters - rosen = (wave.contours - .environmental_contours(self.wdrt_Hm0, self.wdrt_Te, - self.wdrt_dt, self.wdrt_period, method=['rosenblatt'], - min_bin_count=50, initial_bin_max_val=0.5, - bin_val_size=0.25)) - copulas['rosenblatt_x1'] = rosen['rosenblatt_x1'] - copulas['rosenblatt_x2'] = rosen['rosenblatt_x2'] - - methods=['gaussian', 'gumbel', 'clayton', 'rosenblatt'] - close=[] + rosen = wave.contours.environmental_contours( + self.wdrt_Hm0, + self.wdrt_Te, + self.wdrt_dt, + self.wdrt_period, + method=["rosenblatt"], + min_bin_count=50, + initial_bin_max_val=0.5, + bin_val_size=0.25, + ) + copulas["rosenblatt_x1"] = rosen["rosenblatt_x1"] + copulas["rosenblatt_x2"] = rosen["rosenblatt_x2"] + + methods = ["gaussian", "gumbel", "clayton", "rosenblatt"] + close = [] for method in methods: - close.append(np.allclose(copulas[f'{method}_x1'], - self.wdrt_copulas[f'{method}_x1'])) - close.append(np.allclose(copulas[f'{method}_x2'], - self.wdrt_copulas[f'{method}_x2'])) + close.append( + np.allclose(copulas[f"{method}_x1"], self.wdrt_copulas[f"{method}_x1"]) + ) + close.append( + np.allclose(copulas[f"{method}_x2"], self.wdrt_copulas[f"{method}_x2"]) + ) self.assertTrue(all(close)) def test_nonparametric_copulas(self): - methods=['nonparametric_gaussian','nonparametric_clayton', - 'nonparametric_gumbel'] - - np_copulas = wave.contours.environmental_contours(self.wdrt_Hm0, - self.wdrt_Te, self.wdrt_dt, self.wdrt_period, method=methods) + methods = [ + "nonparametric_gaussian", + "nonparametric_clayton", + "nonparametric_gumbel", + ] + + np_copulas = wave.contours.environmental_contours( + self.wdrt_Hm0, self.wdrt_Te, self.wdrt_dt, self.wdrt_period, method=methods + ) - close=[] + close = [] 
for method in methods: - close.append(np.allclose(np_copulas[f'{method}_x1'], - self.wdrt_copulas[f'{method}_x1'], atol=0.13)) - close.append(np.allclose(np_copulas[f'{method}_x2'], - self.wdrt_copulas[f'{method}_x2'], atol=0.13)) + close.append( + np.allclose( + np_copulas[f"{method}_x1"], + self.wdrt_copulas[f"{method}_x1"], + atol=0.13, + ) + ) + close.append( + np.allclose( + np_copulas[f"{method}_x2"], + self.wdrt_copulas[f"{method}_x2"], + atol=0.13, + ) + ) self.assertTrue(all(close)) def test_kde_copulas(self): - kde_copula = wave.contours.environmental_contours(self.wdrt_Hm0, - self.wdrt_Te, self.wdrt_dt, self.wdrt_period, - method=['bivariate_KDE'], bandwidth=[0.23, 0.23]) - log_kde_copula = (wave.contours - .environmental_contours(self.wdrt_Hm0, self.wdrt_Te, - self.wdrt_dt, self.wdrt_period, method=['bivariate_KDE_log'], bandwidth=[0.02, 0.11]) - ) - - close= [ np.allclose(kde_copula['bivariate_KDE_x1'], - self.wdrt_copulas['bivariate_KDE_x1']), - np.allclose(kde_copula['bivariate_KDE_x2'], - self.wdrt_copulas['bivariate_KDE_x2']), - np.allclose(log_kde_copula['bivariate_KDE_log_x1'], - self.wdrt_copulas['bivariate_KDE_log_x1']), - np.allclose(log_kde_copula['bivariate_KDE_log_x2'], - self.wdrt_copulas['bivariate_KDE_log_x2'])] + kde_copula = wave.contours.environmental_contours( + self.wdrt_Hm0, + self.wdrt_Te, + self.wdrt_dt, + self.wdrt_period, + method=["bivariate_KDE"], + bandwidth=[0.23, 0.23], + ) + log_kde_copula = wave.contours.environmental_contours( + self.wdrt_Hm0, + self.wdrt_Te, + self.wdrt_dt, + self.wdrt_period, + method=["bivariate_KDE_log"], + bandwidth=[0.02, 0.11], + ) + + close = [ + np.allclose( + kde_copula["bivariate_KDE_x1"], self.wdrt_copulas["bivariate_KDE_x1"] + ), + np.allclose( + kde_copula["bivariate_KDE_x2"], self.wdrt_copulas["bivariate_KDE_x2"] + ), + np.allclose( + log_kde_copula["bivariate_KDE_log_x1"], + self.wdrt_copulas["bivariate_KDE_log_x1"], + ), + np.allclose( + log_kde_copula["bivariate_KDE_log_x2"], + 
self.wdrt_copulas["bivariate_KDE_log_x2"], + ), + ] self.assertTrue(all(close)) def test_samples_contours(self): @@ -243,30 +547,39 @@ def test_samples_contours(self): hs_samples_0 = np.array([8.56637939, 9.27612515, 8.70427774]) hs_contour = np.array(self.wdrt_copulas["gaussian_x1"]) te_contour = np.array(self.wdrt_copulas["gaussian_x2"]) - hs_samples = wave.contours.samples_contour( - te_samples, te_contour, hs_contour) + hs_samples = wave.contours.samples_contour(te_samples, te_contour, hs_contour) assert_allclose(hs_samples, hs_samples_0) def test_samples_seastate(self): - hs_0 = np.array([5.91760129, 4.55185088, 1.41144991, 12.64443154, - 7.89753791, 0.93890797]) - te_0 = np.array([14.24199604, 8.25383556, 6.03901866, 16.9836369, - 9.51967777, 3.46969355]) - w_0 = np.array([2.18127398e-01, 2.18127398e-01, 2.18127398e-01, - 2.45437862e-07, 2.45437862e-07, 2.45437862e-07]) - - df = self.Hm0Te[self.Hm0Te['Hm0'] < 20] - dt_ss = (self.Hm0Te.index[2]-self.Hm0Te.index[1]).seconds + hs_0 = np.array( + [5.91760129, 4.55185088, 1.41144991, 12.64443154, 7.89753791, 0.93890797] + ) + te_0 = np.array( + [14.24199604, 8.25383556, 6.03901866, 16.9836369, 9.51967777, 3.46969355] + ) + w_0 = np.array( + [ + 2.18127398e-01, + 2.18127398e-01, + 2.18127398e-01, + 2.45437862e-07, + 2.45437862e-07, + 2.45437862e-07, + ] + ) + + df = self.Hm0Te[self.Hm0Te["Hm0"] < 20] + dt_ss = (self.Hm0Te.index[2] - self.Hm0Te.index[1]).seconds points_per_interval = 3 return_periods = np.array([50, 100]) np.random.seed(0) hs, te, w = wave.contours.samples_full_seastate( - df.Hm0.values, df.Te.values, points_per_interval, return_periods, - dt_ss) + df.Hm0.values, df.Te.values, points_per_interval, return_periods, dt_ss + ) assert_allclose(hs, hs_0) assert_allclose(te, te_0) assert_allclose(w, w_0) -if __name__ == '__main__': +if __name__ == "__main__": unittest.main() diff --git a/mhkit/tests/wave/test_performance.py b/mhkit/tests/wave/test_performance.py index f4bc2a566..b8fce7cb8 100644 --- 
a/mhkit/tests/wave/test_performance.py +++ b/mhkit/tests/wave/test_performance.py @@ -1,130 +1,147 @@ from os.path import abspath, dirname, join, isfile, normpath, relpath -from pandas.testing import assert_frame_equal -from numpy.testing import assert_allclose -from scipy.interpolate import interp1d -from random import seed, randint import matplotlib.pylab as plt -from datetime import datetime import xarray.testing as xrt import mhkit.wave as wave -from io import StringIO import pandas as pd import numpy as np -import contextlib import unittest -import netCDF4 -import inspect -import pickle -import time -import json -import sys import os testdir = dirname(abspath(__file__)) -plotdir = join(testdir, 'plots') +plotdir = join(testdir, "plots") isdir = os.path.isdir(plotdir) -if not isdir: os.mkdir(plotdir) -datadir = normpath(join(testdir,relpath('../../../examples/data/wave'))) +if not isdir: + os.mkdir(plotdir) +datadir = normpath(join(testdir, relpath("../../../examples/data/wave"))) class TestPerformance(unittest.TestCase): - @classmethod def setUpClass(self): np.random.seed(123) Hm0 = np.random.rayleigh(4, 100000) - Te = np.random.normal(4.5, .8, 100000) + Te = np.random.normal(4.5, 0.8, 100000) P = np.random.normal(200, 40, 100000) J = np.random.normal(300, 10, 100000) - ndbc_data_file = join(datadir,'data.txt') + ndbc_data_file = join(datadir, "data.txt") [raw_ndbc_data, meta] = wave.io.ndbc.read_file(ndbc_data_file) self.S = raw_ndbc_data.T - self.data = pd.DataFrame({'Hm0': Hm0, 'Te': Te, 'P': P,'J': J}) - self.Hm0_bins = np.arange(0,19,0.5) - self.Te_bins = np.arange(0,9,1) - self.expected_stats = ["mean","std","median","count","sum","min","max","freq"] + self.data = pd.DataFrame({"Hm0": Hm0, "Te": Te, "P": P, "J": J}) + self.Hm0_bins = np.arange(0, 19, 0.5) + self.Te_bins = np.arange(0, 9, 1) + self.expected_stats = [ + "mean", + "std", + "median", + "count", + "sum", + "min", + "max", + "freq", + ] @classmethod def tearDownClass(self): pass def 
test_capture_length(self): - L = wave.performance.capture_length(self.data['P'], self.data['J']) + L = wave.performance.capture_length(self.data["P"], self.data["J"]) L_stats = wave.performance.statistics(L) - self.assertAlmostEqual(L_stats['mean'], 0.6676, 3) + self.assertAlmostEqual(L_stats["mean"], 0.6676, 3) def test_capture_length_matrix(self): - L = wave.performance.capture_length(self.data['P'], self.data['J']) - LM = wave.performance.capture_length_matrix(self.data['Hm0'], self.data['Te'], - L, 'std', self.Hm0_bins, self.Te_bins) + L = wave.performance.capture_length(self.data["P"], self.data["J"]) + LM = wave.performance.capture_length_matrix( + self.data["Hm0"], self.data["Te"], L, "std", self.Hm0_bins, self.Te_bins + ) - self.assertEqual(LM.shape, (38,9)) + self.assertEqual(LM.shape, (38, 9)) self.assertEqual(LM.isna().sum().sum(), 131) def test_wave_energy_flux_matrix(self): - JM = wave.performance.wave_energy_flux_matrix(self.data['Hm0'], self.data['Te'], - self.data['J'], 'mean', self.Hm0_bins, self.Te_bins) - - self.assertEqual(JM.shape, (38,9)) + JM = wave.performance.wave_energy_flux_matrix( + self.data["Hm0"], + self.data["Te"], + self.data["J"], + "mean", + self.Hm0_bins, + self.Te_bins, + ) + + self.assertEqual(JM.shape, (38, 9)) self.assertEqual(JM.isna().sum().sum(), 131) def test_power_matrix(self): - L = wave.performance.capture_length(self.data['P'], self.data['J']) - LM = wave.performance.capture_length_matrix(self.data['Hm0'], self.data['Te'], - L, 'mean', self.Hm0_bins, self.Te_bins) - JM = wave.performance.wave_energy_flux_matrix(self.data['Hm0'], self.data['Te'], - self.data['J'], 'mean', self.Hm0_bins, self.Te_bins) + L = wave.performance.capture_length(self.data["P"], self.data["J"]) + LM = wave.performance.capture_length_matrix( + self.data["Hm0"], self.data["Te"], L, "mean", self.Hm0_bins, self.Te_bins + ) + JM = wave.performance.wave_energy_flux_matrix( + self.data["Hm0"], + self.data["Te"], + self.data["J"], + "mean", + 
self.Hm0_bins, + self.Te_bins, + ) PM = wave.performance.power_matrix(LM, JM) - self.assertEqual(PM.shape, (38,9)) + self.assertEqual(PM.shape, (38, 9)) self.assertEqual(PM.isna().sum().sum(), 131) def test_mean_annual_energy_production(self): - L = wave.performance.capture_length(self.data['P'], self.data['J']) - maep = wave.performance.mean_annual_energy_production_timeseries(L, self.data['J']) + L = wave.performance.capture_length(self.data["P"], self.data["J"]) + maep = wave.performance.mean_annual_energy_production_timeseries( + L, self.data["J"] + ) self.assertAlmostEqual(maep, 1754020.077, 2) - def test_plot_matrix(self): - filename = abspath(join(plotdir, 'wave_plot_matrix.png')) + filename = abspath(join(plotdir, "wave_plot_matrix.png")) if isfile(filename): os.remove(filename) - M = wave.performance.wave_energy_flux_matrix(self.data['Hm0'], self.data['Te'], - self.data['J'], 'mean', self.Hm0_bins, self.Te_bins) + M = wave.performance.wave_energy_flux_matrix( + self.data["Hm0"], + self.data["Te"], + self.data["J"], + "mean", + self.Hm0_bins, + self.Te_bins, + ) plt.figure() wave.graphics.plot_matrix(M) - plt.savefig(filename, format='png') + plt.savefig(filename, format="png") plt.close() self.assertTrue(isfile(filename)) def test_powerperformance_workflow(self): - filename = abspath(join(plotdir, 'Capture Length Matrix mean.png')) + filename = abspath(join(plotdir, "Capture Length Matrix mean.png")) if isfile(filename): os.remove(filename) - P = pd.Series(np.random.normal(200, 40, 743),index = self.S.columns) - statistic = ['mean'] + P = pd.Series(np.random.normal(200, 40, 743), index=self.S.columns) + statistic = ["mean"] savepath = plotdir show_values = True h = 60 expected = 401239.4822345051 - x = self.S.T - CM,MAEP = wave.performance.power_performance_workflow(self.S, h, - P, statistic, savepath=savepath, show_values=show_values) + CM, MAEP = wave.performance.power_performance_workflow( + self.S, h, P, statistic, savepath=savepath, 
show_values=show_values + ) self.assertTrue(isfile(filename)) - self.assertEqual(list(CM.data_vars),self.expected_stats) + self.assertEqual(list(CM.data_vars), self.expected_stats) - error = (expected-MAEP)/expected # SSE + error = (expected - MAEP) / expected # SSE self.assertLess(error, 1e-6) -if __name__ == '__main__': +if __name__ == "__main__": unittest.main() diff --git a/mhkit/tests/wave/test_resource_metrics.py b/mhkit/tests/wave/test_resource_metrics.py index e927a6157..9cdf589fc 100644 --- a/mhkit/tests/wave/test_resource_metrics.py +++ b/mhkit/tests/wave/test_resource_metrics.py @@ -9,6 +9,7 @@ import mhkit.wave as wave from io import StringIO import pandas as pd +import xarray as xr import numpy as np import contextlib import unittest @@ -22,64 +23,65 @@ testdir = dirname(abspath(__file__)) -plotdir = join(testdir, 'plots') +plotdir = join(testdir, "plots") isdir = os.path.isdir(plotdir) -if not isdir: os.mkdir(plotdir) -datadir = normpath(join(testdir,relpath('../../../examples/data/wave'))) +if not isdir: + os.mkdir(plotdir) +datadir = normpath(join(testdir, relpath("../../../examples/data/wave"))) class TestResourceMetrics(unittest.TestCase): - @classmethod def setUpClass(self): - omega = np.arange(0.1,3.5,0.01) - self.f = omega/(2*np.pi) + omega = np.arange(0.1, 3.5, 0.01) + self.f = omega / (2 * np.pi) self.Hs = 2.5 self.Tp = 8 - file_name = join(datadir, 'ValData1.json') + file_name = join(datadir, "ValData1.json") with open(file_name, "r") as read_file: self.valdata1 = pd.DataFrame(json.load(read_file)) self.valdata2 = {} - file_name = join(datadir, 'ValData2_MC.json') + file_name = join(datadir, "ValData2_MC.json") with open(file_name, "r") as read_file: data = json.load(read_file) - self.valdata2['MC'] = data + self.valdata2["MC"] = data for i in data.keys(): # Calculate elevation spectra - elevation = pd.DataFrame(data[i]['elevation']) + elevation = pd.DataFrame(data[i]["elevation"]) elevation.index = elevation.index.astype(float) 
elevation.sort_index(inplace=True) - sample_rate = data[i]['sample_rate'] - NFFT = data[i]['NFFT'] - self.valdata2['MC'][i]['S'] = wave.resource.elevation_spectrum(elevation, - sample_rate, NFFT) + sample_rate = data[i]["sample_rate"] + NFFT = data[i]["NFFT"] + self.valdata2["MC"][i]["S"] = wave.resource.elevation_spectrum( + elevation, sample_rate, NFFT + ) - file_name = join(datadir, 'ValData2_AH.json') + file_name = join(datadir, "ValData2_AH.json") with open(file_name, "r") as read_file: data = json.load(read_file) - self.valdata2['AH'] = data + self.valdata2["AH"] = data for i in data.keys(): # Calculate elevation spectra - elevation = pd.DataFrame(data[i]['elevation']) + elevation = pd.DataFrame(data[i]["elevation"]) elevation.index = elevation.index.astype(float) elevation.sort_index(inplace=True) - sample_rate = data[i]['sample_rate'] - NFFT = data[i]['NFFT'] - self.valdata2['AH'][i]['S'] = wave.resource.elevation_spectrum(elevation, - sample_rate, NFFT) + sample_rate = data[i]["sample_rate"] + NFFT = data[i]["NFFT"] + self.valdata2["AH"][i]["S"] = wave.resource.elevation_spectrum( + elevation, sample_rate, NFFT + ) - file_name = join(datadir, 'ValData2_CDiP.json') + file_name = join(datadir, "ValData2_CDiP.json") with open(file_name, "r") as read_file: data = json.load(read_file) - self.valdata2['CDiP'] = data + self.valdata2["CDiP"] = data for i in data.keys(): - temp = pd.Series(data[i]['S']).to_frame('S') + temp = pd.Series(data[i]["S"]).to_frame("S") temp.index = temp.index.astype(float) - self.valdata2['CDiP'][i]['S'] = temp - + self.valdata2["CDiP"][i]["S"] = temp @classmethod def tearDownClass(self): @@ -87,14 +89,14 @@ def tearDownClass(self): def test_kfromw(self): for i in self.valdata1.columns: - f = np.array(self.valdata1[i]['w'])/(2*np.pi) - h = self.valdata1[i]['h'] - rho = self.valdata1[i]['rho'] + f = np.array(self.valdata1[i]["w"]) / (2 * np.pi) + h = self.valdata1[i]["h"] + rho = self.valdata1[i]["rho"] - expected = self.valdata1[i]['k'] 
+ expected = self.valdata1[i]["k"] k = wave.resource.wave_number(f, h, rho) - calculated = k.loc[:,'k'].values - error = ((expected-calculated)**2).sum() # SSE + calculated = k.loc[:, "k"].values + error = ((expected - calculated) ** 2).sum() # SSE self.assertLess(error, 1e-6) @@ -102,105 +104,125 @@ def test_kfromw_one_freq(self): g = 9.81 f = 0.1 h = 1e9 - w = np.pi*2*f # deep water dispersion + w = np.pi * 2 * f # deep water dispersion expected = w**2 / g calculated = wave.resource.wave_number(f=f, h=h, g=g).values[0][0] - error = np.abs(expected-calculated) + error = np.abs(expected - calculated) self.assertLess(error, 1e-6) def test_wave_length(self): - k_list=[1,2,10,3] - l_expected = (2.*np.pi/np.array(k_list)).tolist() + k_array = np.asarray([1.0, 2.0, 10.0, 3.0]) - k_df = pd.DataFrame(k_list,index = [1,2,3,4]) - k_series= k_df[0] - k_array=np.array(k_list) + k_int = int(k_array[0]) + k_float = k_array[0] + k_df = pd.DataFrame(k_array, index=[1, 2, 3, 4]) + k_series = k_df[0] - for l in [k_list, k_df, k_series, k_array]: + for l in [k_array, k_int, k_float, k_df, k_series]: l_calculated = wave.resource.wave_length(l) - self.assertListEqual(l_expected,l_calculated.tolist()) - - idx=0 - k_int = k_list[idx] - l_calculated = wave.resource.wave_length(k_int) - self.assertEqual(l_expected[idx],l_calculated) + self.assertTrue(np.all(2.0 * np.pi / l == l_calculated)) def test_depth_regime(self): - expected = [True,True,False,True] - l_list=[1,2,10,3] - l_df = pd.DataFrame(l_list,index = [1,2,3,4]) - l_series= l_df[0] - l_array=np.array(l_list) h = 10 - for l in [l_list, l_df, l_series, l_array]: - calculated = wave.resource.depth_regime(l,h) - self.assertListEqual(expected,calculated.tolist()) - - idx=0 - l_int = l_list[idx] - calculated = wave.resource.depth_regime(l_int,h) - self.assertEqual(expected[idx],calculated) + # non-array like formats + l_int = 1 + l_float = 1.0 + expected = True + for l in [l_int, l_float]: + calculated = wave.resource.depth_regime(l, 
h) + self.assertTrue(np.all(expected == calculated)) + + # array-like formats + l_array = np.array([1, 2, 10, 3]) + l_df = pd.DataFrame(l_array, index=[1, 2, 3, 4]) + l_series = l_df[0] + l_da = xr.DataArray(l_series) + l_da.name = "data" + l_ds = l_da.to_dataset() + expected = [True, True, False, True] + for l in [l_array, l_series, l_da, l_ds]: + calculated = wave.resource.depth_regime(l, h) + self.assertTrue(np.all(expected == calculated)) + + # special formatting for pd.DataFrame + for l in [l_df]: + calculated = wave.resource.depth_regime(l, h) + self.assertTrue(np.all(expected == calculated[0])) def test_wave_celerity(self): # Depth regime ratio - dr_ratio=2 + dr_ratio = 2 # small change in f will give similar value cg - f=np.linspace(20.0001,20.0005,5) + f = np.linspace(20.0001, 20.0005, 5) # Choose index to spike at. cg spike is inversly proportional to k - k_idx=2 - k_tmp=[1, 1, 0.5, 1, 1] + k_idx = 2 + k_tmp = [1, 1, 0.5, 1, 1] k = pd.DataFrame(k_tmp, index=f) # all shallow - cg_shallow1 = wave.resource.wave_celerity(k, h=0.0001,depth_check=True) - cg_shallow2 = wave.resource.wave_celerity(k, h=0.0001,depth_check=False) - self.assertTrue(all(cg_shallow1.squeeze().values == - cg_shallow2.squeeze().values)) - + cg_shallow1 = wave.resource.wave_celerity(k, h=0.0001, depth_check=True) + cg_shallow2 = wave.resource.wave_celerity(k, h=0.0001, depth_check=False) + self.assertTrue( + all(cg_shallow1.squeeze().values == cg_shallow2.squeeze().values) + ) # all deep - cg = wave.resource.wave_celerity(k, h=1000,depth_check=True) - self.assertTrue(all(np.pi*f/k.squeeze().values == cg.squeeze().values)) + cg = wave.resource.wave_celerity(k, h=1000, depth_check=True) + self.assertTrue(all(np.pi * f / k.squeeze().values == cg.squeeze().values)) def test_energy_flux_deep(self): - # Dependent on mhkit.resource.BS spectrum - S = wave.resource.jonswap_spectrum(self.f,self.Tp,self.Hs) + S = wave.resource.jonswap_spectrum(self.f, self.Tp, self.Hs) Te = 
wave.resource.energy_period(S) Hm0 = wave.resource.significant_wave_height(S) - rho=1025 - g=9.80665 - coeff = rho*(g**2)/(64*np.pi) - J = coeff*(Hm0.squeeze()**2)*Te.squeeze() - h=-1 # not used when deep=True + rho = 1025 + g = 9.80665 + coeff = rho * (g**2) / (64 * np.pi) + J = coeff * (Hm0.squeeze() ** 2) * Te.squeeze() + + h = -1 # not used when deep=True J_calc = wave.resource.energy_flux(S, h, deep=True) self.assertTrue(J_calc.squeeze() == J) + def test_energy_flux_shallow(self): + S = wave.resource.jonswap_spectrum(self.f, self.Tp, self.Hs) + Te = wave.resource.energy_period(S) + Hm0 = wave.resource.significant_wave_height(S) + + rho = 1025 + g = 9.80665 + coeff = rho * (g**2) / (64 * np.pi) + J = coeff * (Hm0.squeeze() ** 2) * Te.squeeze() + + h = 1000 # effectively deep but without assumptions + J_calc = wave.resource.energy_flux(S, h, deep=False) + err = np.abs(J_calc.squeeze() - J) + self.assertLess(err, 1e-6) def test_moments(self): - for file_i in self.valdata2.keys(): # for each file MC, AH, CDiP + for file_i in self.valdata2.keys(): # for each file MC, AH, CDiP datasets = self.valdata2[file_i] - for s in datasets.keys(): # for each set + for s in datasets.keys(): # for each set data = datasets[s] - for m in data['m'].keys(): - expected = data['m'][m] - S = data['S'] - if s == 'CDiP1' or s == 'CDiP6': - f_bins=pd.Series(data['freqBinWidth']) + for m in data["m"].keys(): + expected = data["m"][m] + S = data["S"] + if s == "CDiP1" or s == "CDiP6": + f_bins = pd.Series(data["freqBinWidth"]) else: f_bins = None - calculated = wave.resource.frequency_moment(S, int(m) - ,frequency_bins=f_bins).iloc[0,0] - error = np.abs(expected-calculated)/expected + calculated = wave.resource.frequency_moment( + S, int(m), frequency_bins=f_bins + ).iloc[0, 0] + error = np.abs(expected - calculated) / expected self.assertLess(error, 0.01) - def test_energy_period_to_peak_period(self): # This test checks that if we perform the # Te to Tp conversion, we create a spectrum @@ 
-218,164 +240,172 @@ def test_energy_period_to_peak_period(self): Te_calc = wave.resource.energy_period(S).values[0][0] - error = np.abs(T - Te_calc)/Te_calc + error = np.abs(T - Te_calc) / Te_calc self.assertLess(error, 0.01) - def test_metrics(self): - for file_i in self.valdata2.keys(): # for each file MC, AH, CDiP + for file_i in self.valdata2.keys(): # for each file MC, AH, CDiP datasets = self.valdata2[file_i] - for s in datasets.keys(): # for each set - - + for s in datasets.keys(): # for each set data = datasets[s] - S = data['S'] - if file_i == 'CDiP': - f_bins=pd.Series(data['freqBinWidth']) + S = data["S"] + if file_i == "CDiP": + f_bins = pd.Series(data["freqBinWidth"]) else: f_bins = None # Hm0 - expected = data['metrics']['Hm0'] - calculated = wave.resource.significant_wave_height(S, - frequency_bins=f_bins).iloc[0,0] - error = np.abs(expected-calculated)/expected - #print('Hm0', expected, calculated, error) + expected = data["metrics"]["Hm0"] + calculated = wave.resource.significant_wave_height( + S, frequency_bins=f_bins + ).iloc[0, 0] + error = np.abs(expected - calculated) / expected + # print('Hm0', expected, calculated, error) self.assertLess(error, 0.01) # Te - expected = data['metrics']['Te'] - calculated = wave.resource.energy_period(S, - frequency_bins=f_bins).iloc[0,0] - error = np.abs(expected-calculated)/expected - #print('Te', expected, calculated, error) + expected = data["metrics"]["Te"] + calculated = wave.resource.energy_period(S, frequency_bins=f_bins).iloc[ + 0, 0 + ] + error = np.abs(expected - calculated) / expected + # print('Te', expected, calculated, error) self.assertLess(error, 0.01) # T0 - expected = data['metrics']['T0'] - calculated = wave.resource.average_zero_crossing_period(S, - frequency_bins=f_bins).iloc[0,0] - error = np.abs(expected-calculated)/expected - #print('T0', expected, calculated, error) + expected = data["metrics"]["T0"] + calculated = wave.resource.average_zero_crossing_period( + S, frequency_bins=f_bins 
+ ).iloc[0, 0] + error = np.abs(expected - calculated) / expected + # print('T0', expected, calculated, error) self.assertLess(error, 0.01) # Tc - expected = data['metrics']['Tc'] - calculated = wave.resource.average_crest_period(S, - # Tc = Tavg**2 - frequency_bins=f_bins).iloc[0,0]**2 - error = np.abs(expected-calculated)/expected - #print('Tc', expected, calculated, error) + expected = data["metrics"]["Tc"] + calculated = ( + wave.resource.average_crest_period( + S, + # Tc = Tavg**2 + frequency_bins=f_bins, + ).iloc[0, 0] + ** 2 + ) + error = np.abs(expected - calculated) / expected + # print('Tc', expected, calculated, error) self.assertLess(error, 0.01) # Tm - expected = np.sqrt(data['metrics']['Tm']) - calculated = wave.resource.average_wave_period(S, - frequency_bins=f_bins).iloc[0,0] - error = np.abs(expected-calculated)/expected - #print('Tm', expected, calculated, error) + expected = np.sqrt(data["metrics"]["Tm"]) + calculated = wave.resource.average_wave_period( + S, frequency_bins=f_bins + ).iloc[0, 0] + error = np.abs(expected - calculated) / expected + # print('Tm', expected, calculated, error) self.assertLess(error, 0.01) # Tp - expected = data['metrics']['Tp'] - calculated = wave.resource.peak_period(S).iloc[0,0] - error = np.abs(expected-calculated)/expected - #print('Tp', expected, calculated, error) + expected = data["metrics"]["Tp"] + calculated = wave.resource.peak_period(S).iloc[0, 0] + error = np.abs(expected - calculated) / expected + # print('Tp', expected, calculated, error) self.assertLess(error, 0.001) # e - expected = data['metrics']['e'] - calculated = wave.resource.spectral_bandwidth(S, - frequency_bins=f_bins).iloc[0,0] - error = np.abs(expected-calculated)/expected - #print('e', expected, calculated, error) + expected = data["metrics"]["e"] + calculated = wave.resource.spectral_bandwidth( + S, frequency_bins=f_bins + ).iloc[0, 0] + error = np.abs(expected - calculated) / expected + # print('e', expected, calculated, error) 
self.assertLess(error, 0.001) # J - if file_i != 'CDiP': - for i,j in zip(data['h'],data['J']): - expected = data['J'][j] - calculated = wave.resource.energy_flux(S,i) - error = np.abs(expected-calculated.values)/expected + if file_i != "CDiP": + for i, j in zip(data["h"], data["J"]): + expected = data["J"][j] + calculated = wave.resource.energy_flux(S, i) + error = np.abs(expected - calculated.values) / expected self.assertLess(error, 0.1) # v - if file_i == 'CDiP': + if file_i == "CDiP": # this should be updated to run on other datasets - expected = data['metrics']['v'] - calculated = wave.resource.spectral_width(S, - frequency_bins=f_bins).iloc[0,0] - error = np.abs(expected-calculated)/expected + expected = data["metrics"]["v"] + calculated = wave.resource.spectral_width( + S, frequency_bins=f_bins + ).iloc[0, 0] + error = np.abs(expected - calculated) / expected self.assertLess(error, 0.01) - if file_i == 'MC': - expected = data['metrics']['v'] + if file_i == "MC": + expected = data["metrics"]["v"] # testing that default uniform frequency bin widths works - calculated = wave.resource.spectral_width(S).iloc[0,0] - error = np.abs(expected-calculated)/expected + calculated = wave.resource.spectral_width(S).iloc[0, 0] + error = np.abs(expected - calculated) / expected self.assertLess(error, 0.01) - def test_plot_elevation_timeseries(self): - filename = abspath(join(plotdir, 'wave_plot_elevation_timeseries.png')) + filename = abspath(join(plotdir, "wave_plot_elevation_timeseries.png")) if isfile(filename): os.remove(filename) - data = self.valdata2['MC'] - temp = pd.DataFrame(data[list(data.keys())[0]]['elevation']) + data = self.valdata2["MC"] + temp = pd.DataFrame(data[list(data.keys())[0]]["elevation"]) temp.index = temp.index.astype(float) temp.sort_index(inplace=True) - eta = temp.iloc[0:100,:] + eta = temp.iloc[0:100, :] plt.figure() wave.graphics.plot_elevation_timeseries(eta) - plt.savefig(filename, format='png') + plt.savefig(filename, format="png") 
plt.close() self.assertTrue(isfile(filename)) -class TestPlotResouceCharacterizations(unittest.TestCase): +class TestPlotResouceCharacterizations(unittest.TestCase): @classmethod def setUpClass(self): - f_name= 'Hm0_Te_46022.json' - self.Hm0Te = pd.read_json(join(datadir,f_name)) + f_name = "Hm0_Te_46022.json" + self.Hm0Te = pd.read_json(join(datadir, f_name)) + @classmethod def tearDownClass(self): pass - def test_plot_avg_annual_energy_matrix(self): - filename = abspath(join(plotdir, 'avg_annual_scatter_table.png')) + def test_plot_avg_annual_energy_matrix(self): + filename = abspath(join(plotdir, "avg_annual_scatter_table.png")) if isfile(filename): os.remove(filename) Hm0Te = self.Hm0Te Hm0Te.drop(Hm0Te[Hm0Te.Hm0 > 20].index, inplace=True) - J = np.random.random(len(Hm0Te))*100 + J = np.random.random(len(Hm0Te)) * 100 plt.figure() - fig = wave.graphics.plot_avg_annual_energy_matrix(Hm0Te.Hm0, - Hm0Te.Te, J, Hm0_bin_size=0.5, Te_bin_size=1) - plt.savefig(filename, format='png') + fig = wave.graphics.plot_avg_annual_energy_matrix( + Hm0Te.Hm0, Hm0Te.Te, J, Hm0_bin_size=0.5, Te_bin_size=1 + ) + plt.savefig(filename, format="png") plt.close() self.assertTrue(isfile(filename)) def test_plot_monthly_cumulative_distribution(self): - - filename = abspath(join(plotdir, 'monthly_cumulative_distribution.png')) + filename = abspath(join(plotdir, "monthly_cumulative_distribution.png")) if isfile(filename): os.remove(filename) - a = pd.date_range(start='1/1/2010', periods=10000, freq='h') - S = pd.Series(np.random.random(len(a)) , index=a) - ax=wave.graphics.monthly_cumulative_distribution(S) - plt.savefig(filename, format='png') + a = pd.date_range(start="1/1/2010", periods=10000, freq="h") + S = pd.Series(np.random.random(len(a)), index=a) + ax = wave.graphics.monthly_cumulative_distribution(S) + plt.savefig(filename, format="png") plt.close() self.assertTrue(isfile(filename)) -if __name__ == '__main__': +if __name__ == "__main__": unittest.main() diff --git 
a/mhkit/tests/wave/test_resource_spectrum.py b/mhkit/tests/wave/test_resource_spectrum.py index 30e4e3c4e..4907a5638 100644 --- a/mhkit/tests/wave/test_resource_spectrum.py +++ b/mhkit/tests/wave/test_resource_spectrum.py @@ -2,34 +2,24 @@ from pandas.testing import assert_frame_equal from numpy.testing import assert_allclose from scipy.interpolate import interp1d -from random import seed, randint import matplotlib.pylab as plt -from datetime import datetime -import xarray.testing as xrt +import xarray as xr import mhkit.wave as wave -from io import StringIO import pandas as pd import numpy as np -import contextlib import unittest -import netCDF4 -import inspect -import pickle -import time -import json -import sys import os testdir = dirname(abspath(__file__)) -plotdir = join(testdir, 'plots') +plotdir = join(testdir, "plots") isdir = os.path.isdir(plotdir) -if not isdir: os.mkdir(plotdir) -datadir = normpath(join(testdir,relpath('../../../examples/data/wave'))) +if not isdir: + os.mkdir(plotdir) +datadir = normpath(join(testdir, relpath("../../../examples/data/wave"))) class TestResourceSpectrum(unittest.TestCase): - @classmethod def setUpClass(self): Trep = 600 @@ -44,12 +34,12 @@ def tearDownClass(self): pass def test_pierson_moskowitz_spectrum(self): - S = wave.resource.pierson_moskowitz_spectrum(self.f,self.Tp,self.Hs) - Hm0 = wave.resource.significant_wave_height(S).iloc[0,0] - Tp0 = wave.resource.peak_period(S).iloc[0,0] + S = wave.resource.pierson_moskowitz_spectrum(self.f, self.Tp, self.Hs) + Hm0 = wave.resource.significant_wave_height(S).iloc[0, 0] + Tp0 = wave.resource.peak_period(S).iloc[0, 0] - errorHm0 = np.abs(self.Tp - Tp0)/self.Tp - errorTp0 = np.abs(self.Hs - Hm0)/self.Hs + errorHm0 = np.abs(self.Tp - Tp0) / self.Tp + errorTp0 = np.abs(self.Hs - Hm0) / self.Hs self.assertLess(errorHm0, 0.01) self.assertLess(errorTp0, 0.01) @@ -60,18 +50,20 @@ def test_pierson_moskowitz_spectrum_zero_freq(self): f_nonzero = np.arange(df, 1, df) S_zero = 
wave.resource.pierson_moskowitz_spectrum(f_zero, self.Tp, self.Hs) - S_nonzero = wave.resource.pierson_moskowitz_spectrum(f_nonzero, self.Tp, self.Hs) + S_nonzero = wave.resource.pierson_moskowitz_spectrum( + f_nonzero, self.Tp, self.Hs + ) self.assertEqual(S_zero.values.squeeze()[0], 0.0) self.assertGreater(S_nonzero.values.squeeze()[0], 0.0) def test_jonswap_spectrum(self): S = wave.resource.jonswap_spectrum(self.f, self.Tp, self.Hs) - Hm0 = wave.resource.significant_wave_height(S).iloc[0,0] - Tp0 = wave.resource.peak_period(S).iloc[0,0] + Hm0 = wave.resource.significant_wave_height(S).iloc[0, 0] + Tp0 = wave.resource.peak_period(S).iloc[0, 0] - errorHm0 = np.abs(self.Tp - Tp0)/self.Tp - errorTp0 = np.abs(self.Hs - Hm0)/self.Hs + errorHm0 = np.abs(self.Tp - Tp0) / self.Tp + errorTp0 = np.abs(self.Hs - Hm0) / self.Hs self.assertLess(errorHm0, 0.01) self.assertLess(errorTp0, 0.01) @@ -87,31 +79,36 @@ def test_jonswap_spectrum_zero_freq(self): self.assertEqual(S_zero.values.squeeze()[0], 0.0) self.assertGreater(S_nonzero.values.squeeze()[0], 0.0) - def test_surface_elevation_phases_np_and_pd(self): - S0 = wave.resource.jonswap_spectrum(self.f,self.Tp,self.Hs) - S1 = wave.resource.jonswap_spectrum(self.f,self.Tp,self.Hs*1.1) + def test_surface_elevation_phases_xr_and_pd(self): + S0 = wave.resource.jonswap_spectrum(self.f, self.Tp, self.Hs) + S1 = wave.resource.jonswap_spectrum(self.f, self.Tp, self.Hs * 1.1) S = pd.concat([S0, S1], axis=1) phases_np = np.random.rand(S.shape[0], S.shape[1]) * 2 * np.pi phases_pd = pd.DataFrame(phases_np, index=S.index, columns=S.columns) + phases_xr = xr.Dataset(phases_pd) - eta_np = wave.resource.surface_elevation(S, self.t, phases=phases_np, seed=1) + eta_xr = wave.resource.surface_elevation(S, self.t, phases=phases_xr, seed=1) eta_pd = wave.resource.surface_elevation(S, self.t, phases=phases_pd, seed=1) - assert_frame_equal(eta_np, eta_pd) + assert_frame_equal(eta_xr, eta_pd) def 
test_surface_elevation_frequency_bins_np_and_pd(self): - S0 = wave.resource.jonswap_spectrum(self.f,self.Tp,self.Hs) - S1 = wave.resource.jonswap_spectrum(self.f,self.Tp,self.Hs*1.1) + S0 = wave.resource.jonswap_spectrum(self.f, self.Tp, self.Hs) + S1 = wave.resource.jonswap_spectrum(self.f, self.Tp, self.Hs * 1.1) S = pd.concat([S0, S1], axis=1) eta0 = wave.resource.surface_elevation(S, self.t, seed=1) - f_bins_np = np.array([np.diff(S.index)[0]]*len(S)) - f_bins_pd = pd.DataFrame(f_bins_np, index=S.index, columns=['df']) + f_bins_np = np.array([np.diff(S.index)[0]] * len(S)) + f_bins_pd = pd.DataFrame(f_bins_np, index=S.index, columns=["df"]) - eta_np = wave.resource.surface_elevation(S, self.t, frequency_bins=f_bins_np, seed=1) - eta_pd = wave.resource.surface_elevation(S, self.t, frequency_bins=f_bins_pd, seed=1) + eta_np = wave.resource.surface_elevation( + S, self.t, frequency_bins=f_bins_np, seed=1 + ) + eta_pd = wave.resource.surface_elevation( + S, self.t, frequency_bins=f_bins_pd, seed=1 + ) assert_frame_equal(eta0, eta_np) assert_frame_equal(eta_np, eta_pd) @@ -120,19 +117,19 @@ def test_surface_elevation_moments(self): S = wave.resource.jonswap_spectrum(self.f, self.Tp, self.Hs) eta = wave.resource.surface_elevation(S, self.t, seed=1) dt = self.t[1] - self.t[0] - Sn = wave.resource.elevation_spectrum(eta, 1/dt, len(eta.values), - detrend=False, window='boxcar', - noverlap=0) + Sn = wave.resource.elevation_spectrum( + eta, 1 / dt, len(eta.values), detrend=False, window="boxcar", noverlap=0 + ) - m0 = wave.resource.frequency_moment(S,0).m0.values[0] - m0n = wave.resource.frequency_moment(Sn,0).m0.values[0] - errorm0 = np.abs((m0 - m0n)/m0) + m0 = wave.resource.frequency_moment(S, 0).m0.values[0] + m0n = wave.resource.frequency_moment(Sn, 0).m0.values[0] + errorm0 = np.abs((m0 - m0n) / m0) self.assertLess(errorm0, 0.01) - m1 = wave.resource.frequency_moment(S,1).m1.values[0] - m1n = wave.resource.frequency_moment(Sn,1).m1.values[0] - errorm1 = np.abs((m1 - 
m1n)/m1) + m1 = wave.resource.frequency_moment(S, 1).m1.values[0] + m1n = wave.resource.frequency_moment(Sn, 1).m1.values[0] + errorm1 = np.abs((m1 - m1n) / m1) self.assertLess(errorm1, 0.01) @@ -140,40 +137,43 @@ def test_surface_elevation_rmse(self): S = wave.resource.jonswap_spectrum(self.f, self.Tp, self.Hs) eta = wave.resource.surface_elevation(S, self.t, seed=1) dt = self.t[1] - self.t[0] - Sn = wave.resource.elevation_spectrum(eta, 1/dt, len(eta), - detrend=False, window='boxcar', - noverlap=0) + Sn = wave.resource.elevation_spectrum( + eta, 1 / dt, len(eta), detrend=False, window="boxcar", noverlap=0 + ) fSn = interp1d(Sn.index.values, Sn.values, axis=0) - rmse = (S.values - fSn(S.index.values))**2 - rmse_sum = (np.sum(rmse)/len(rmse))**0.5 + Sn_interp = fSn(S.index.values).squeeze() + rmse = (S.values.squeeze() - Sn_interp) ** 2 + rmse_sum = (np.sum(rmse) / len(rmse)) ** 0.5 self.assertLess(rmse_sum, 0.02) def test_ifft_sum_of_sines(self): S = wave.resource.jonswap_spectrum(self.f, self.Tp, self.Hs) - eta_ifft = wave.resource.surface_elevation(S, self.t, seed=1, method='ifft') - eta_sos = wave.resource.surface_elevation(S, self.t, seed=1, method='sum_of_sines') + eta_ifft = wave.resource.surface_elevation(S, self.t, seed=1, method="ifft") + eta_sos = wave.resource.surface_elevation( + S, self.t, seed=1, method="sum_of_sines" + ) - assert_allclose(eta_ifft, eta_sos) + assert_allclose(eta_ifft, eta_sos) def test_plot_spectrum(self): - filename = abspath(join(plotdir, 'wave_plot_spectrum.png')) + filename = abspath(join(plotdir, "wave_plot_spectrum.png")) if isfile(filename): os.remove(filename) - S = wave.resource.pierson_moskowitz_spectrum(self.f,self.Tp,self.Hs) + S = wave.resource.pierson_moskowitz_spectrum(self.f, self.Tp, self.Hs) plt.figure() wave.graphics.plot_spectrum(S) - plt.savefig(filename, format='png') + plt.savefig(filename, format="png") plt.close() self.assertTrue(isfile(filename)) def test_plot_chakrabarti(self): - filename = 
abspath(join(plotdir, 'wave_plot_chakrabarti.png')) + filename = abspath(join(plotdir, "wave_plot_chakrabarti.png")) if isfile(filename): os.remove(filename) @@ -185,7 +185,7 @@ def test_plot_chakrabarti(self): plt.savefig(filename) def test_plot_chakrabarti_np(self): - filename = abspath(join(plotdir, 'wave_plot_chakrabarti_np.png')) + filename = abspath(join(plotdir, "wave_plot_chakrabarti_np.png")) if isfile(filename): os.remove(filename) @@ -199,21 +199,22 @@ def test_plot_chakrabarti_np(self): self.assertTrue(isfile(filename)) def test_plot_chakrabarti_pd(self): - filename = abspath(join(plotdir, 'wave_plot_chakrabarti_pd.png')) + filename = abspath(join(plotdir, "wave_plot_chakrabarti_pd.png")) if isfile(filename): os.remove(filename) D = np.linspace(5, 15, 5) H = 10 * np.ones_like(D) lambda_w = 200 * np.ones_like(D) - df = pd.DataFrame([H.flatten(),lambda_w.flatten(),D.flatten()], - index=['H','lambda_w','D']).transpose() + df = pd.DataFrame( + [H.flatten(), lambda_w.flatten(), D.flatten()], index=["H", "lambda_w", "D"] + ).transpose() wave.graphics.plot_chakrabarti(df.H, df.lambda_w, df.D) plt.savefig(filename) self.assertTrue(isfile(filename)) -if __name__ == '__main__': + +if __name__ == "__main__": unittest.main() - \ No newline at end of file diff --git a/mhkit/tidal/__init__.py b/mhkit/tidal/__init__.py index b669360a6..2644bfdfa 100644 --- a/mhkit/tidal/__init__.py +++ b/mhkit/tidal/__init__.py @@ -1,4 +1,4 @@ from mhkit.tidal import graphics from mhkit.tidal import io -from mhkit.tidal import resource +from mhkit.tidal import resource from mhkit.tidal import performance diff --git a/mhkit/tidal/d3d.py b/mhkit/tidal/d3d.py deleted file mode 100644 index b11aa1569..000000000 --- a/mhkit/tidal/d3d.py +++ /dev/null @@ -1 +0,0 @@ -from mhkit.river.d3d import * \ No newline at end of file diff --git a/mhkit/tidal/graphics.py b/mhkit/tidal/graphics.py index 51459b527..0483f2080 100644 --- a/mhkit/tidal/graphics.py +++ b/mhkit/tidal/graphics.py @@ -1,5 +1,4 
@@ import numpy as np -import pandas as pd import bisect from scipy.interpolate import interpn as _interpn from scipy.interpolate import interp1d @@ -7,6 +6,7 @@ from mhkit.river.resource import exceedance_probability from mhkit.tidal.resource import _histogram, _flood_or_ebb from mhkit.river.graphics import plot_velocity_duration_curve, _xy_plot +from mhkit.utils import convert_to_dataarray def _initialize_polar(ax=None, metadata=None, flood=None, ebb=None): @@ -28,24 +28,32 @@ def _initialize_polar(ax=None, metadata=None, flood=None, ebb=None): fig = plt.figure(figsize=(12, 8)) ax = plt.axes(polar=True) # Angles are measured clockwise from true north - ax.set_theta_zero_location('N') + ax.set_theta_zero_location("N") ax.set_theta_direction(-1) - xticks = ['N', 'NE', 'E', 'SE', 'S', 'SW', 'W', 'NW'] + xticks = ["N", "NE", "E", "SE", "S", "SW", "W", "NW"] # Polar plots do not have minor ticks, insert flood/ebb into major ticks xtickDegrees = [0.0, 45.0, 90.0, 135.0, 180.0, 225.0, 270.0, 315.0] # Set title and metadata box if metadata != None: # Set the Title - plt.title(metadata['name']) + plt.title(metadata["name"]) # List of strings for metadata box - bouy_str = [f'Lat = {float(metadata["lat"]):0.2f}$\degree$', - f'Lon = {float(metadata["lon"]):0.2f}$\degree$'] + bouy_str = [ + f'Lat = {float(metadata["lat"]):0.2f}$\degree$', + f'Lon = {float(metadata["lon"]):0.2f}$\degree$', + ] # Create string for text box - bouy_data = '\n'.join(bouy_str) + bouy_data = "\n".join(bouy_str) # Set the text box - ax.text(-0.3, 0.80, bouy_data, transform=ax.transAxes, fontsize=14, - verticalalignment='top', bbox=dict(facecolor='none', - edgecolor='k', pad=5)) + ax.text( + -0.3, + 0.80, + bouy_data, + transform=ax.transAxes, + fontsize=14, + verticalalignment="top", + bbox=dict(facecolor="none", edgecolor="k", pad=5), + ) # If defined plot flood and ebb directions as major ticks if flood != None: # Get flood direction in degrees @@ -56,7 +64,7 @@ def _initialize_polar(ax=None, 
metadata=None, flood=None, ebb=None): # Get location in list idxFlood = xtickDegrees.index(floodDirection) # Insert label at appropriate location - xticks[idxFlood:idxFlood] = ['\nFlood'] + xticks[idxFlood:idxFlood] = ["\nFlood"] if ebb != None: # Get flood direction in degrees ebbDirection = ebb @@ -66,8 +74,8 @@ def _initialize_polar(ax=None, metadata=None, flood=None, ebb=None): # Get location in list idxEbb = xtickDegrees.index(ebbDirection) # Insert label at appropriate location - xticks[idxEbb:idxEbb] = ['\nEbb'] - ax.set_xticks(np.array(xtickDegrees)*np.pi/180.) + xticks[idxEbb:idxEbb] = ["\nEbb"] + ax.set_xticks(np.array(xtickDegrees) * np.pi / 180.0) ax.set_xticklabels(xticks) return ax @@ -83,37 +91,32 @@ def _check_inputs(directions, velocities, flood, ebb): velocities: array-like Velocities in m/s flood: float - Direction in degrees added to theta ticks + Direction in degrees added to theta ticks ebb: float Direction in degrees added to theta ticks """ - if not isinstance(velocities, (np.ndarray, pd.Series)): - raise TypeError('velocities must be of type np.ndarry or pd.Series') - if isinstance(velocities, np.ndarray): - velocities = pd.Series(velocities) - - if not isinstance(directions, (np.ndarray, pd.Series)): - raise TypeError('directions must be of type np.ndarry or pd.Series') - if isinstance(directions, np.ndarray): - directions = pd.Series(directions) + velocities = convert_to_dataarray(velocities) + directions = convert_to_dataarray(directions) if len(velocities) != len(directions): - raise ValueError('velocities and directions must have the same length') + raise ValueError("velocities and directions must have the same length") if all(np.nan_to_num(velocities.values) < 0): - raise ValueError('All velocities must be positive') - if all(np.nan_to_num(directions.values) < 0) and all(np.nan_to_num(directions.values) > 360): - raise ValueError('directions must be between 0 and 360 degrees') + raise ValueError("All velocities must be positive") + if 
all(np.nan_to_num(directions.values) < 0) and all( + np.nan_to_num(directions.values) > 360 + ): + raise ValueError("directions must be between 0 and 360 degrees") if not isinstance(flood, (int, float, type(None))): - raise TypeError('flood must be of type int or float') + raise TypeError("flood must be of type int or float") if not isinstance(ebb, (int, float, type(None))): - raise TypeError('ebb must be of type int or float') + raise TypeError("ebb must be of type int or float") if flood is not None: if (flood < 0) and (flood > 360): - raise ValueError('flood must be between 0 and 360 degrees') + raise ValueError("flood must be between 0 and 360 degrees") if ebb is not None: if (ebb < 0) and (ebb > 360): - raise ValueError('ebb must be between 0 and 360 degrees') + raise ValueError("ebb must be between 0 and 360 degrees") def plot_rose( @@ -124,10 +127,10 @@ def plot_rose( ax=None, metadata=None, flood=None, - ebb=None + ebb=None, ): """ - Creates a polar histogram. Direction angles from binned histogram must + Creates a polar histogram. Direction angles from binned histogram must be specified such that 0 degrees is north. 
Parameters @@ -136,9 +139,9 @@ def plot_rose( Directions in degrees with 0 degrees specified as true north velocities: array-like Velocities in m/s - width_dir: float + width_dir: float Width of directional bins for histogram in degrees - width_vel: float + width_vel: float Width of velocity bins for histogram in m/s ax: float Polar plot axes to add polar histogram @@ -146,7 +149,7 @@ def plot_rose( If provided needs keys ['name', 'lat', 'lon'] for plot title and information box on plot flood: float - Direction in degrees added to theta ticks + Direction in degrees added to theta ticks ebb: float Direction in degrees added to theta ticks Returns @@ -158,45 +161,50 @@ def plot_rose( _check_inputs(directions, velocities, flood, ebb) if not isinstance(width_dir, (int, float)): - raise TypeError('width_dir must be of type int or float') + raise TypeError("width_dir must be of type int or float") if not isinstance(width_vel, (int, float)): - raise TypeError('width_vel must be of type int or float') + raise TypeError("width_vel must be of type int or float") if width_dir < 0: - raise ValueError('width_dir must be greater than 0') + raise ValueError("width_dir must be greater than 0") if width_vel < 0: - raise ValueError('width_vel must be greater than 0') + raise ValueError("width_vel must be greater than 0") # Calculate the 2D histogram - H, dir_edges, vel_edges = _histogram( - directions, velocities, width_dir, width_vel) + H, dir_edges, vel_edges = _histogram(directions, velocities, width_dir, width_vel) # Determine number of bins dir_bins = H.shape[0] vel_bins = H.shape[1] # Create the angles - thetas = np.arange(0, 2*np.pi, 2*np.pi/dir_bins) + thetas = np.arange(0, 2 * np.pi, 2 * np.pi / dir_bins) # Initialize the polar polt ax = _initialize_polar(ax=ax, metadata=metadata, flood=flood, ebb=ebb) # Set bar color based on wind speed colors = plt.cm.viridis(np.linspace(0, 1.0, vel_bins)) # Set the current speed bin label names # Calculate the 2D histogram - labels = 
[f'{i:.1f}-{j:.1f}' for i, - j in zip(vel_edges[:-1], vel_edges[1:])] + labels = [f"{i:.1f}-{j:.1f}" for i, j in zip(vel_edges[:-1], vel_edges[1:])] # Initialize the vertical-offset (polar radius) for the stacked bar chart. r_offset = np.zeros(dir_bins) for vel_bin in range(vel_bins): # Plot fist set of bars in all directions - ax.bar(thetas, H[:, vel_bin], width=(2*np.pi/dir_bins), - bottom=r_offset, color=colors[vel_bin], label=labels[vel_bin]) + ax.bar( + thetas, + H[:, vel_bin], + width=(2 * np.pi / dir_bins), + bottom=r_offset, + color=colors[vel_bin], + label=labels[vel_bin], + ) # Increase the radius offset in all directions r_offset = r_offset + H[:, vel_bin] # Add the a legend for current speed bins plt.legend( - loc='best', title='Velocity bins [m/s]', bbox_to_anchor=(1.29, 1.00), ncol=1) + loc="best", title="Velocity bins [m/s]", bbox_to_anchor=(1.29, 1.00), ncol=1 + ) # Get the r-ticks (polar y-ticks) yticks = plt.yticks() # Format y-ticks with units for clarity - rticks = [f'{y:.1f}%' for y in yticks[0]] + rticks = [f"{y:.1f}%" for y in yticks[0]] # Set the y-ticks plt.yticks(yticks[0], rticks) return ax @@ -210,10 +218,10 @@ def plot_joint_probability_distribution( ax=None, metadata=None, flood=None, - ebb=None + ebb=None, ): """ - Creates a polar histogram. Direction angles from binned histogram must + Creates a polar histogram. Direction angles from binned histogram must be specified such that 0 is north. 
Parameters @@ -222,9 +230,9 @@ def plot_joint_probability_distribution( Directions in degrees with 0 degrees specified as true north velocities: array-like Velocities in m/s - width_dir: float + width_dir: float Width of directional bins for histogram in degrees - width_vel: float + width_vel: float Width of velocity bins for histogram in m/s ax: float Polar plot axes to add polar histogram @@ -232,71 +240,68 @@ def plot_joint_probability_distribution( If provided needs keys ['name', 'Lat', 'Lon'] for plot title and information box on plot flood: float - Direction in degrees added to theta ticks + Direction in degrees added to theta ticks ebb: float Direction in degrees added to theta ticks Returns ------- ax: figure - Joint probability distribution + Joint probability distribution """ _check_inputs(directions, velocities, flood, ebb) if not isinstance(width_dir, (int, float)): - raise TypeError('width_dir must be of type int or float') + raise TypeError("width_dir must be of type int or float") if not isinstance(width_vel, (int, float)): - raise TypeError('width_vel must be of type int or float') + raise TypeError("width_vel must be of type int or float") if width_dir < 0: - raise ValueError('width_dir must be greater than 0') + raise ValueError("width_dir must be greater than 0") if width_vel < 0: - raise ValueError('width_vel must be greater than 0') + raise ValueError("width_vel must be greater than 0") # Calculate the 2D histogram - H, dir_edges, vel_edges = _histogram( - directions, velocities, width_dir, width_vel) + H, dir_edges, vel_edges = _histogram(directions, velocities, width_dir, width_vel) # Initialize the polar polt ax = _initialize_polar(ax=ax, metadata=metadata, flood=flood, ebb=ebb) # Set the current speed bin label names - labels = [f'{i:.1f}-{j:.1f}' for i, - j in zip(vel_edges[:-1], vel_edges[1:])] + labels = [f"{i:.1f}-{j:.1f}" for i, j in zip(vel_edges[:-1], vel_edges[1:])] # Set vel & dir bins to middle of bin except at ends - dir_bins = 
0.5*(dir_edges[1:] + dir_edges[:-1]) # set all bins to middle - vel_bins = 0.5*(vel_edges[1:] + vel_edges[:-1]) + dir_bins = 0.5 * (dir_edges[1:] + dir_edges[:-1]) # set all bins to middle + vel_bins = 0.5 * (vel_edges[1:] + vel_edges[:-1]) # Reset end of bin range to edge of bin dir_bins[0] = dir_edges[0] vel_bins[0] = vel_edges[0] dir_bins[-1] = dir_edges[-1] vel_bins[-1] = vel_edges[-1] # Interpolate the bins back to specific data points - z = _interpn((dir_bins, vel_bins), - H, np.vstack([directions, velocities]).T, method="splinef2d", - bounds_error=False) + z = _interpn( + (dir_bins, vel_bins), + H, + np.vstack([directions, velocities]).T, + method="splinef2d", + bounds_error=False, + ) # Plot the most probable data last idx = z.argsort() # Convert to radians and order points by probability - theta, r, z = directions.values[idx] * \ - np.pi/180, velocities.values[idx], z[idx] + theta, r, z = directions.values[idx] * np.pi / 180, velocities.values[idx], z[idx] # Create scatter plot colored by probability density sx = ax.scatter(theta, r, c=z, s=5, edgecolor=None) # Create colorbar - plt.colorbar(sx, ax=ax, label='Joint Probability [%]') + plt.colorbar(sx, ax=ax, label="Joint Probability [%]") # Get the r-ticks (polar y-ticks) yticks = ax.get_yticks() # Set y-ticks labels ax.set_yticks(yticks) # to avoid matplotlib warning - ax.set_yticklabels([f'{y:.1f} $m/s$' for y in yticks]) + ax.set_yticklabels([f"{y:.1f} $m/s$" for y in yticks]) return ax def plot_current_timeseries( - directions, - velocities, - principal_direction, - label=None, - ax=None + directions, velocities, principal_direction, label=None, ax=None ): """ Returns a plot of velocity from an array of direction and speed @@ -313,7 +318,7 @@ def plot_current_timeseries( label: string Label to use in the legend ax : matplotlib axes object - Axes for plotting. If None, then a new figure with a single + Axes for plotting. If None, then a new figure with a single axes is used. 
Returns @@ -325,30 +330,29 @@ def plot_current_timeseries( _check_inputs(directions, velocities, flood=None, ebb=None) if not isinstance(principal_direction, (int, float)): - raise TypeError('principal_direction must be of type int or float') + raise TypeError("principal_direction must be of type int or float") if (principal_direction < 0) and (principal_direction > 360): - raise ValueError( - 'principal_direction must be between 0 and 360 degrees') + raise ValueError("principal_direction must be between 0 and 360 degrees") # Rotate coordinate system by supplied principal_direction principal_directions = directions - principal_direction # Calculate the velocity - velocity = velocities * np.cos(np.pi/180*principal_directions) + velocity = velocities * np.cos(np.pi / 180 * principal_directions) # Call on standard xy plotting - ax = _xy_plot(velocities.index, velocity, fmt='-', label=label, - xlabel='Time', ylabel='Velocity [$m/s$]', ax=ax) + ax = _xy_plot( + velocities.index, + velocity, + fmt="-", + label=label, + xlabel="Time", + ylabel="Velocity [$m/s$]", + ax=ax, + ) return ax -def tidal_phase_probability( - directions, - velocities, - flood, - ebb, - bin_size=0.1, - ax=None -): - """ +def tidal_phase_probability(directions, velocities, flood, ebb, bin_size=0.1, ax=None): + """ Discretizes the tidal series speed by bin size and returns a plot of the probability for each bin in the flood or ebb tidal phase. @@ -365,7 +369,7 @@ def tidal_phase_probability( bin_size: float Speed bin size. Optional. Deaful = 0.1 m/s ax : matplotlib axes object - Axes for plotting. If None, then a new figure with a single + Axes for plotting. If None, then a new figure with a single axes is used. 
Returns @@ -375,22 +379,22 @@ def tidal_phase_probability( _check_inputs(directions, velocities, flood, ebb) if bin_size < 0: - raise ValueError('bin_size must be greater than 0') + raise ValueError("bin_size must be greater than 0") if ax == None: fig, ax = plt.subplots(figsize=(12, 8)) isEbb = _flood_or_ebb(directions, flood, ebb) - decimals = round(bin_size/0.1) - N_bins = int(round(velocities.max(), decimals)/bin_size) + decimals = round(bin_size / 0.1) + N_bins = int(round(velocities.max(), decimals) / bin_size) H, bins = np.histogram(velocities, bins=N_bins) H_ebb, bins1 = np.histogram(velocities[isEbb], bins=bins) H_flood, bins2 = np.histogram(velocities[~isEbb], bins=bins) - p_ebb = H_ebb/H - p_flood = H_flood/H + p_ebb = H_ebb / H + p_flood = H_flood / H center = (bins[:-1] + bins[1:]) / 2 width = 0.9 * (bins[1] - bins[0]) @@ -398,32 +402,44 @@ def tidal_phase_probability( mask1 = np.ma.where(p_ebb >= p_flood) mask2 = np.ma.where(p_flood >= p_ebb) - ax.bar(center[mask1], height=p_ebb[mask1], edgecolor='black', width=width, - label='Ebb', color='blue') - ax.bar(center, height=p_flood, edgecolor='black', width=width, - alpha=1, label='Flood', color='orange') - ax.bar(center[mask2], height=p_ebb[mask2], alpha=1, edgecolor='black', - width=width, color='blue') - - plt.xlabel('Velocity [m/s]') - plt.ylabel('Probability') + ax.bar( + center[mask1], + height=p_ebb[mask1], + edgecolor="black", + width=width, + label="Ebb", + color="blue", + ) + ax.bar( + center, + height=p_flood, + edgecolor="black", + width=width, + alpha=1, + label="Flood", + color="orange", + ) + ax.bar( + center[mask2], + height=p_ebb[mask2], + alpha=1, + edgecolor="black", + width=width, + color="blue", + ) + + plt.xlabel("Velocity [m/s]") + plt.ylabel("Probability") plt.ylim(0, 1.0) plt.legend() - plt.grid(linestyle=':') + plt.grid(linestyle=":") return ax -def tidal_phase_exceedance( - directions, - velocities, - flood, - ebb, - bin_size=0.1, - ax=None -): +def 
tidal_phase_exceedance(directions, velocities, flood, ebb, bin_size=0.1, ax=None): """ - Returns a stacked area plot of the exceedance probability for the + Returns a stacked area plot of the exceedance probability for the flood and ebb tidal phases. Parameters @@ -435,21 +451,21 @@ def tidal_phase_exceedance( flood: float or int Principal component of flow in the flood direction [degrees] ebb: float or int - Principal component of flow in the ebb direction [degrees] + Principal component of flow in the ebb direction [degrees] bin_size: float - Speed bin size. Optional. Deaful = 0.1 m/s + Speed bin size. Optional. Deaful = 0.1 m/s ax : matplotlib axes object - Axes for plotting. If None, then a new figure with a single + Axes for plotting. If None, then a new figure with a single axes is used. Returns ------- - ax: figure + ax: figure """ _check_inputs(directions, velocities, flood, ebb) if bin_size < 0: - raise ValueError('bin_size must be greater than 0') + raise ValueError("bin_size must be greater than 0") if ax == None: fig, ax = plt.subplots(figsize=(12, 8)) @@ -459,17 +475,20 @@ def tidal_phase_exceedance( s_ebb = velocities[isEbb] s_flood = velocities[~isEbb] - F = exceedance_probability(velocities)['F'] - F_ebb = exceedance_probability(s_ebb)['F'] - F_flood = exceedance_probability(s_flood)['F'] + F = exceedance_probability(velocities)["F"] + F_ebb = exceedance_probability(s_ebb)["F"] + F_flood = exceedance_probability(s_flood)["F"] - decimals = round(bin_size/0.1) - s_new = np.arange(np.around(velocities.min(), decimals), - np.around(velocities.max(), decimals)+bin_size, bin_size) + decimals = round(bin_size / 0.1) + s_new = np.arange( + np.around(velocities.min(), decimals), + np.around(velocities.max(), decimals) + bin_size, + bin_size, + ) f_total = interp1d(velocities, F, bounds_error=False) - f_ebb = interp1d(s_ebb, F_ebb, bounds_error=False) - f_flood = interp1d(s_flood, F_flood, bounds_error=False) + f_ebb = interp1d(s_ebb, F_ebb, 
bounds_error=False) + f_flood = interp1d(s_flood, F_flood, bounds_error=False) F_total = f_total(s_new) F_ebb = f_ebb(s_new) @@ -477,12 +496,16 @@ def tidal_phase_exceedance( F_max_total = np.nanmax(F_ebb) + np.nanmax(F_flood) - ax.stackplot(s_new, F_ebb/F_max_total*100, - F_flood/F_max_total*100, labels=['Ebb', 'Flood']) + ax.stackplot( + s_new, + F_ebb / F_max_total * 100, + F_flood / F_max_total * 100, + labels=["Ebb", "Flood"], + ) - plt.xlabel('velocity [m/s]') - plt.ylabel('Probability of Exceedance') + plt.xlabel("velocity [m/s]") + plt.ylabel("Probability of Exceedance") plt.legend() - plt.grid(linestyle=':', linewidth=1) + plt.grid(linestyle=":", linewidth=1) return ax diff --git a/mhkit/tidal/io/__init__.py b/mhkit/tidal/io/__init__.py index 3e20434aa..3f75b8116 100644 --- a/mhkit/tidal/io/__init__.py +++ b/mhkit/tidal/io/__init__.py @@ -1 +1,2 @@ from mhkit.tidal.io import noaa +from mhkit.tidal.io import d3d diff --git a/mhkit/tidal/io/d3d.py b/mhkit/tidal/io/d3d.py new file mode 100644 index 000000000..67ec083d9 --- /dev/null +++ b/mhkit/tidal/io/d3d.py @@ -0,0 +1 @@ +from mhkit.river.io.d3d import * diff --git a/mhkit/tidal/io/noaa.py b/mhkit/tidal/io/noaa.py index 4c261fb43..f11820695 100644 --- a/mhkit/tidal/io/noaa.py +++ b/mhkit/tidal/io/noaa.py @@ -1,42 +1,55 @@ """ noaa.py -This module provides functions to fetch, process, and read NOAA (National Oceanic and Atmospheric Administration) -current data directly from the NOAA Tides and Currents API (https://tidesandcurrents.noaa.gov/api/). It supports -loading data into a pandas DataFrame, handling data in XML and JSON formats, and writing data to a JSON file. +This module provides functions to fetch, process, and read NOAA (National +Oceanic and Atmospheric Administration) current data directly from the +NOAA Tides and Currents API (https://tidesandcurrents.noaa.gov/api/). It +supports loading data into a pandas DataFrame, handling data in XML and +JSON formats, and writing data to a JSON file. 
Functions: ---------- -request_noaa_data(station, parameter, start_date, end_date, proxy=None, write_json=None): - Loads NOAA current data from the API into a pandas DataFrame, with optional support for proxy settings and - writing data to a JSON file. - -_json_to_dataframe(response): - Converts NOAA response data in JSON format into a pandas DataFrame and returns metadata. (Currently, this - function does not return the full dataset requested.) +request_noaa_data(station, parameter, start_date, end_date, proxy=None, + write_json=None): + Loads NOAA current data from the API into a pandas DataFrame, + with optional support for proxy settings and writing data to a JSON + file. _xml_to_dataframe(response): - Converts NOAA response data in XML format into a pandas DataFrame and returns metadata. + Converts NOAA response data in XML format into a pandas DataFrame + and returns metadata. read_noaa_json(filename): - Reads a JSON file containing NOAA data saved from the request_noaa_data function and returns a DataFrame with - timeseries site data and metadata. + Reads a JSON file containing NOAA data saved from the request_noaa_data + function and returns a DataFrame with timeseries site data and metadata. """ + +import os import xml.etree.ElementTree as ET import datetime import json import math +import shutil import pandas as pd import requests - - -def request_noaa_data(station, parameter, start_date, end_date, - proxy=None, write_json=None): +from mhkit.utils.cache import handle_caching + + +def request_noaa_data( + station, + parameter, + start_date, + end_date, + proxy=None, + write_json=None, + clear_cache=False, + to_pandas=True, +): """ - Loads NOAA current data directly from https://tidesandcurrents.noaa.gov/api/ using a - get request into a pandas DataFrame. NOAA sets max of 31 days between start and end date. - See https://co-ops.nos.noaa.gov/api/ for options. All times are reported as GMT and metric - units are returned for data. 
+ Loads NOAA current data directly from https://tidesandcurrents.noaa.gov/api/ + into a pandas DataFrame. NOAA sets max of 31 days between start and end date. + See https://co-ops.nos.noaa.gov/api/ for options. All times are reported as + GMT and metric units are returned for data. Uses cached data if available. The request URL prints to the screen. @@ -49,158 +62,231 @@ def request_noaa_data(station, parameter, start_date, end_date, start_date : str Start date in the format yyyyMMdd end_date : str - End date in the format yyyyMMdd + End date in the format yyyyMMdd proxy : dict or None - To request data from behind a firewall, define a dictionary of proxy settings, - for example {"http": 'localhost:8080'} + To request data from behind a firewall, define a dictionary of proxy + settings, for example {"http": 'localhost:8080'} write_json : str or None Name of json file to write data + clear_cache : bool + If True, the cache for this specific request will be cleared. + to_pandas : bool, optional + Flag to output pandas instead of xarray. Default = True. Returns ------- - data : pandas DataFrame - Data indexed by datetime with columns named according to the parameter's + data : pandas DataFrame or xarray Dataset + Data indexed by datetime with columns named according to the parameter's variable description + metadata : dict or None + Request metadata. If returning xarray, metadata is instead attached to + the data's attributes. 
""" - # Convert start and end dates to datetime objects - begin = datetime.datetime.strptime(start_date, '%Y%m%d').date() - end = datetime.datetime.strptime(end_date, '%Y%m%d').date() - - # Determine the number of 30 day intervals - delta = 30 - interval = math.ceil(((end - begin).days)/delta) - - # Create date ranges with 30 day intervals - date_list = [ - begin + datetime.timedelta(days=i * delta) for i in range(interval + 1)] - date_list[-1] = end - - # Iterate over date_list (30 day intervals) and fetch data - data_frames = [] - for i in range(len(date_list) - 1): - start_date = date_list[i].strftime('%Y%m%d') - end_date = date_list[i + 1].strftime('%Y%m%d') - - api_query = f"begin_date={start_date}&end_date={end_date}&station={station}&product={parameter}&units=metric&time_zone=gmt&application=web_services&format=xml" - data_url = f"https://tidesandcurrents.noaa.gov/api/datagetter?{api_query}" - - print('Data request URL: ', data_url) - - # Get response - response = requests.get(url=data_url, proxies=proxy) - - # Convert to DataFrame and save in data_frames list - df, metadata = _xml_to_dataframe(response) - data_frames.append(df) - - # Concatenate all DataFrames - data = pd.concat(data_frames, ignore_index=False) - - # Remove duplicated date values - data = data.loc[~data.index.duplicated()] - - # Write json if specified - if write_json is not None: - with open(write_json, 'w') as outfile: - # Convert DataFrame to json - jsonData = data.to_json() - # Convert to python object data - pyData = json.loads(jsonData) - # Add metadata to pyData - pyData['metadata'] = metadata - # Wrtie the pyData to a json file - json.dump(pyData, outfile) - return data, metadata - - -def _json_to_dataframe(response): - ''' - Returns a dataframe and metadata from a NOAA - response. - TODO: This function currently does not return the - full dataset requested. 
- ''' - text = json.loads(response.text) - metadata = text['metadata'] - # import ipdb; ipdb.set_trace() - # Initialize DataFrame - data = pd.DataFrame.from_records( - text['data'][1], index=[text['data'][1]['t']]) - # Append all times to DataFrame - for i in range(1, len(text['data'])): - data.append(pd.DataFrame.from_records(text['data'][i], - index=[text['data'][i]['t']])) - # Convert index to DataFram - data.index = pd.to_datetime(data.index) - # Remove 't' becuase it is the index - del data['t'] - # List of columns which are string - cols = data.columns[data.dtypes.eq('object')] - # Convert columns to float - data[cols] = data[cols].apply(pd.to_numeric, errors='coerce') - return data, metadata + # Type check inputs + if not isinstance(station, str): + raise TypeError( + f"Expected 'station' to be of type str, but got {type(station)}" + ) + if not isinstance(parameter, str): + raise TypeError( + f"Expected 'parameter' to be of type str, but got {type(parameter)}" + ) + if not isinstance(start_date, str): + raise TypeError( + f"Expected 'start_date' to be of type str, but got {type(start_date)}" + ) + if not isinstance(end_date, str): + raise TypeError( + f"Expected 'end_date' to be of type str, but got {type(end_date)}" + ) + if proxy and not isinstance(proxy, dict): + raise TypeError( + f"Expected 'proxy' to be of type dict or None, but got {type(proxy)}" + ) + if write_json and not isinstance(write_json, str): + raise TypeError( + f"Expected 'write_json' to be of type str or None, but got {type(write_json)}" + ) + if not isinstance(clear_cache, bool): + raise TypeError( + f"Expected 'clear_cache' to be of type bool, but got {type(clear_cache)}" + ) + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. 
Got: {type(to_pandas)}") + + # Define the path to the cache directory + cache_dir = os.path.join(os.path.expanduser("~"), ".cache", "mhkit", "noaa") + + # Create a unique filename based on the function parameters + hash_params = f"{station}_{parameter}_{start_date}_{end_date}" + + # Use handle_caching to manage cache + cached_data, cached_metadata, cache_filepath = handle_caching( + hash_params, cache_dir, write_json=write_json, clear_cache_file=clear_cache + ) + + if cached_data is not None: + if write_json: + shutil.copy(cache_filepath, write_json) + if to_pandas: + return cached_data, cached_metadata + else: + cached_data = cached_data.to_xarray() + cached_data.attrs = cached_metadata + return cached_data + # If no cached data is available, make the API request + # no coverage bc in coverage runs we have already cached the data/ run this code + else: # pragma: no cover + # Convert start and end dates to datetime objects + begin = datetime.datetime.strptime(start_date, "%Y%m%d").date() + end = datetime.datetime.strptime(end_date, "%Y%m%d").date() + + # Determine the number of 30 day intervals + delta = 30 + interval = math.ceil(((end - begin).days) / delta) + + # Create date ranges with 30 day intervals + date_list = [ + begin + datetime.timedelta(days=i * delta) for i in range(interval + 1) + ] + date_list[-1] = end + + # Iterate over date_list (30 day intervals) and fetch data + data_frames = [] + for i in range(len(date_list) - 1): + start_date = date_list[i].strftime("%Y%m%d") + end_date = date_list[i + 1].strftime("%Y%m%d") + + api_query = f"begin_date={start_date}&end_date={end_date}&station={station}&product={parameter}&units=metric&time_zone=gmt&application=web_services&format=xml" + data_url = f"https://tidesandcurrents.noaa.gov/api/datagetter?{api_query}" + + print("Data request URL: ", data_url) + + # Get response + try: + response = requests.get(url=data_url, proxies=proxy) + response.raise_for_status() + except requests.exceptions.HTTPError as err: + 
print(f"HTTP error occurred: {err}") + continue + except requests.exceptions.RequestException as err: + print(f"Error occurred: {err}") + continue + # Convert to DataFrame and save in data_frames list + df, metadata = _xml_to_dataframe(response) + data_frames.append(df) + + # Concatenate all DataFrames + data = pd.concat(data_frames, ignore_index=False) + + # Remove duplicated date values + data = data.loc[~data.index.duplicated()] + + # After making the API request and processing the response, write the + # response to a cache file + handle_caching( + hash_params, + cache_dir, + data=data, + metadata=metadata, + clear_cache_file=clear_cache, + ) + + if write_json: + shutil.copy(cache_filepath, write_json) + + if to_pandas: + return data, metadata + else: + data = data.to_xarray() + data.attrs = metadata + return data def _xml_to_dataframe(response): - ''' + """ Returns a dataframe from an xml response - ''' + """ root = ET.fromstring(response.text) metadata = None data = None for child in root: # Save meta data dictionary - if child.tag == 'metadata': + if child.tag == "metadata": metadata = child.attrib - elif child.tag == 'observations': + elif child.tag == "observations": data = child - elif child.tag == 'error': - print('***ERROR: Response returned error') + elif child.tag == "error": + print("***ERROR: Response returned error") return None if data is None: - print('***ERROR: No observations found') + print("***ERROR: No observations found") return None # Create a list of DataFrames then Concatenate - df = pd.concat([pd.DataFrame(obs.attrib, index=[0]) - for obs in data], ignore_index=True) + df = pd.concat( + [pd.DataFrame(obs.attrib, index=[0]) for obs in data], ignore_index=True + ) # Convert time to datetime - df['t'] = pd.to_datetime(df.t) - df = df.set_index('t') + df["t"] = pd.to_datetime(df.t) + df = df.set_index("t") df.drop_duplicates(inplace=True) # Convert data to float - df[['d', 's']] = df[['d', 's']].apply(pd.to_numeric) + df[["d", "s"]] = 
df[["d", "s"]].apply(pd.to_numeric) return df, metadata -def read_noaa_json(filename): - ''' - Returns site DataFrame and metadata from a json saved from the +def read_noaa_json(filename, to_pandas=True): + """ + Returns site DataFrame and metadata from a json saved from the request_noaa_data Parameters ---------- filename: string filename with path of json file to load + to_pandas : bool, optional + Flag to output pandas instead of xarray. Default = True. + Returns ------- data: DataFrame - Timeseries Site data of direction and speed - metadata: dictionary - Site metadata - ''' + Timeseries Site data of direction and speed + metadata : dictionary or None + Site metadata. If returning xarray, metadata is instead attached to + the data's attributes. + """ + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. Got: {type(to_pandas)}") + with open(filename) as outfile: - jsonData = json.load(outfile) - # Get the metadata - metadata = jsonData['metadata'] - # Remove metadata entry - del jsonData['metadata'] - # Remainder is DataFrame - data = pd.DataFrame.from_dict(jsonData) - # Convert from epoch to date time - data.index = pd.to_datetime(data.index, unit='ms') - return data, metadata + json_data = json.load(outfile) + try: # original MHKiT format (deprecate in future) + # Get the metadata + metadata = json_data["metadata"] + # Remove metadata entry + del json_data["metadata"] + # Remainder is DataFrame + data = pd.DataFrame.from_dict(json_data) + # Convert from epoch to date time + data.index = pd.to_datetime(data.index, unit="ms") + + except ValueError: # using cache.py format + if "metadata" in json_data: + metadata = json_data.pop("metadata", None) + data = pd.DataFrame( + json_data["data"], + index=pd.to_datetime(json_data["index"]), + columns=json_data["columns"], + ) + + if to_pandas: + return data, metadata + else: + data = data.to_xarray() + data.attrs = metadata + return data diff --git a/mhkit/tidal/performance.py 
b/mhkit/tidal/performance.py index f3346003a..3a516bec7 100644 --- a/mhkit/tidal/performance.py +++ b/mhkit/tidal/performance.py @@ -1,12 +1,16 @@ import numpy as np -import pandas as pd import xarray as xr -import warnings +from mhkit.utils import convert_to_dataarray from mhkit import dolfyn -from mhkit.river.performance import (circular, ducted, rectangular, - multiple_circular, tip_speed_ratio, - power_coefficient) +from mhkit.river.performance import ( + circular, + ducted, + rectangular, + multiple_circular, + tip_speed_ratio, + power_coefficient, +) def _slice_circular_capture_area(diameter, hub_height, doppler_cell_size): @@ -29,15 +33,15 @@ def _slice_circular_capture_area(diameter, hub_height, doppler_cell_size): Returns --------- capture_area_slice: xarray.DataArray - Capture area sliced into horizontal slices of height + Capture area sliced into horizontal slices of height `doppler_cell_size`, centered on `hub height`. """ def area_of_circle_segment(radius, angle): # Calculating area of sector - area_of_sector = np.pi * radius**2 * (angle/360) + area_of_sector = np.pi * radius**2 * (angle / 360) # Calculating area of triangle - area_of_triangle = 0.5 * radius**2 * np.sin((np.pi*angle)/180) + area_of_triangle = 0.5 * radius**2 * np.sin((np.pi * angle) / 180) return area_of_sector - area_of_triangle def point_on_circle(y, r): @@ -47,44 +51,44 @@ def point_on_circle(y, r): d = diameter cs = doppler_cell_size - A_cap = np.pi*(d/2)**2 # m^2 + A_cap = np.pi * (d / 2) ** 2 # m^2 # Need to chop up capture area into slices based on bin size # For a cirle: - r_min = hub_height - d/2 - r_max = hub_height + d/2 - A_edge = np.arange(r_min, r_max+cs, cs) - A_rng = A_edge[:-1] + cs/2 # Center of each slice + r_min = hub_height - d / 2 + r_max = hub_height + d / 2 + A_edge = np.arange(r_min, r_max + cs, cs) + A_rng = A_edge[:-1] + cs / 2 # Center of each slice # y runs from the bottom edge of the lower centerline slice to # the top edge of the lowest slice # Will need 
to figure out y if the hub height isn't centered y = abs(A_edge - np.mean(A_edge)) - y[np.where(abs(y) > (d/2))] = d/2 + y[np.where(abs(y) > (d / 2))] = d / 2 # Even vs odd number of slices if y.size % 2: odd = 1 else: odd = 0 - y = y[:len(y)//2] + y = y[: len(y) // 2] y = np.append(y, 0) - x = point_on_circle(y, d/2) - radii = np.rad2deg(np.arctan(x/y)*2) + x = point_on_circle(y, d / 2) + radii = np.rad2deg(np.arctan(x / y) * 2) # Segments go from outside of circle towards middle - As = area_of_circle_segment(d/2, radii) + As = area_of_circle_segment(d / 2, radii) # Subtract segments to get area of slices As_slc = As[1:] - As[:-1] if not odd: # Make middle slice half whole - As_slc[-1] = As_slc[-1]*2 + As_slc[-1] = As_slc[-1] * 2 # Copy-flip the other slices to get the whole circle As_slc = np.append(As_slc, np.flip(As_slc[:-1])) else: As_slc = abs(As_slc) - return xr.DataArray(As_slc, coords={'range': A_rng}) + return xr.DataArray(As_slc, coords={"range": A_rng}) def _slice_rectangular_capture_area(height, width, hub_height, doppler_cell_size): @@ -110,72 +114,48 @@ def _slice_rectangular_capture_area(height, width, hub_height, doppler_cell_size Returns --------- capture_area_slice: xarray.DataArray - Capture area sliced into horizontal slices of height + Capture area sliced into horizontal slices of height `doppler_cell_size`, centered on `hub height`. 
""" # Need to chop up capture area into slices based on bin size # For a rectangle it's pretty simple cs = doppler_cell_size - r_min = hub_height - height/2 - r_max = hub_height + height/2 - A_edge = np.arange(r_min, r_max+cs, cs) - A_rng = A_edge[:-1] + cs/2 # Center of each slice - - As_slc = np.ones(len(A_rng))*width*cs - - return xr.DataArray(As_slc, coords={'range': A_rng}) - - -def _check_dtype(var, var_name): + r_min = hub_height - height / 2 + r_max = hub_height + height / 2 + A_edge = np.arange(r_min, r_max + cs, cs) + A_rng = A_edge[:-1] + cs / 2 # Center of each slice + + As_slc = np.ones(len(A_rng)) * width * cs + + return xr.DataArray(As_slc, coords={"range": A_rng}) + + +def power_curve( + power, + velocity, + hub_height, + doppler_cell_size, + sampling_frequency, + window_avg_time=600, + turbine_profile="circular", + diameter=None, + height=None, + width=None, + to_pandas=True, +): """ - Checks the datatype of a variable, converting pandas Series to xarray DataArray, - or raising an error if the datatype is neither. - - Parameters - ------------- - var: xr.DataArray or pd.Series - The variable to be checked. - - var_name: str - The name of the variable, used for error message. - - Returns - --------- - var: xr.DataArray - The input variable, converted to xr.DataArray if it was a pd.Series. - """ - - if isinstance(var, pd.Series): - var = var.to_xarray() - elif not isinstance(var, xr.DataArray): - raise TypeError(var_name.capitalize() + - ' must be of type xr.DataArray or pd.Series') - return var - - -def power_curve(power, - velocity, - hub_height, - doppler_cell_size, - sampling_frequency, - window_avg_time=600, - turbine_profile='circular', - diameter=None, - height=None, - width=None): - """ - Calculates power curve and power statistics for a marine energy + Calculates power curve and power statistics for a marine energy device based on IEC/TS 62600-200 section 9.3. 
Parameters ------------- - power: pandas.Series or xarray.DataArray (time) + power: numpy ndarray, pandas DataFrame, pandas Series, xarray DataArray, or xarray Dataset Device power output timeseries. - velocity: pandas.Series or xarray.DataArray ([range,] time) + velocity: numpy ndarray, pandas DataFrame, pandas Series, xarray DataArray, or xarray Dataset 1D or 2D streamwise sea water velocity or sea water speed. hub_height: numeric - Turbine hub height altitude above the seabed. Assumes ADCP + Turbine hub height altitude above the seabed. Assumes ADCP depth bins are referenced to the seafloor. doppler_cell_size: numeric ADCP depth bin size. @@ -191,111 +171,141 @@ def power_curve(power, Required for turbine_profile='rectangular'. Defaults to None. width: numeric, optional Required for turbine_profile='rectangular'. Defaults to None. + to_pandas: bool, optional + Flag to output pandas instead of xarray. Default = True. Returns --------- - pandas.DataFrame + device_power_curve: pandas DataFrame or xarray Dataset Power-weighted velocity, mean power, power std dev, max and min power vs hub-height velocity. """ # Velocity should be a 2D xarray or pandas array and have dims (range, time) # Power should have a timestamp coordinate/index - power = _check_dtype(power, 'power') - velocity = _check_dtype(velocity, 'velocity') + power = convert_to_dataarray(power) + velocity = convert_to_dataarray(velocity) if len(velocity.shape) != 2: - raise ValueError("Velocity should be 2 dimensional and have \ - dimensions of 'time' (temporal) and 'range' (spatial).") + raise ValueError( + "Velocity should be 2 dimensional and have \ + dimensions of 'time' (temporal) and 'range' (spatial)." + ) + + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. 
Got: {type(to_pandas)}") # Numeric positive checks - numeric_params = [hub_height, doppler_cell_size, - sampling_frequency, window_avg_time] - numeric_param_names = ['hub_height', 'doppler_cell_size', - 'sampling_frequency', 'window_avg_time'] + numeric_params = [ + hub_height, + doppler_cell_size, + sampling_frequency, + window_avg_time, + ] + numeric_param_names = [ + "hub_height", + "doppler_cell_size", + "sampling_frequency", + "window_avg_time", + ] for param, name in zip(numeric_params, numeric_param_names): if not isinstance(param, (int, float)): - raise TypeError(f'{name} must be numeric.') + raise TypeError(f"{name} must be numeric.") if param <= 0: - raise ValueError(f'{name} must be positive.') + raise ValueError(f"{name} must be positive.") # Turbine profile related checks - if turbine_profile not in ['circular', 'rectangular']: + if turbine_profile not in ["circular", "rectangular"]: raise ValueError( - "`turbine_profile` must be one of 'circular' or 'rectangular'.") - if turbine_profile == 'circular': + "`turbine_profile` must be one of 'circular' or 'rectangular'." + ) + if turbine_profile == "circular": if diameter is None: raise TypeError( - "`diameter` cannot be None for input `turbine_profile` = 'circular'.") + "`diameter` cannot be None for input `turbine_profile` = 'circular'." + ) elif not isinstance(diameter, (int, float)) or diameter <= 0: raise ValueError("`diameter` must be a positive number.") else: # If the checks pass, calculate A_slc A_slc = _slice_circular_capture_area( - diameter, hub_height, doppler_cell_size) + diameter, hub_height, doppler_cell_size + ) else: # Rectangular profile if height is None or width is None: raise TypeError( - "`height` and `width` cannot be None for input `turbine_profile` = 'rectangular'.") - elif not all(isinstance(val, (int, float)) and val > 0 for val in [height, width]): + "`height` and `width` cannot be None for input `turbine_profile` = 'rectangular'." 
+ ) + elif not all( + isinstance(val, (int, float)) and val > 0 for val in [height, width] + ): raise ValueError("`height` and `width` must be positive numbers.") else: # If the checks pass, calculate A_slc A_slc = _slice_rectangular_capture_area( - height, width, hub_height, doppler_cell_size) + height, width, hub_height, doppler_cell_size + ) # Streamwise data U = abs(velocity) - time = U['time'].values + time = U["time"].values # Interpolate power to velocity timestamps - P = power.interp(time=U['time'], method='linear') + P = power.interp(time=U["time"], method="linear") # Power weighted velocity in capture area # Interpolate U range to capture area slices, then cube and multiply by area - U_hat = U.interp(range=A_slc['range'], method='linear')**3 * A_slc + U_hat = U.interp(range=A_slc["range"], method="linear") ** 3 * A_slc # Average the velocity across the capture area and divide out area - U_hat = (U_hat.sum('range') / A_slc.sum()) ** (-1/3) + U_hat = (U_hat.sum("range") / A_slc.sum()) ** (-1 / 3) # Time-average velocity at hub-height - bnr = dolfyn.VelBinner(n_bin=window_avg_time * - sampling_frequency, fs=sampling_frequency) + bnr = dolfyn.VelBinner( + n_bin=window_avg_time * sampling_frequency, fs=sampling_frequency + ) # Hub-height velocity mean - mean_hub_vel = xr.DataArray(bnr.mean(U.sel(range=hub_height, method='nearest').values), - coords={'time': bnr.mean(time)}) + mean_hub_vel = xr.DataArray( + bnr.mean(U.sel(range=hub_height, method="nearest").values), + coords={"time": bnr.mean(time)}, + ) # Power-weighted hub-height velocity mean - U_hat_bar = xr.DataArray((bnr.mean(U_hat.values ** 3)) ** (-1/3), - coords={'time': bnr.mean(time)}) + U_hat_bar = xr.DataArray( + (bnr.mean(U_hat.values**3)) ** (-1 / 3), coords={"time": bnr.mean(time)} + ) # Average power - P_bar = xr.DataArray(bnr.mean(P.values), - coords={'time': bnr.mean(time)}) + P_bar = xr.DataArray(bnr.mean(P.values), coords={"time": bnr.mean(time)}) # Then reorganize into 0.1 m velocity bins 
and average U_bins = np.arange(0, np.nanmax(mean_hub_vel) + 0.1, 0.1) - U_hub_vel = mean_hub_vel.assign_coords( - {"time": mean_hub_vel}).rename({"time": "speed"}) + U_hub_vel = mean_hub_vel.assign_coords({"time": mean_hub_vel}).rename( + {"time": "speed"} + ) U_hub_mean = U_hub_vel.groupby_bins("speed", U_bins).mean() - U_hat_vel = U_hat_bar.assign_coords( - {"time": mean_hub_vel}).rename({"time": "speed"}) + U_hat_vel = U_hat_bar.assign_coords({"time": mean_hub_vel}).rename( + {"time": "speed"} + ) U_hat_mean = U_hat_vel.groupby_bins("speed", U_bins).mean() - P_bar_vel = P_bar.assign_coords( - {"time": mean_hub_vel}).rename({"time": "speed"}) + P_bar_vel = P_bar.assign_coords({"time": mean_hub_vel}).rename({"time": "speed"}) P_bar_mean = P_bar_vel.groupby_bins("speed", U_bins).mean() P_bar_std = P_bar_vel.groupby_bins("speed", U_bins).std() P_bar_max = P_bar_vel.groupby_bins("speed", U_bins).max() P_bar_min = P_bar_vel.groupby_bins("speed", U_bins).min() - out = pd.DataFrame((U_hub_mean.to_series(), - U_hat_mean.to_series(), - P_bar_mean.to_series(), - P_bar_std.to_series(), - P_bar_max.to_series(), - P_bar_min.to_series(), - )).T - out.columns = ['U_avg', 'U_avg_power_weighted', - 'P_avg', 'P_std', 'P_max', 'P_min'] - out.index.name = 'U_bins' + device_power_curve = xr.Dataset( + { + "U_avg": U_hub_mean, + "U_avg_power_weighted": U_hat_mean, + "P_avg": P_bar_mean, + "P_std": P_bar_std, + "P_max": P_bar_max, + "P_min": P_bar_min, + } + ) + device_power_curve = device_power_curve.rename({"speed_bins": "U_bins"}) - return out + if to_pandas: + device_power_curve = device_power_curve.to_pandas() + + return device_power_curve def _average_velocity_bins(U, U_hub, bin_size): @@ -314,7 +324,7 @@ def _average_velocity_bins(U, U_hub, bin_size): Returns --------- - xarray.DataArray + U_binned: xarray.DataArray Data grouped into velocity bins. 
""" @@ -322,10 +332,10 @@ def _average_velocity_bins(U, U_hub, bin_size): U_bins = np.arange(0, np.nanmax(U_hub) + bin_size, bin_size) # Group time-ensembles into velocity bins based on hub-height velocity and average - out = U.assign_coords({"time": U_hub}).rename({"time": "speed"}) - out = out.groupby_bins("speed", U_bins).mean() + U_binned = U.assign_coords({"time": U_hub}).rename({"time": "speed"}) + U_binned = U_binned.groupby_bins("speed", U_bins).mean() - return out + return U_binned def _apply_function(function, bnr, U): @@ -351,39 +361,41 @@ def _apply_function(function, bnr, U): applied, grouped into bins according to bnr. """ - if function == 'mean': + if function == "mean": # Average data into 5-10 minute ensembles return xr.DataArray( bnr.mean(abs(U).values), - coords={'range': U.range, - 'time': bnr.mean(U['time'].values)}) - elif function == 'rms': + coords={"range": U.range, "time": bnr.mean(U["time"].values)}, + ) + elif function == "rms": # Reshape tidal velocity - returns (range, ensemble-time, ensemble elements) U_reshaped = bnr.reshape(abs(U).values) # Take root-mean-square U_rms = np.sqrt(np.nanmean(U_reshaped**2, axis=-1)) return xr.DataArray( - U_rms, - coords={'range': U.range, - 'time': bnr.mean(U['time'].values)}) - elif function == 'std': + U_rms, coords={"range": U.range, "time": bnr.mean(U["time"].values)} + ) + elif function == "std": # Standard deviation return xr.DataArray( bnr.standard_deviation(U.values), - coords={'range': U.range, - 'time': bnr.mean(U['time'].values)}) + coords={"range": U.range, "time": bnr.mean(U["time"].values)}, + ) else: raise ValueError( - f"Unknown function {function}. Should be one of 'mean', 'rms', or 'std'") - - -def velocity_profiles(velocity, - hub_height, - water_depth, - sampling_frequency, - window_avg_time=600, - function='mean', - ): + f"Unknown function {function}. 
Should be one of 'mean', 'rms', or 'std'" + ) + + +def velocity_profiles( + velocity, + hub_height, + water_depth, + sampling_frequency, + window_avg_time=600, + function="mean", + to_pandas=True, +): """ Calculates profiles of the mean, root-mean-square (RMS), or standard deviation(std) of velocity. The chosen metric, specified by `function`, @@ -392,10 +404,10 @@ def velocity_profiles(velocity, Parameters ------------- - velocity : pandas.Series or xarray.DataArray ([range,] time) + velocity : numpy ndarray, pandas DataFrame, pandas Series, xarray DataArray, or xarray Dataset 1D or 2D streamwise sea water velocity or sea water speed. hub_height : numeric - Turbine hub height altitude above the seabed. Assumes ADCP depth bins + Turbine hub height altitude above the seabed. Assumes ADCP depth bins are referenced to the seafloor. water_depth : numeric Water depth to seafloor, in same units as velocity `range` coordinate. @@ -405,29 +417,36 @@ def velocity_profiles(velocity, Time averaging window in seconds. Defaults to 600. func : string Function to apply. One of 'mean','rms', or 'std' + to_pandas: bool, optional + Flag to output pandas instead of xarray. Default = True. Returns --------- - pandas.DataFrame + iec_profiles: pandas.DataFrame Average velocity profiles based on ensemble mean velocity. """ - velocity = _check_dtype(velocity, 'velocity') + velocity = convert_to_dataarray(velocity, "velocity") if len(velocity.shape) != 2: - raise ValueError("Velocity should be 2 dimensional and have \ - dimensions of 'time' (temporal) and 'range' (spatial).") + raise ValueError( + "Velocity should be 2 dimensional and have \ + dimensions of 'time' (temporal) and 'range' (spatial)." + ) - if function not in ['mean', 'rms', 'std']: + if function not in ["mean", "rms", "std"]: raise ValueError("`function` must be one of 'mean', 'rms', or 'std'.") + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. 
Got: {type(to_pandas)}") # Streamwise data U = velocity # Create binner - bnr = dolfyn.VelBinner(n_bin=window_avg_time * - sampling_frequency, fs=sampling_frequency) + bnr = dolfyn.VelBinner( + n_bin=window_avg_time * sampling_frequency, fs=sampling_frequency + ) # Take velocity at hub height - mean_hub_vel = bnr.mean(U.sel(range=hub_height, method='nearest').values) + mean_hub_vel = bnr.mean(U.sel(range=hub_height, method="nearest").values) # Apply mean, root-mean-square, or standard deviation U_out = _apply_function(function, bnr, U) @@ -438,147 +457,123 @@ def velocity_profiles(velocity, # Extend top and bottom of profiles to the seafloor and sea surface # Clip off extra depth bins with nans rdx = profiles.isel(speed_bins=0).notnull().sum().values - profiles = profiles.isel(range=slice(None, rdx+1)) + profiles = profiles.isel(range=slice(None, rdx + 1)) # Set seafloor velocity to 0 m/s out_data = np.insert(profiles.data, 0, 0, axis=0) # Set max range to the user-provided water depth - new_range = np.insert(profiles['range'].data[:-1], 0, 0) + new_range = np.insert(profiles["range"].data[:-1], 0, 0) new_range = np.append(new_range, water_depth) # Create a profiles with new range - iec_profiles = xr.DataArray(out_data, coords={'range': new_range, - 'speed_bins': profiles['speed_bins']}) + iec_profiles = xr.DataArray( + out_data, coords={"range": new_range, "speed_bins": profiles["speed_bins"]} + ) # Forward fill to surface - iec_profiles = iec_profiles.ffill('range', limit=None) + iec_profiles = iec_profiles.ffill("range", limit=None) - return iec_profiles.to_pandas() + if to_pandas: + iec_profiles = iec_profiles.to_pandas() + return iec_profiles -def device_efficiency(power, - velocity, - water_density, - capture_area, - hub_height, - sampling_frequency, - window_avg_time=600): + +def device_efficiency( + power, + velocity, + water_density, + capture_area, + hub_height, + sampling_frequency, + window_avg_time=600, + to_pandas=True, +): """ Calculates marine 
energy device efficiency based on IEC/TS 62600-200 Section 9.7. Parameters ------------- - power : pandas.Series or xarray.DataArray (time) + power : numpy ndarray, pandas DataFrame, pandas Series, xarray DataArray, or xarray Dataset Device power output timeseries in Watts. - velocity : pandas.Series or xarray.DataArray ([range,] time) + velocity : numpy ndarray, pandas DataFrame, pandas Series, xarray DataArray, or xarray Dataset 1D or 2D streamwise sea water velocity or sea water speed in m/s. water_density : float, pandas.Series or xarray.DataArray Sea water density in kg/m^3. capture_area : numeric Swept area of marine energy device. hub_height : numeric - Turbine hub height altitude above the seabed. Assumes ADCP depth bins + Turbine hub height altitude above the seabed. Assumes ADCP depth bins are referenced to the seafloor. sampling_frequency : numeric ADCP sampling frequency in Hz. window_avg_time : int, optional Time averaging window in seconds. Defaults to 600. + to_pandas: bool, optional + Flag to output pandas instead of xarray. Default = True. Returns --------- - pandas.Series + device_eta : pandas.Series or xarray.DataArray Device efficiency (power coefficient) in percent. """ # Velocity should be a 2D xarray or pandas array and have dims (range, time) # Power should have a timestamp coordinate/index - power = _check_dtype(power, 'power') - velocity = _check_dtype(velocity, 'velocity') + power = convert_to_dataarray(power, "power") + velocity = convert_to_dataarray(velocity, "velocity") if len(velocity.shape) != 2: - raise ValueError("Velocity should be 2 dimensional and have \ - dimensions of 'time' (temporal) and 'range' (spatial).") + raise ValueError( + "Velocity should be 2 dimensional and have \ + dimensions of 'time' (temporal) and 'range' (spatial)." + ) + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. 
Got: {type(to_pandas)}") # Streamwise data U = abs(velocity) - time = U['time'].values + time = U["time"].values # Power: Interpolate to velocity timeseries - power = _interpolate_power_to_velocity_timeseries(power, U) + power.interp(time=U["time"], method="linear") # Create binner - bnr = dolfyn.VelBinner(n_bin=window_avg_time * - sampling_frequency, fs=sampling_frequency) + bnr = dolfyn.VelBinner( + n_bin=window_avg_time * sampling_frequency, fs=sampling_frequency + ) # Hub-height velocity - mean_hub_vel = xr.DataArray(bnr.mean(U.sel(range=hub_height, method='nearest').values), - coords={'time': bnr.mean(time)}) + mean_hub_vel = xr.DataArray( + bnr.mean(U.sel(range=hub_height, method="nearest").values), + coords={"time": bnr.mean(time)}, + ) vel_hub = _average_velocity_bins(mean_hub_vel, mean_hub_vel, bin_size=0.1) # Water density rho_vel = _calculate_density(water_density, bnr, mean_hub_vel, time) # Bin average power - P_avg = xr.DataArray(bnr.mean(power.values), - coords={'time': bnr.mean(time)}) + P_avg = xr.DataArray(bnr.mean(power.values), coords={"time": bnr.mean(time)}) P_vel = _average_velocity_bins(P_avg, mean_hub_vel, bin_size=0.1) # Theoretical power resource - P_resource = 1/2 * rho_vel * capture_area * vel_hub**3 + P_resource = 1 / 2 * rho_vel * capture_area * vel_hub**3 # Efficiency eta = P_vel / P_resource - out = pd.DataFrame((vel_hub.to_series(), - eta.to_series(), - )).T - out.columns = ['U_avg', 'Efficiency'] - out.index.name = 'U_bins' + device_eta = xr.Dataset({"U_avg": vel_hub, "Efficiency": eta}) + device_eta = device_eta.rename({"speed_bins": "U_bins"}) - return out + if to_pandas: + device_eta = device_eta.to_pandas() - -def _interpolate_power_to_velocity_timeseries(power, U): - """ - Interpolates the power timeseries to match the velocity timeseries time points. - - This function checks if the input power is an xarray DataArray or a pandas Series - with a DatetimeIndex and performs interpolation accordingly. 
If the input power - does not match either of these types, a warning is issued and the original power - timeseries is returned. - - Parameters - ------------- - power : xarray.DataArray or pandas.Series - The device power output timeseries. - U : xarray.DataArray - 2D streamwise sea water velocity or sea water speed. - - Returns - --------- - xarray.DataArray or pandas.Series - Interpolated power timeseries. - - Raises - --------- - Warning - If the input power is not a xarray DataArray or pandas Series with - a DatetimeIndex, a warning is issued stating that the function assumes the - power timestamps match the velocity timestamps. - """ - - if 'xarray' in type(power).__module__: - return power.interp(time=U['time'], method='linear') - elif 'pandas' in type(power).__module__ and isinstance(power.index, pd.DatetimeIndex): - return power.to_xarray().interp(time=U['time'], method='linear') - else: - warnings.warn( - "Assuming `power` timestamps match `velocity` timestamps") - return power + return device_eta def _calculate_density(water_density, bnr, mean_hub_vel, time): """ Calculates the averaged density for the given time period. - This function first checks if the water_density is a scalar or an array. - If it is an array, the function calculates the mean density over the time - period using the binner object 'bnr', and then averages it over velocity bins. + This function first checks if the water_density is a scalar or an array. + If it is an array, the function calculates the mean density over the time + period using the binner object 'bnr', and then averages it over velocity bins. If it is a scalar, it directly returns the input density. 
Parameters @@ -595,13 +590,14 @@ def _calculate_density(water_density, bnr, mean_hub_vel, time): Returns --------- xarray.DataArray or float - The averaged water density over velocity bins if water_density is an array, + The averaged water density over velocity bins if water_density is an array, or the input scalar water_density. """ if np.size(water_density) > 1: - rho_avg = xr.DataArray(bnr.mean(water_density.values), - coords={'time': bnr.mean(time)}) + rho_avg = xr.DataArray( + bnr.mean(water_density.values), coords={"time": bnr.mean(time)} + ) return _average_velocity_bins(rho_avg, mean_hub_vel, bin_size=0.1) else: return water_density diff --git a/mhkit/tidal/resource.py b/mhkit/tidal/resource.py index ef9961780..e6b6d21c4 100644 --- a/mhkit/tidal/resource.py +++ b/mhkit/tidal/resource.py @@ -1,10 +1,11 @@ import numpy as np import math -import pandas as pd -from mhkit.river.resource import exceedance_probability, Froude_number +from mhkit.river.resource import exceedance_probability, Froude_number +from mhkit.utils import convert_to_dataarray + def _histogram(directions, velocities, width_dir, width_vel): - ''' + """ Wrapper around numpy histogram 2D. Used to find joint probability between directions and velocities. Returns joint probability H as [%]. 
@@ -14,9 +15,9 @@ def _histogram(directions, velocities, width_dir, width_vel): Directions in degrees with 0 degrees specified as true north velocities: array-like Velocities in m/s - width_dir: float + width_dir: float Width of directional bins for histogram in degrees - width_vel: float + width_vel: float Width of velocity bins for histogram in m/s Returns ------- @@ -26,17 +27,22 @@ def _histogram(directions, velocities, width_dir, width_vel): List of directional bin edges vel_edges: list List of velocity bin edges - ''' + """ - # Number of directional bins - N_dir = math.ceil(360/width_dir) - # Max bin (round up to nearest integer) + # Number of directional bins + N_dir = math.ceil(360 / width_dir) + # Max bin (round up to nearest integer) vel_max = math.ceil(velocities.max()) # Number of velocity bins - N_vel = math.ceil(vel_max/width_vel) + N_vel = math.ceil(vel_max / width_vel) # 2D Histogram of current speed and direction - H, dir_edges, vel_edges = np.histogram2d(directions, velocities, bins=(N_dir,N_vel), - range=[[0,360],[0,vel_max]], density=True) + H, dir_edges, vel_edges = np.histogram2d( + directions, + velocities, + bins=(N_dir, N_vel), + range=[[0, 360], [0, vel_max]], + density=True, + ) # density = true therefore bin value * bin area summed =1 bin_area = width_dir * width_vel # Convert H values to percent [%] @@ -45,9 +51,9 @@ def _histogram(directions, velocities, width_dir, width_vel): def _normalize_angle(degree): - ''' + """ Normalizes degrees to be between 0 and 360 - + Parameters ---------- degree: int or float @@ -56,28 +62,28 @@ def _normalize_angle(degree): ------- new_degree: float Normalized between 0 and 360 degrees - ''' + """ # Set new degree as remainder - new_degree = degree%360 + new_degree = degree % 360 # Ensure positive - new_degree = (new_degree + 360) % 360 + new_degree = (new_degree + 360) % 360 return new_degree def principal_flow_directions(directions, width_dir): - ''' + """ Calculates principal flow directions for ebb 
and flood cycles - - The weighted average (over the working velocity range of the TEC) - should be considered to be the principal direction of the current, - and should be used for both the ebb and flood cycles to determine - the TEC optimum orientation. + + The weighted average (over the working velocity range of the TEC) + should be considered to be the principal direction of the current, + and should be used for both the ebb and flood cycles to determine + the TEC optimum orientation. Parameters ---------- - directions: pandas.Series or numpy.ndarray + directions: numpy ndarray, pandas DataFrame, pandas Series, xarray DataArray, or xarray Dataset Flow direction in degrees CW from North, from 0 to 360 - width_dir: float + width_dir: float Width of directional bins for histogram in degrees Returns @@ -87,74 +93,79 @@ def principal_flow_directions(directions, width_dir): Notes ----- - One must determine which principal direction is flood and which is + One must determine which principal direction is flood and which is ebb based on knowledge of the measurement site. - ''' + """ - if isinstance(directions, np.ndarray): - directions=pd.Series(directions) - assert(all(directions>=0) and all(directions<=360), - 'flood must be between 0 and 360 degrees') + directions = convert_to_dataarray(directions) + if any(directions < 0) or any(directions > 360): + violating_values = [d for d in directions if d < 0 or d > 360] + raise ValueError( + f"directions must be between 0 and 360 degrees. 
Values out of range: {violating_values}" + ) - # Number of directional bins - N_dir=int(360/width_dir) + # Number of directional bins + N_dir = int(360 / width_dir) # Compute directional histogram - H1, dir_edges = np.histogram(directions, bins=N_dir,range=[0,360], density=True) - # Convert to perecnt - H1 = H1 * 100 # [%] + H1, dir_edges = np.histogram(directions, bins=N_dir, range=[0, 360], density=True) + # Convert to percent + H1 = H1 * 100 # [%] # Determine if there are an even or odd number of bins - odd = bool( N_dir % 2 ) + odd = bool(N_dir % 2) # Shift by 180 degrees and sum if odd: # Then split middle bin counts to left and right - H0to180 = H1[0:N_dir//2] - H180to360 = H1[N_dir//2+1:] - H0to180[-1] += H1[N_dir//2]/2 - H180to360[0] += H1[N_dir//2]/2 - #Add the two + H0to180 = H1[0 : N_dir // 2] + H180to360 = H1[N_dir // 2 + 1 :] + H0to180[-1] += H1[N_dir // 2] / 2 + H180to360[0] += H1[N_dir // 2] / 2 + # Add the two H180 = H0to180 + H180to360 else: - H180 = H1[0:N_dir//2] + H1[N_dir//2:N_dir+1] + H180 = H1[0 : N_dir // 2] + H1[N_dir // 2 : N_dir + 1] # Find the maximum value maxDegreeStacked = H180.argmax() # Shift by 90 to find angles normal to principal direction - floodEbbNormalDegree1 = _normalize_angle(maxDegreeStacked + 90.) - # Find the complimentary angle - floodEbbNormalDegree2 = _normalize_angle(floodEbbNormalDegree1+180.) + floodEbbNormalDegree1 = _normalize_angle(maxDegreeStacked + 90.0) + # Find the complimentary angle + floodEbbNormalDegree2 = _normalize_angle(floodEbbNormalDegree1 + 180.0) # Reset values so that the Degree1 is the smaller angle, and Degree2 the large floodEbbNormalDegree1 = min(floodEbbNormalDegree1, floodEbbNormalDegree2) - floodEbbNormalDegree2 = floodEbbNormalDegree1 + 180. 
+ floodEbbNormalDegree2 = floodEbbNormalDegree1 + 180.0 # Slice directions on the 2 semi circles - d1 = directions[directions.between(floodEbbNormalDegree1, - floodEbbNormalDegree2)] - d2 = directions[~directions.between(floodEbbNormalDegree1, - floodEbbNormalDegree2)] + mask = (directions >= floodEbbNormalDegree1) & (directions <= floodEbbNormalDegree2) + d1 = directions[mask] + d2 = directions[~mask] # Shift second set of of directions to not break between 360 and 0 - d2 -= 180. + d2 -= 180 # Renormalize the points (gets rid of negatives) d2 = _normalize_angle(d2) # Number of bins for semi-circle - n_dir = int(180/width_dir) + n_dir = int(180 / width_dir) # Compute 1D histograms on both semi circles - Hd1, dir1_edges = np.histogram(d1, bins=n_dir,density=True) - Hd2, dir2_edges = np.histogram(d2, bins=n_dir,density=True) - # Convert to perecnt - Hd1 = Hd1 * 100 # [%] - Hd2 = Hd2 * 100 # [%] + Hd1, dir1_edges = np.histogram(d1, bins=n_dir, density=True) + Hd2, dir2_edges = np.histogram(d2, bins=n_dir, density=True) + # Convert to percent + Hd1 = Hd1 * 100 # [%] + Hd2 = Hd2 * 100 # [%] # Principal Directions average of the 2 bins - PrincipalDirection1 = 0.5 * (dir1_edges[Hd1.argmax()]+ dir1_edges[Hd1.argmax()+1]) - PrincipalDirection2 = 0.5 * (dir2_edges[Hd2.argmax()]+ dir2_edges[Hd2.argmax()+1])+180.0 + PrincipalDirection1 = 0.5 * ( + dir1_edges[Hd1.argmax()] + dir1_edges[Hd1.argmax() + 1] + ) + PrincipalDirection2 = ( + 0.5 * (dir2_edges[Hd2.argmax()] + dir2_edges[Hd2.argmax() + 1]) + 180.0 + ) + + return PrincipalDirection1, PrincipalDirection2 - return PrincipalDirection1, PrincipalDirection2 - def _flood_or_ebb(d, flood, ebb): - ''' - Returns a mask which is True for directions on the ebb side of the - midpoints between the flood and ebb directions on the unit circle + """ + Returns a mask which is True for directions on the ebb side of the + midpoints between the flood and ebb directions on the unit circle and False for directions on the Flood side. 
- + Parameters ---------- d: array-like @@ -163,24 +174,23 @@ def _flood_or_ebb(d, flood, ebb): Principal component of flow in the flood direction in degrees ebb: float or int Principal component of flow in the ebb direction in degrees - + Returns ------- is_ebb: boolean array - array of length N which is True for directions on the ebb side + array of length N which is True for directions on the ebb side of the midpoints between flood and ebb on the unit circle and false otherwise. - ''' + """ max_angle = max(ebb, flood) min_angle = min(ebb, flood) - - lower_split = (min_angle + (360 - max_angle + min_angle)/2 ) % 360 + + lower_split = (min_angle + (360 - max_angle + min_angle) / 2) % 360 upper_split = lower_split + 180 - + if lower_split <= ebb < upper_split: is_ebb = ((d < upper_split) & (d >= lower_split)).values else: is_ebb = ~((d < upper_split) & (d >= lower_split)).values - - return is_ebb + return is_ebb diff --git a/mhkit/utils.py b/mhkit/utils.py deleted file mode 100644 index 65ba2b918..000000000 --- a/mhkit/utils.py +++ /dev/null @@ -1,299 +0,0 @@ -from pecos.utils import index_to_datetime -import matplotlib.pyplot as plt -import datetime as dt -from mhkit import qc -import pandas as pd -import numpy as np - - -_matlab = False # Private variable indicating if mhkit is run through matlab - -def get_statistics(data,freq,period=600,vector_channels=[]): - """ - Calculate mean, max, min and stdev statistics of continuous data for a - given statistical window. Default length of statistical window (period) is - based on IEC TS 62600-3:2020 ED1. Also allows calculation of statistics for multiple statistical - windows of continuous data and accounts for vector/directional channels. 
- - Parameters - ------------ - data : pandas DataFrame - Data indexed by datetime with columns of data to be analyzed - freq : float/int - Sample rate of data [Hz] - period : float/int - Statistical window of interest [sec], default = 600 - vector_channels : string or list (optional) - List of vector/directional channel names formatted in deg (0-360) - - Returns - --------- - means,maxs,mins,stdevs : pandas DataFrame - Calculated statistical values from the data, indexed by the first timestamp - """ - # Check data type - assert isinstance(data, pd.DataFrame), 'data must be of type pd.DataFrame' - assert isinstance(freq, (float,int)), 'freq must be of type int or float' - assert isinstance(period, (float,int)), 'freq must be of type int or float' - # catch if vector_channels is not an string array - if isinstance(vector_channels,str): vector_channels = [vector_channels] - assert isinstance(vector_channels, list), 'vector_channels must be a list of strings' - - # Check timestamp using qc module - data.index = data.index.round('1ms') - dataQC = qc.check_timestamp(data,1/freq) - dataQC = dataQC['cleaned_data'] - - # Check to see if data length contains enough data points for statistical window - if len(dataQC)%(period*freq) > 0: - remain = len(dataQC) % (period*freq) - dataQC = dataQC.iloc[0:-int(remain)] - print('WARNING: there were not enough data points in the last statistical period. 
Last '+str(remain)+' points were removed.') - - # Pre-allocate lists - time = [] - means = [] - maxs = [] - mins = [] - stdev = [] - - # Get data chunks to performs stats on - step = period*freq - for i in range(int(len(dataQC)/(period*freq))): - datachunk = dataQC.iloc[i*step:(i+1)*step] - # Check whether there are any NaNs in datachunk - if datachunk.isnull().any().any(): - print('NaNs found in statistical window...check timestamps!') - input('Press to continue') - continue - else: - # Get stats - time.append(datachunk.index.values[0]) # time vector - maxs.append(datachunk.max()) # maxes - mins.append(datachunk.min()) # mins - means.append(datachunk.mean()) # means - stdev.append(datachunk.std()) # standard deviation - # calculate vector averages and std - for v in vector_channels: - vector_avg, vector_std = vector_statistics(datachunk[v]) - means[i][v] = vector_avg # overwrite scalar average for channel - stdev[i][v] = vector_std # overwrite scalar std for channel - - # Convert to DataFrames and set index - means = pd.DataFrame(means,index=time) - maxs = pd.DataFrame(maxs,index=time) - mins = pd.DataFrame(mins,index=time) - stdevs = pd.DataFrame(stdev,index=time) - - return means,maxs,mins,stdevs - -def vector_statistics(data): - """ - Function used to calculate statistics for vector/directional channels based on - routine from Campbell data logger and Yamartino algorithm - - Parameters - ---------- - data : pandas Series, numpy array, list - Vector channel to calculate statistics on [deg, 0-360] - - Returns - ------- - vector_avg : numpy array - Vector mean statistic - vector_std : numpy array - Vector standard deviation statistic - """ - try: data = np.array(data) - except: pass - assert isinstance(data, np.ndarray), 'data must be of type np.ndarray' - - # calculate mean - Ux = sum(np.sin(data*np.pi/180))/len(data) - Uy = sum(np.cos(data*np.pi/180))/len(data) - vector_avg = (90 - np.arctan2(Uy,Ux)*180/np.pi) - if vector_avg<0: vector_avg = vector_avg+360 - 
elif vector_avg>360: vector_avg = vector_avg-360 - # calculate standard deviation - magsum = round((Ux**2 + Uy**2)*1e8)/1e8 # round to 8th decimal place to reduce roundoff error - epsilon = (1-magsum)**0.5 - if not np.isreal(epsilon): # check if epsilon is imaginary (error) - vector_std = 0 - print('WARNING: epsilon contains imaginary value') - else: - vector_std = np.arcsin(epsilon)*(1+0.1547*epsilon**3)*180/np.pi - - return vector_avg, vector_std - -def unwrap_vector(data): - """ - Function used to unwrap vectors into 0-360 deg range - - Parameters - ------------ - data : pandas Series, numpy array, list - Data points to be unwrapped [deg] - - Returns - --------- - data : numpy array - Data points unwrapped between 0-360 deg - """ - # Check data types - try: - data = np.array(data) - except: - pass - assert isinstance(data, np.ndarray), 'data must be of type np.ndarray' - - # Loop through and unwrap points - for i in range(len(data)): - if data[i] < 0: - data[i] = data[i]+360 - elif data[i] > 360: - data[i] = data[i]-360 - if max(data) > 360 or min(data) < 0: - data = unwrap_vector(data) - return data - -def matlab_to_datetime(matlab_datenum): - """ - Convert MATLAB datenum format to Python datetime - - Parameters - ------------ - matlab_datenum : numpy array - MATLAB datenum to be converted - - Returns - --------- - time : DateTimeIndex - Python datetime values - """ - # Check data types - try: - matlab_datenum = np.array(matlab_datenum,ndmin=1) - except: - pass - assert isinstance(matlab_datenum, np.ndarray), 'data must be of type np.ndarray' - - # Pre-allocate - time = [] - # loop through dates and convert - for t in matlab_datenum: - day = dt.datetime.fromordinal(int(t)) - dayfrac = dt.timedelta(days=t%1) - dt.timedelta(days = 366) - time.append(day + dayfrac) - - time = np.array(time) - time = pd.to_datetime(time) - return time - -def excel_to_datetime(excel_num): - """ - Convert Excel datenum format to Python datetime - - Parameters - ------------ - 
excel_num : numpy array - Excel datenums to be converted - - Returns - --------- - time : DateTimeIndex - Python datetime values - """ - # Check data types - try: - excel_num = np.array(excel_num) - except: - pass - assert isinstance(excel_num, np.ndarray), 'data must be of type np.ndarray' - - # Convert to datetime - time = pd.to_datetime('1899-12-30')+pd.to_timedelta(excel_num,'D') - - return time - - -def magnitude_phase(x,y,z=None): - ''' - Retuns magnitude and phase in two or three dimensions. - - Parameters - ---------- - x: array_like - x-component - y: array_like - y-component - z: array_like - z-component defined positive up. (Optional) Default None. - - Returns - ------- - mag: float or array - magnitude of the vector - theta: float or array - radians from the x-axis - phi: float or array - radians from z-axis defined as positive up. Optional: only - returned when z is passed. - ''' - x=np.array(x) - y=np.array(y) - - threeD=False - if not isinstance(z, type(None)): - z=np.array(z) - threeD=True - - assert isinstance(x, (float,int,np.ndarray)) - assert isinstance(y, (float,int,np.ndarray)) - assert isinstance(z, (type(None),float,int,np.ndarray)) - - if threeD: - mag = np.sqrt(x**2 + y**2 + z**2) - theta = np.arctan2(y,x) - phi = np.arctan2(np.sqrt(x**2+y**2),z) - return mag, theta, phi - else: - mag = np.sqrt(x**2 + y**2) - theta = np.arctan2(y, x) - return mag, theta - -def unorm(x, y ,z): - ''' - Calculates the root mean squared value given three arrays. - - Parameters - ---------- - x: array - One input for the root mean squared calculation.(eq. x velocity) - y: array - One input for the root mean squared calculation.(eq. y velocity) - z: array - One input for the root mean squared calculation.(eq. z velocity) - - Returns - ------- - unorm : array - The root mean squared of x, y, and z. - - Example - ------- - If the inputs are [1,2,3], [4,5,6], and [7,8,9] the code take the - cordinationg value from each array and calculates the root mean squared. 
- The resulting output is [ 8.1240384, 9.64365076, 11.22497216]. - ''' - - assert isinstance(x,(np.ndarray, np.float64, pd.Series)), 'x must be an array' - assert isinstance(y,(np.ndarray, np.float64, pd.Series)), 'y must be an array' - assert isinstance(z,(np.ndarray, np.float64, pd.Series)), 'z must be an array' - assert all([len(x) == len(y), len (y) ==len (z)]), ('lengths of arrays must' - +' match') - - xyz = np.array([x,y,z]) - unorm = np.linalg.norm(xyz, axis= 0) - - return unorm - \ No newline at end of file diff --git a/mhkit/utils/__init__.py b/mhkit/utils/__init__.py new file mode 100644 index 000000000..e195d4569 --- /dev/null +++ b/mhkit/utils/__init__.py @@ -0,0 +1,18 @@ +from .time_utils import matlab_to_datetime, excel_to_datetime +from .stat_utils import ( + get_statistics, + vector_statistics, + unwrap_vector, + magnitude_phase, + unorm, +) +from .cache import handle_caching, clear_cache +from .upcrossing import upcrossing, peaks, troughs, heights, periods, custom +from .type_handling import ( + to_numeric_array, + convert_to_dataset, + convert_to_dataarray, + convert_nested_dict_and_pandas, +) + +_matlab = False # Private variable indicating if mhkit is run through matlab diff --git a/mhkit/utils/cache.py b/mhkit/utils/cache.py new file mode 100644 index 000000000..423a12757 --- /dev/null +++ b/mhkit/utils/cache.py @@ -0,0 +1,244 @@ +""" +This module provides functionality for managing cache files to optimize +network requests and computations for handling data. The module focuses +on enabling users to read from and write to cache files, as well as +perform cache clearing operations. Cache files are utilized to store data +temporarily, mitigating the need to re-fetch or recompute the same data multiple +times, which can be especially useful in network-dependent tasks. + +The module consists of two main functions: + +1. `handle_caching`: + This function manages the caching of data. 
It provides options to read from + and write to cache files, depending on whether the data is already provided + or if it needs to be fetched from the cache. If a cache file corresponding + to the given parameters already exists, the function can either load data + from it or clear it based on the parameters passed. It also offers the ability + to store associated metadata along with the data and supports both JSON and + pickle file formats for caching. This function returns the loaded data and + metadata from the cache file, along with the cache file path. + +2. `clear_cache`: + This function enables the clearing of either specific sub-directories or the + entire cache directory, depending on the parameter passed. It removes the + specified directory and then recreates it to ensure future caching tasks can + be executed without any issues. If the specified directory does not exist, + the function prints an indicative message. + +Module Dependencies: +-------------------- + - hashlib: For creating unique filenames based on hashed parameters. + - json: For reading and writing JSON formatted cache files. + - os: For performing operating system dependent tasks like directory creation. + - re: For regular expression operations to match datetime formatted strings. + - shutil: For performing high-level file operations like copying and removal. + - pickle: For reading and writing pickle formatted cache files. + - pandas: For handling data in DataFrame format. + +Author: ssolson +Date: 2023-09-26 +""" + +import hashlib +import json +import os +import re +import shutil +import pickle +import pandas as pd + + +def handle_caching( + hash_params, + cache_dir, + data=None, + metadata=None, + write_json=None, + clear_cache_file=False, +): + """ + Handles caching of data to avoid redundant network requests or + computations. + + The function checks if a cache file exists for the given parameters. 
+ If it does, the function will load data from the cache file, unless + the `clear_cache_file` parameter is set to `True`, in which case the + cache file is cleared. If the cache file does not exist and the + `data` parameter is not `None`, the function will store the + provided data in a cache file. + + Parameters + ---------- + hash_params : str + The parameters to be hashed and used as the filename for the cache file. + cache_dir : str + The directory where the cache files are stored. + data : pandas DataFrame or None + The data to be stored in the cache file. If `None`, the function + will attempt to load data from the cache file. + metadata : dict or None + Metadata associated with the data. This will be stored in the + cache file along with the data. + write_json : str or None + If specified, the cache file will be copied to a file with this name. + clear_cache_file : bool + If `True`, the cache file for the given parameters will be cleared. + + Returns + ------- + data : pandas DataFrame or None + The data loaded from the cache file. If data was provided as a + parameter, the same data will be returned. If the cache file + does not exist and no data was provided, `None` will be returned. + metadata : dict or None + The metadata loaded from the cache file. If metadata was provided + as a parameter, the same metadata will be returned. If the cache + file does not exist and no metadata was provided, `None` will be + returned. + cache_filepath : str + The path to the cache file. 
+ """ + + # Check if 'cdip' is in cache_dir, then use .pkl instead of .json + file_extension = ( + ".pkl" + if "cdip" in cache_dir or "hindcast" in cache_dir or "ndbc" in cache_dir + else ".json" + ) + + # Make cache directory if it doesn't exist + if not os.path.isdir(cache_dir): + os.makedirs(cache_dir) + + # Create a unique filename based on the function parameters + cache_filename = ( + hashlib.md5(hash_params.encode("utf-8")).hexdigest() + file_extension + ) + cache_filepath = os.path.join(cache_dir, cache_filename) + + # If clear_cache_file is True, remove the cache file for this request + if clear_cache_file and os.path.isfile(cache_filepath): + os.remove(cache_filepath) + print(f"Cleared cache for {cache_filepath}") + + # If a cached file exists, load and return the data from the file + if os.path.isfile(cache_filepath) and data is None: + if file_extension == ".json": + with open(cache_filepath, encoding="utf-8") as f: + jsonData = json.load(f) + + # Extract metadata if it exists + if "metadata" in jsonData: + metadata = jsonData.pop("metadata", None) + + # Check if index is datetime formatted + if all( + re.match(r"\d{4}-\d{2}-\d{2} \d{2}:\d{2}:\d{2}", str(dt)) + for dt in jsonData["index"] + ): + data = pd.DataFrame( + jsonData["data"], + index=pd.to_datetime(jsonData["index"]), + columns=jsonData["columns"], + ) + else: + data = pd.DataFrame( + jsonData["data"], + index=jsonData["index"], + columns=jsonData["columns"], + ) + + # Convert the rest to DataFrame + data = pd.DataFrame( + jsonData["data"], + index=pd.to_datetime(jsonData["index"]), + columns=jsonData["columns"], + ) + + elif file_extension == ".pkl": + with open(cache_filepath, "rb") as f: + data, metadata = pickle.load(f) + + if write_json: + shutil.copy(cache_filepath, write_json) + + return data, metadata, cache_filepath + + # If a cached file does not exist and data is provided, + # store the data in a cache file + elif data is not None: + if file_extension == ".json": + # Convert 
DataFrame to python dict + pyData = data.to_dict(orient="split") + # Add metadata to pyData + pyData["metadata"] = metadata + # Check if index is datetime indexed + if isinstance(data.index, pd.DatetimeIndex): + pyData["index"] = [ + dt.strftime("%Y-%m-%d %H:%M:%S") for dt in pyData["index"] + ] + else: + pyData["index"] = list(data.index) + with open(cache_filepath, "w", encoding="utf-8") as f: + json.dump(pyData, f) + + elif file_extension == ".pkl": + with open(cache_filepath, "wb") as f: + pickle.dump((data, metadata), f) + + if write_json: + shutil.copy(cache_filepath, write_json) + + return data, metadata, cache_filepath + # If data is not provided and the cache file doesn't exist, return cache_filepath + return None, None, cache_filepath + + +def clear_cache(specific_dir=None): + """ + Clears the cache. + + The function checks if a specific directory or the entire cache directory + exists. If it does, the function will remove the directory and recreate it. + If the directory does not exist, a message indicating is printed. + + Parameters + ---------- + specific_dir : str or None, optional + Specific sub-directory to clear. If None, the entire cache is cleared. + Default is None. 
+ + Returns + ------- + None + """ + cache_dir = os.path.join(os.path.expanduser("~"), ".cache", "mhkit") + + # Consider generating this from a system folder search + folders = { + "river": "river", + "tidal": "tidal", + "wave": "wave", + "usgs": os.path.join("river", "usgs"), + "noaa": os.path.join("tidal", "noaa"), + "ndbc": os.path.join("wave", "ndbc"), + "cdip": os.path.join("wave", "cdip"), + "hindcast": os.path.join("wave", "hindcast"), + } + + # If specific_dir is provided and matches a key in the folders dictionary, + # use its corresponding value + if specific_dir and specific_dir in folders: + specific_dir = folders[specific_dir] + + # Construct the path to the directory to be cleared + path_to_clear = os.path.join(cache_dir, specific_dir) if specific_dir else cache_dir + + # Check if the directory exists + if os.path.exists(path_to_clear): + # Clear the directory + shutil.rmtree(path_to_clear) + # Recreate the directory after deletion + os.makedirs(path_to_clear) + else: + print(f"The directory {path_to_clear} does not exist.") diff --git a/mhkit/utils/stat_utils.py b/mhkit/utils/stat_utils.py new file mode 100644 index 000000000..f0a7e2994 --- /dev/null +++ b/mhkit/utils/stat_utils.py @@ -0,0 +1,270 @@ +from mhkit import qc +import pandas as pd +import numpy as np + + +def get_statistics(data, freq, period=600, vector_channels=[]): + """ + Calculate mean, max, min and stdev statistics of continuous data for a + given statistical window. Default length of statistical window (period) is + based on IEC TS 62600-3:2020 ED1. Also allows calculation of statistics for multiple statistical + windows of continuous data and accounts for vector/directional channels. 
+ + Parameters + ------------ + data : pandas DataFrame + Data indexed by datetime with columns of data to be analyzed + freq : float/int + Sample rate of data [Hz] + period : float/int + Statistical window of interest [sec], default = 600 + vector_channels : string or list (optional) + List of vector/directional channel names formatted in deg (0-360) + + Returns + --------- + means,maxs,mins,stdevs : pandas DataFrame + Calculated statistical values from the data, indexed by the first timestamp + """ + # Check data type + if not isinstance(data, pd.DataFrame): + raise TypeError(f"data must be of type pd.DataFrame. Got: {type(data)}") + if not isinstance(freq, (float, int)): + raise TypeError(f"freq must be of type int or float. Got: {type(freq)}") + if not isinstance(period, (float, int)): + raise TypeError(f"period must be of type int or float. Got: {type(period)}") + # catch if vector_channels is not an string array + if isinstance(vector_channels, str): + vector_channels = [vector_channels] + if not isinstance(vector_channels, list): + raise TypeError( + f"vector_channels must be a list of strings. Got: {type(vector_channels)}" + ) + + # Check timestamp using qc module + data.index = data.index.round("1ms") + dataQC = qc.check_timestamp(data, 1 / freq) + dataQC = dataQC["cleaned_data"] + + # Check to see if data length contains enough data points for statistical window + if len(dataQC) % (period * freq) > 0: + remain = len(dataQC) % (period * freq) + dataQC = dataQC.iloc[0 : -int(remain)] + print( + "WARNING: there were not enough data points in the last statistical period. Last " + + str(remain) + + " points were removed." 
+ ) + + # Pre-allocate lists + time = [] + means = [] + maxs = [] + mins = [] + stdev = [] + + # Get data chunks to performs stats on + step = period * freq + for i in range(int(len(dataQC) / (period * freq))): + datachunk = dataQC.iloc[i * step : (i + 1) * step] + # Check whether there are any NaNs in datachunk + if datachunk.isnull().any().any(): + print("NaNs found in statistical window...check timestamps!") + input("Press to continue") + continue + else: + # Get stats + time.append(datachunk.index.values[0]) # time vector + maxs.append(datachunk.max()) # maxes + mins.append(datachunk.min()) # mins + means.append(datachunk.mean()) # means + stdev.append(datachunk.std()) # standard deviation + # calculate vector averages and std + for v in vector_channels: + vector_avg, vector_std = vector_statistics(datachunk[v]) + # overwrite scalar average for channel + means[i][v] = vector_avg + stdev[i][v] = vector_std # overwrite scalar std for channel + + # Convert to DataFrames and set index + means = pd.DataFrame(means, index=time) + maxs = pd.DataFrame(maxs, index=time) + mins = pd.DataFrame(mins, index=time) + stdevs = pd.DataFrame(stdev, index=time) + + return means, maxs, mins, stdevs + + +def vector_statistics(data): + """ + Function used to calculate statistics for vector/directional channels based on + routine from Campbell data logger and Yamartino algorithm + + Parameters + ---------- + data : pandas Series, numpy array, list + Vector channel to calculate statistics on [deg, 0-360] + + Returns + ------- + vector_avg : numpy array + Vector mean statistic + vector_std : numpy array + Vector standard deviation statistic + """ + try: + data = np.array(data) + except: + pass + if not isinstance(data, np.ndarray): + raise TypeError(f"data must be of type np.ndarray. 
Got: {type(data)}") + + # calculate mean + Ux = sum(np.sin(data * np.pi / 180)) / len(data) + Uy = sum(np.cos(data * np.pi / 180)) / len(data) + vector_avg = 90 - np.arctan2(Uy, Ux) * 180 / np.pi + if vector_avg < 0: + vector_avg = vector_avg + 360 + elif vector_avg > 360: + vector_avg = vector_avg - 360 + # calculate standard deviation + # round to 8th decimal place to reduce roundoff error + magsum = round((Ux**2 + Uy**2) * 1e8) / 1e8 + epsilon = (1 - magsum) ** 0.5 + if not np.isreal(epsilon): # check if epsilon is imaginary (error) + vector_std = 0 + print("WARNING: epsilon contains imaginary value") + else: + vector_std = np.arcsin(epsilon) * (1 + 0.1547 * epsilon**3) * 180 / np.pi + + return vector_avg, vector_std + + +def unwrap_vector(data): + """ + Function used to unwrap vectors into 0-360 deg range + + Parameters + ------------ + data : pandas Series, numpy array, list + Data points to be unwrapped [deg] + + Returns + --------- + data : numpy array + Data points unwrapped between 0-360 deg + """ + # Check data types + try: + data = np.array(data) + except: + pass + if not isinstance(data, np.ndarray): + raise TypeError(f"data must be of type np.ndarray. Got: {type(data)}") + + # Loop through and unwrap points + for i in range(len(data)): + if data[i] < 0: + data[i] = data[i] + 360 + elif data[i] > 360: + data[i] = data[i] - 360 + if max(data) > 360 or min(data) < 0: + data = unwrap_vector(data) + return data + + +def magnitude_phase(x, y, z=None): + """ + Retuns magnitude and phase in two or three dimensions. + + Parameters + ---------- + x: array_like + x-component + y: array_like + y-component + z: array_like + z-component defined positive up. (Optional) Default None. + + Returns + ------- + mag: float or array + magnitude of the vector + theta: float or array + radians from the x-axis + phi: float or array + radians from z-axis defined as positive up. Optional: only + returned when z is passed. 
+ """ + x = np.array(x) + y = np.array(y) + + threeD = False + if not isinstance(z, type(None)): + z = np.array(z) + threeD = True + + if not isinstance(x, (float, int, np.ndarray)): + raise TypeError(f"x must be of type float, int, or np.ndarray. Got: {type(x)}") + if not isinstance(y, (float, int, np.ndarray)): + raise TypeError(f"y must be of type float, int, or np.ndarray. Got: {type(y)}") + if not isinstance(z, (type(None), float, int, np.ndarray)): + raise TypeError( + f"If specified, z must be of type float, int, or np.ndarray. Got: {type(z)}" + ) + + if threeD: + mag = np.sqrt(x**2 + y**2 + z**2) + theta = np.arctan2(y, x) + phi = np.arctan2(np.sqrt(x**2 + y**2), z) + return mag, theta, phi + else: + mag = np.sqrt(x**2 + y**2) + theta = np.arctan2(y, x) + return mag, theta + + +def unorm(x, y, z): + """ + Calculates the root mean squared value given three arrays. + + Parameters + ---------- + x: array + One input for the root mean squared calculation.(eq. x velocity) + y: array + One input for the root mean squared calculation.(eq. y velocity) + z: array + One input for the root mean squared calculation.(eq. z velocity) + + Returns + ------- + unorm : array + The root mean squared of x, y, and z. + + Example + ------- + If the inputs are [1,2,3], [4,5,6], and [7,8,9] the code take the + cordinationg value from each array and calculates the root mean squared. + The resulting output is [ 8.1240384, 9.64365076, 11.22497216]. + """ + + if not isinstance(x, (np.ndarray, np.float64, pd.Series)): + raise TypeError( + f"x must be of type np.ndarray, np.float64, or pd.Series. Got: {type(x)}" + ) + if not isinstance(y, (np.ndarray, np.float64, pd.Series)): + raise TypeError( + f"y must be of type np.ndarray, np.float64, or pd.Series. Got: {type(y)}" + ) + if not isinstance(z, (np.ndarray, np.float64, pd.Series)): + raise TypeError( + f"z must be of type np.ndarray, np.float64, or pd.Series. 
Got: {type(z)}" + ) + if not all([len(x) == len(y), len(y) == len(z)]): + raise ValueError("lengths of arrays must match") + + xyz = np.array([x, y, z]) + unorm = np.linalg.norm(xyz, axis=0) + + return unorm diff --git a/mhkit/utils/time_utils.py b/mhkit/utils/time_utils.py new file mode 100644 index 000000000..643219c9b --- /dev/null +++ b/mhkit/utils/time_utils.py @@ -0,0 +1,66 @@ +import datetime as dt +import pandas as pd +import numpy as np + + +def matlab_to_datetime(matlab_datenum): + """ + Convert MATLAB datenum format to Python datetime + + Parameters + ------------ + matlab_datenum : numpy array + MATLAB datenum to be converted + + Returns + --------- + time : DateTimeIndex + Python datetime values + """ + # Check data types + try: + matlab_datenum = np.array(matlab_datenum, ndmin=1) + except: + pass + if not isinstance(matlab_datenum, np.ndarray): + raise TypeError(f"data must be of type np.ndarray. Got: {type(data)}") + + # Pre-allocate + time = [] + # loop through dates and convert + for t in matlab_datenum: + day = dt.datetime.fromordinal(int(t)) + dayfrac = dt.timedelta(days=t % 1) - dt.timedelta(days=366) + time.append(day + dayfrac) + + time = np.array(time) + time = pd.to_datetime(time) + return time + + +def excel_to_datetime(excel_num): + """ + Convert Excel datenum format to Python datetime + + Parameters + ------------ + excel_num : numpy array + Excel datenums to be converted + + Returns + --------- + time : DateTimeIndex + Python datetime values + """ + # Check data types + try: + excel_num = np.array(excel_num) + except: + pass + if not isinstance(excel_num, np.ndarray): + raise TypeError(f"excel_num must be of type np.ndarray. 
Got: {type(excel_num)}") + + # Convert to datetime + time = pd.to_datetime("1899-12-30") + pd.to_timedelta(excel_num, "D") + + return time diff --git a/mhkit/utils/type_handling.py b/mhkit/utils/type_handling.py new file mode 100644 index 000000000..2b6c5b920 --- /dev/null +++ b/mhkit/utils/type_handling.py @@ -0,0 +1,211 @@ +import numpy as np +import pandas as pd +import xarray as xr + + +def to_numeric_array(data, name): + """ + Convert input data to a numeric array, ensuring all elements are numeric. + """ + if isinstance(data, (list, np.ndarray, pd.Series, xr.DataArray)): + data = np.asarray(data) + if not np.issubdtype(data.dtype, np.number): + raise TypeError( + (f"{name} must contain numeric data." + f" Got data type: {data.dtype}") + ) + else: + raise TypeError( + ( + f"{name} must be a list, np.ndarray, pd.Series," + + f" or xr.DataArray. Got: {type(data)}" + ) + ) + return data + + +def convert_to_dataset(data, name="data"): + """ + Converts the given data to an xarray.Dataset. + + This function is designed to handle inputs that can be either a pandas DataFrame, a pandas Series, + an xarray DataArray, or an xarray Dataset. It ensures that the output is consistently an xarray.Dataset. + + Parameters + ---------- + data: pandas Series, pandas DataFrame, xarray DataArray, or xarray Dataset + The data to be converted. + + name: str (Optional) + The name to assign to the data variable in case the input is an xarray DataArray without a name. + Default value is 'data'. + + Returns + ------- + xarray.Dataset + The input data converted to an xarray.Dataset. If the input is already an xarray.Dataset, + it is returned as is. 
+ + Examples + -------- + >>> df = pd.DataFrame({'A': [1, 2, 3], 'B': [4, 5, 6]}) + >>> ds = convert_to_dataset(df) + >>> type(ds) + + + >>> series = pd.Series([1, 2, 3], name='C') + >>> ds = convert_to_dataset(series) + >>> type(ds) + + + >>> data_array = xr.DataArray([1, 2, 3]) + >>> ds = convert_to_dataset(data_array, name='D') + >>> type(ds) + + """ + if not isinstance(data, (pd.DataFrame, pd.Series, xr.DataArray, xr.Dataset)): + raise TypeError( + "Input data must be of type pandas.DataFrame, pandas.Series, " + "xarray.DataArray, or xarray.Dataset." + f"Got {type(data)}." + ) + + if not isinstance(name, str): + raise TypeError("The 'name' parameter must be a string" f"Got {type(name)}.") + + # Takes data that could be pd.DataFrame, pd.Series, xr.DataArray, or + # xr.Dataset and converts it to xr.Dataset + if isinstance(data, pd.DataFrame): + # xr.Dataset(data) is drastically faster (1e1 - 1e2x faster) than using pd.DataFrame.to_xarray() + data = xr.Dataset(data) + + if isinstance(data, pd.Series): + # Converting to a DataArray then to a dataset makes the variable and + # dimension naming cleaner than going straight to a Dataset with + # xr.Dataset(pd.Series) + data = xr.DataArray(data) + + if isinstance(data, xr.DataArray): + # xr.DataArray.to_dataset() breaks if the data variable is unnamed + if data.name == None: + data.name = name + data = data.to_dataset() + + return data + + +def convert_to_dataarray(data, name="data"): + """ + Converts the given data to an xarray.DataArray. + + This function is designed to handle inputs that can be either a numpy ndarray, pandas Series, + or an xarray DataArray. For convenience, pandas DataFrame and xarray Dataset can also be input + but may only contain a single variable. The function ensures that the output is consistently + an xarray.DataArray. + + Parameters + ---------- + data: numpy ndarray, pandas DataFrame, pandas Series, xarray DataArray, or xarray Dataset + The data to be converted. 
+ + name: str (Optional) + The name to overwrite the name of the input data variable for pandas or xarray input. + Default value is 'data'. + + Returns + ------- + xarray.DataArray + The input data converted to an xarray.DataArray. If the input is already an xarray.DataArray, + it is returned as is. + + Examples + -------- + >>> df = pd.DataFrame({'A': [1, 2, 3]}) + >>> da = convert_to_dataarray(df) + >>> type(da) + + + >>> series = pd.Series([1, 2, 3], name='C') + >>> da = convert_to_dataarray(series) + >>> type(da) + + + >>> data_array = xr.DataArray([1, 2, 3]) + >>> da = convert_to_dataarray(data_array, name='D') + >>> type(da) + + """ + if not isinstance( + data, (np.ndarray, pd.DataFrame, pd.Series, xr.DataArray, xr.Dataset) + ): + raise TypeError( + "Input data must be of type np.ndarray, pandas.DataFrame, pandas.Series, " + f"xarray.DataArray, or xarray.Dataset. Got {type(data)}" + ) + + if not isinstance(name, str): + raise TypeError(f"The 'name' parameter must be a string. Got {type(name)}") + + # Checks pd.DataFrame input and converts to pd.Series if possible + if isinstance(data, pd.DataFrame): + if data.shape[1] > 1: + raise ValueError( + "If the input data is a pd.DataFrame or xr.Dataset, it must contain one variable. Got {data.shape[1]}" + ) + else: + # use iloc instead of squeeze. For DataFrames/Series with only a + # single value, squeeze returns a scalar, which is unexpected. + # iloc will return a Series as expected + data = data.iloc[:, 0] + + # Checks xr.Dataset input and converts to xr.DataArray if possible + if isinstance(data, xr.Dataset): + keys = list(data.keys()) + if len(keys) > 1: + raise ValueError( + "If the input data is a pd.DataFrame or xr.Dataset, it must contain one variable. 
Got {len(data.keys())}" + ) + else: + data = data.to_array() + data = data.sel( + variable=keys[0] + ) # removes the variable dimension, further simplifying the dataarray + + # Converts pd.Series to xr.DataArray + if isinstance(data, pd.Series): + data = data.to_xarray() + + # Converts np.ndarray to xr.DataArray. Assigns a simple 0-based dimension named index + if isinstance(data, np.ndarray): + data = xr.DataArray( + data=data, dims="index", coords={"index": np.arange(len(data))} + ) + + # If there's no data name, add one to prevent issues calling or converting the dataArray later one + if data.name == None: + data.name = name + + return data + + +def convert_nested_dict_and_pandas(data): + """ + Recursively searches inside nested dictionaries for pandas DataFrames to + convert to xarray Datasets. Typically called by wave.io functions that read + SWAN, WEC-Sim, CDIP, NDBC data. + + Parameters + ---------- + data: dictionary of dictionaries and pandas DataFrames + + Returns + ------- + data : dictionary of dictionaries and xarray Datasets + + """ + for key in data.keys(): + if isinstance(data[key], pd.DataFrame): + data[key] = convert_to_dataset(data[key]) + elif isinstance(data[key], dict): + data[key] = convert_nested_dict_and_pandas(data[key]) + + return data diff --git a/mhkit/utils/upcrossing.py b/mhkit/utils/upcrossing.py new file mode 100644 index 000000000..5993d6544 --- /dev/null +++ b/mhkit/utils/upcrossing.py @@ -0,0 +1,250 @@ +""" +Upcrossing Analysis Functions +============================= +This module contains a collection of functions that facilitate upcrossing +analyses. + +Key Functions: +-------------- +- `upcrossing`: Finds the zero upcrossing points. + +- `peaks`: Finds the peaks between zero crossings. + +- `troughs`: Finds the troughs between zero crossings. + +- `heights`: Calculates the height between zero crossings. + +- `periods`: Calculates the period between zero crossings. 
+ +- `custom`: Applies a custom, user-defined function between zero crossings. + +Dependencies: +------------- +- numpy: Data analysis + +Author: +------- +mbruggs +akeeste + +Date: +----- +2023-10-10 + + +""" + +import numpy as np + + +def _apply(t, data, f, inds): + if inds is None: + inds = upcrossing(t, data) + + n = inds.size - 1 + + vals = np.empty(n) + for i in range(n): + vals[i] = f(inds[i], inds[i + 1]) + + return vals + + +def upcrossing(t, data): + """ + Finds the zero upcrossing points. + + Parameters + ---------- + t: np.array + Time array. + data: np.array + Signal time series. + + Returns + ------- + inds: np.array + Zero crossing indices + """ + # Check data types + if not isinstance(t, np.ndarray): + raise TypeError(f"t must be of type np.ndarray. Got: {type(t)}") + if not isinstance(data, np.ndarray): + raise TypeError(f"data must be of type np.ndarray. Got: {type(data)}") + if len(data.shape) != 1: + raise ValueError("only 1D data supported, try calling squeeze()") + + # eliminate zeros + zeroMask = data == 0 + data[zeroMask] = 0.5 * np.min(np.abs(data)) + + # zero up-crossings + diff = np.diff(np.sign(data)) + zeroUpCrossings_mask = (diff == 2) | (diff == 1) + zeroUpCrossings_index = np.where(zeroUpCrossings_mask)[0] + + return zeroUpCrossings_index + + +def peaks(t, data, inds=None): + """ + Finds the peaks between zero crossings. + + Parameters + ---------- + t: np.array + Time array. + data: np.array + Signal time-series. + inds: np.array + Optional indices for the upcrossing. Useful + when using several of the upcrossing methods + to avoid repeating the upcrossing analysis + each time. + + Returns + ------- + peaks: np.array + Peak values of the time-series + + """ + # Check data types + if not isinstance(t, np.ndarray): + raise TypeError(f"t must be of type np.ndarray. Got: {type(t)}") + if not isinstance(data, np.ndarray): + raise TypeError(f"data must be of type np.ndarray. 
Got: {type(data)}") + + return _apply(t, data, lambda ind1, ind2: np.max(data[ind1:ind2]), inds) + + +def troughs(t, data, inds=None): + """ + Finds the troughs between zero crossings. + + Parameters + ---------- + t: np.array + Time array. + data: np.array + Signal time-series. + inds: np.array + Optional indices for the upcrossing. Useful + when using several of the upcrossing methods + to avoid repeating the upcrossing analysis + each time. + + Returns + ------- + troughs: np.array + Trough values of the time-series + + """ + # Check data types + if not isinstance(t, np.ndarray): + raise TypeError(f"t must be of type np.ndarray. Got: {type(t)}") + if not isinstance(data, np.ndarray): + raise TypeError(f"data must be of type np.ndarray. Got: {type(data)}") + + return _apply(t, data, lambda ind1, ind2: np.min(data[ind1:ind2]), inds) + + +def heights(t, data, inds=None): + """ + Calculates the height between zero crossings. + + The height is defined as the max value - min value + between the zero crossing points. + + Parameters + ---------- + t: np.array + Time array. + data: np.array + Signal time-series. + inds: np.array + Optional indices for the upcrossing. Useful + when using several of the upcrossing methods + to avoid repeating the upcrossing analysis + each time. + + Returns + ------- + heights: np.array + Height values of the time-series + """ + # Check data types + if not isinstance(t, np.ndarray): + raise TypeError(f"t must be of type np.ndarray. Got: {type(t)}") + if not isinstance(data, np.ndarray): + raise TypeError(f"data must be of type np.ndarray. Got: {type(data)}") + + def func(ind1, ind2): + return np.max(data[ind1:ind2]) - np.min(data[ind1:ind2]) + + return _apply(t, data, func, inds) + + +def periods(t, data, inds=None): + """ + Calculates the period between zero crossings. + + Parameters + ---------- + t: np.array + Time array. + data: np.array + Signal time-series. + inds: np.array + Optional indices for the upcrossing. 
Useful + when using several of the upcrossing methods + to avoid repeating the upcrossing analysis + each time. + + Returns + ------- + periods: np.array + Period values of the time-series + """ + # Check data types + if not isinstance(t, np.ndarray): + raise TypeError(f"t must be of type np.ndarray. Got: {type(t)}") + if not isinstance(data, np.ndarray): + raise TypeError(f"data must be of type np.ndarray. Got: {type(data)}") + + return _apply(t, data, lambda ind1, ind2: t[ind2] - t[ind1], inds) + + +def custom(t, data, func, inds=None): + """ + Applies a custom function to the timeseries data between upcrossing points. + + Parameters + ---------- + t: np.array + Time array. + data: np.array + Signal time-series. + func: f(ind1, ind2) -> np.array + Function to apply between the zero crossing periods + given t[ind1], t[ind2], where ind1 < ind2, correspond + to the start and end of an upcrossing section. + inds: np.array + Optional indices for the upcrossing. Useful + when using several of the upcrossing methods + to avoid repeating the upcrossing analysis + each time. + + Returns + ------- + values: np.array + Custom values of the time-series + """ + # Check data types + if not isinstance(t, np.ndarray): + raise TypeError(f"t must be of type np.ndarray. Got: {type(t)}") + if not isinstance(data, np.ndarray): + raise TypeError(f"data must be of type np.ndarray. 
Got: {type(data)}") + if not callable(func): + raise ValueError("func must be callable") + + return _apply(t, data, func, inds) diff --git a/mhkit/wave/__init__.py b/mhkit/wave/__init__.py index 3a963ced8..f84c667cd 100644 --- a/mhkit/wave/__init__.py +++ b/mhkit/wave/__init__.py @@ -2,4 +2,4 @@ from mhkit.wave import io from mhkit.wave import graphics from mhkit.wave import performance -from mhkit.wave import contours \ No newline at end of file +from mhkit.wave import contours diff --git a/mhkit/wave/contours.py b/mhkit/wave/contours.py index 0574573f9..905c560b8 100644 --- a/mhkit/wave/contours.py +++ b/mhkit/wave/contours.py @@ -6,11 +6,16 @@ import scipy.stats as stats import scipy.interpolate as interp import numpy as np +import warnings +from mhkit.utils import to_numeric_array +import matplotlib -### Contours -def environmental_contours(x1, x2, sea_state_duration, return_period, - method, **kwargs): +mpl_version = tuple(map(int, matplotlib.__version__.split("."))) + + +# Contours +def environmental_contours(x1, x2, sea_state_duration, return_period, method, **kwargs): """ Returns a Dictionary of x1 and x2 components for each contour method passed. 
A method may be one of the following: @@ -20,9 +25,9 @@ def environmental_contours(x1, x2, sea_state_duration, return_period, Parameters ---------- - x1: array + x1: list, np.ndarray, pd.Series, xr.DataArray Component 1 data - x2: array + x2: list, np.ndarray, pd.Series, xr.DataArray Component 2 data sea_state_duration : int or float `x1` and `x2` averaging period in seconds @@ -73,24 +78,26 @@ def environmental_contours(x1, x2, sea_state_duration, return_period, copulas: Dictionary Dictionary of x1 and x2 copula components for each copula method """ - try: - x1 = np.array(x1) - except: - pass - try: - x2 = np.array(x2) - except: - pass - assert isinstance(x1, np.ndarray), 'x1 must be of type np.ndarray' - assert isinstance(x2, np.ndarray), 'x2 must be of type np.ndarray' - assert isinstance(sea_state_duration, (int, float)), ( - 'sea_state_duration must be of type int or float') - assert isinstance(return_period, (int, float, np.ndarray)), ( - 'return_period must be of type int, float, or array') + x1 = to_numeric_array(x1, "x1") + x2 = to_numeric_array(x2, "x2") + if not isinstance(x1, np.ndarray) or x1.ndim == 0: + raise TypeError(f"x1 must be a non-scalar array. Got: {type(x1)}") + if not isinstance(x2, np.ndarray) or x2.ndim == 0: + raise TypeError(f"x2 must be a non-scalar array. Got: {type(x2)}") + if len(x1) != len(x2): + raise ValueError("The lengths of x1 and x2 must be equal.") + if not isinstance(sea_state_duration, (int, float)): + raise TypeError( + f"sea_state_duration must be of type int or float. Got: {type(sea_state_duration)}" + ) + if not isinstance(return_period, (int, float, np.ndarray)): + raise TypeError( + f"return_period must be of type int, float, or np.ndarray. Got: {type(return_period)}" + ) bin_val_size = kwargs.get("bin_val_size", 0.25) nb_steps = kwargs.get("nb_steps", 1000) - initial_bin_max_val = kwargs.get("initial_bin_max_val", 1.) 
+ initial_bin_max_val = kwargs.get("initial_bin_max_val", 1.0) min_bin_count = kwargs.get("min_bin_count", 40) bandwidth = kwargs.get("bandwidth", None) Ndata_bivariate_KDE = kwargs.get("Ndata_bivariate_KDE", 100) @@ -100,38 +107,56 @@ def environmental_contours(x1, x2, sea_state_duration, return_period, PCA_bin_size = kwargs.get("PCA_bin_size", 250) return_fit = kwargs.get("return_fit", False) - assert isinstance(PCA, (dict, type(None))), ( - 'If specified PCA must be a dict') - assert isinstance(PCA_bin_size, int), 'PCA_bin_size must be of type int' - assert isinstance(return_fit, bool), 'return_fit must be of type bool' - assert isinstance(bin_val_size, (int, float)), ( - 'bin_val_size must be of type int or float') - assert isinstance(nb_steps, int), 'nb_steps must be of type int' - assert isinstance(min_bin_count, int), ('min_bin_count must be of ' - + 'type int') - assert isinstance(initial_bin_max_val, (int, float)), ( - 'initial_bin_max_val must be of type int or float') - if bandwidth == None: - assert(not 'bivariate_KDE' in method), ( - 'Must specify keyword bandwidth with bivariate KDE method') + if not isinstance(max_x1, (int, float, type(None))): + raise TypeError(f"If specified, max_x1 must be a dict. Got: {type(PCA)}") + if not isinstance(max_x2, (int, float, type(None))): + raise TypeError(f"If specified, max_x2 must be a dict. Got: {type(PCA)}") + if not isinstance(PCA, (dict, type(None))): + raise TypeError(f"If specified, PCA must be a dict. Got: {type(PCA)}") + if not isinstance(PCA_bin_size, int): + raise TypeError(f"PCA_bin_size must be of type int. Got: {type(PCA_bin_size)}") + if not isinstance(return_fit, bool): + raise TypeError(f"return_fit must be of type bool. Got: {type(return_fit)}") + if not isinstance(bin_val_size, (int, float)): + raise TypeError( + f"bin_val_size must be of type int or float. Got: {type(bin_val_size)}" + ) + if not isinstance(nb_steps, int): + raise TypeError(f"nb_steps must be of type int. 
Got: {type(nb_steps)}") + if not isinstance(min_bin_count, int): + raise TypeError( + f"min_bin_count must be of type int. Got: {type(min_bin_count)}" + ) + if not isinstance(initial_bin_max_val, (int, float)): + raise TypeError( + f"initial_bin_max_val must be of type int or float. Got: {type(initial_bin_max_val)}" + ) + if "bivariate_KDE" in method and bandwidth == None: + raise TypeError( + f"Must specify keyword bandwidth with bivariate KDE method. Got: {type(bandwidth)}" + ) if isinstance(method, str): method = [method] - assert (len(set(method)) == len(method)), ( - 'Can only pass a unique ' - + 'method once per function call. Consider wrapping this ' - + 'function in a for loop to investage variations on the same method') - - method_class = {'PCA': 'parametric', - 'gaussian': 'parametric', - 'gumbel': 'parametric', - 'clayton': 'parametric', - 'rosenblatt': 'parametric', - 'nonparametric_gaussian': 'nonparametric', - 'nonparametric_clayton': 'nonparametric', - 'nonparametric_gumbel': 'nonparametric', - 'bivariate_KDE': 'KDE', - 'bivariate_KDE_log': 'KDE'} + if not (len(set(method)) == len(method)): + raise ValueError( + f"Can only pass a unique " + + "method once per function call. 
Consider wrapping this " + + "function in a for loop to investage variations on the same method" + ) + + method_class = { + "PCA": "parametric", + "gaussian": "parametric", + "gumbel": "parametric", + "clayton": "parametric", + "rosenblatt": "parametric", + "nonparametric_gaussian": "nonparametric", + "nonparametric_clayton": "nonparametric", + "nonparametric_gumbel": "nonparametric", + "bivariate_KDE": "KDE", + "bivariate_KDE_log": "KDE", + } classification = [] methods = method @@ -142,95 +167,128 @@ def environmental_contours(x1, x2, sea_state_duration, return_period, fit_parametric = None fit_nonparametric = None component_1 = None - if 'parametric' in classification: - (para_dist_1, para_dist_2, mean_cond, std_cond) = ( - _copula_parameters(x1, x2, min_bin_count, - initial_bin_max_val, bin_val_size)) + if "parametric" in classification: + (para_dist_1, para_dist_2, mean_cond, std_cond) = _copula_parameters( + x1, x2, min_bin_count, initial_bin_max_val, bin_val_size + ) - x_quantile = fit['x_quantile'] + x_quantile = fit["x_quantile"] a = para_dist_1[0] c = para_dist_1[1] loc = para_dist_1[2] scale = para_dist_1[3] - component_1 = stats.exponweib.ppf( - x_quantile, a, c, loc=loc, scale=scale) + component_1 = stats.exponweib.ppf(x_quantile, a, c, loc=loc, scale=scale) fit_parametric = fit - fit_parametric['para_dist_1'] = para_dist_1 - fit_parametric['para_dist_2'] = para_dist_2 - fit_parametric['mean_cond'] = mean_cond - fit_parametric['std_cond'] = std_cond + fit_parametric["para_dist_1"] = para_dist_1 + fit_parametric["para_dist_2"] = para_dist_2 + fit_parametric["mean_cond"] = mean_cond + fit_parametric["std_cond"] = std_cond if PCA == None: PCA = fit_parametric - if 'nonparametric' in classification: - (nonpara_dist_1, nonpara_dist_2, nonpara_pdf_2) = ( - _nonparametric_copula_parameters(x1, x2, nb_steps=nb_steps)) + if "nonparametric" in classification: + ( + nonpara_dist_1, + nonpara_dist_2, + nonpara_pdf_2, + ) = _nonparametric_copula_parameters(x1, x2, 
nb_steps=nb_steps) fit_nonparametric = fit - fit_nonparametric['nonpara_dist_1'] = nonpara_dist_1 - fit_nonparametric['nonpara_dist_2'] = nonpara_dist_2 - fit_nonparametric['nonpara_pdf_2'] = nonpara_pdf_2 - - copula_functions = {'PCA': - {'func': PCA_contour, - 'vals': (x1, x2, PCA, {'nb_steps': nb_steps, - 'return_fit': return_fit, - 'bin_size': PCA_bin_size})}, - 'gaussian': - {'func': _gaussian_copula, - 'vals': (x1, x2, fit_parametric, component_1, - {'return_fit': return_fit})}, - 'gumbel': - {'func': _gumbel_copula, - 'vals': (x1, x2, fit_parametric, component_1, - nb_steps, {'return_fit': return_fit})}, - 'clayton': - {'func': _clayton_copula, - 'vals': (x1, x2, fit_parametric, component_1, - {'return_fit': return_fit})}, - 'rosenblatt': - {'func': _rosenblatt_copula, - 'vals': (x1, x2, fit_parametric, component_1, - {'return_fit': return_fit})}, - 'nonparametric_gaussian': - {'func': _nonparametric_gaussian_copula, - 'vals': (x1, x2, fit_nonparametric, nb_steps, - {'return_fit': return_fit})}, - 'nonparametric_clayton': - {'func': _nonparametric_clayton_copula, - 'vals': (x1, x2, fit_nonparametric, nb_steps, - {'return_fit': return_fit})}, - 'nonparametric_gumbel': - {'func': _nonparametric_gumbel_copula, - 'vals': (x1, x2, fit_nonparametric, nb_steps, - {'return_fit': return_fit})}, - 'bivariate_KDE': - {'func': _bivariate_KDE, - 'vals': (x1, x2, bandwidth, fit, nb_steps, - Ndata_bivariate_KDE, - {'max_x1': max_x1, 'max_x2': max_x2, - 'return_fit': return_fit})}, - 'bivariate_KDE_log': - {'func': _bivariate_KDE, - 'vals': (x1, x2, bandwidth, fit, nb_steps, - Ndata_bivariate_KDE, - {'max_x1': max_x1, 'max_x2': max_x2, - 'log_transform': True, - 'return_fit': return_fit})}, - } + fit_nonparametric["nonpara_dist_1"] = nonpara_dist_1 + fit_nonparametric["nonpara_dist_2"] = nonpara_dist_2 + fit_nonparametric["nonpara_pdf_2"] = nonpara_pdf_2 + + copula_functions = { + "PCA": { + "func": PCA_contour, + "vals": ( + x1, + x2, + PCA, + { + "nb_steps": nb_steps, + 
"return_fit": return_fit, + "bin_size": PCA_bin_size, + }, + ), + }, + "gaussian": { + "func": _gaussian_copula, + "vals": (x1, x2, fit_parametric, component_1, {"return_fit": return_fit}), + }, + "gumbel": { + "func": _gumbel_copula, + "vals": ( + x1, + x2, + fit_parametric, + component_1, + nb_steps, + {"return_fit": return_fit}, + ), + }, + "clayton": { + "func": _clayton_copula, + "vals": (x1, x2, fit_parametric, component_1, {"return_fit": return_fit}), + }, + "rosenblatt": { + "func": _rosenblatt_copula, + "vals": (x1, x2, fit_parametric, component_1, {"return_fit": return_fit}), + }, + "nonparametric_gaussian": { + "func": _nonparametric_gaussian_copula, + "vals": (x1, x2, fit_nonparametric, nb_steps, {"return_fit": return_fit}), + }, + "nonparametric_clayton": { + "func": _nonparametric_clayton_copula, + "vals": (x1, x2, fit_nonparametric, nb_steps, {"return_fit": return_fit}), + }, + "nonparametric_gumbel": { + "func": _nonparametric_gumbel_copula, + "vals": (x1, x2, fit_nonparametric, nb_steps, {"return_fit": return_fit}), + }, + "bivariate_KDE": { + "func": _bivariate_KDE, + "vals": ( + x1, + x2, + bandwidth, + fit, + nb_steps, + Ndata_bivariate_KDE, + {"max_x1": max_x1, "max_x2": max_x2, "return_fit": return_fit}, + ), + }, + "bivariate_KDE_log": { + "func": _bivariate_KDE, + "vals": ( + x1, + x2, + bandwidth, + fit, + nb_steps, + Ndata_bivariate_KDE, + { + "max_x1": max_x1, + "max_x2": max_x2, + "log_transform": True, + "return_fit": return_fit, + }, + ), + }, + } copulas = {} for method in methods: - vals = copula_functions[method]['vals'] + vals = copula_functions[method]["vals"] if return_fit: - component_1, component_2, fit = copula_functions[method]['func']( - *vals) - copulas[f'{method}_fit'] = fit + component_1, component_2, fit = copula_functions[method]["func"](*vals) + copulas[f"{method}_fit"] = fit else: - component_1, component_2 = copula_functions[method]['func'](*vals) - copulas[f'{method}_x1'] = component_1 - copulas[f'{method}_x2'] = 
component_2 + component_1, component_2 = copula_functions[method]["func"](*vals) + copulas[f"{method}_x1"] = component_1 + copulas[f"{method}_x2"] = component_2 return copulas @@ -259,9 +317,9 @@ def PCA_contour(x1, x2, fit, kwargs): Parameters ---------- - x1: numpy array + x1: list, np.ndarray, pd.Series, xr.DataArray Component 1 data - x2: numpy array + x2: list, np.ndarray, pd.Series, xr.DataArray Component 2 data fit: dict Dictionary of the iso-probability results. May additionally @@ -289,7 +347,7 @@ def PCA_contour(x1, x2, fit, kwargs): Calculated x2 values along the contour boundary following return to original input orientation. fit: dict (optional) - principal component analysis dictionary + principal component analysis dictionary Keys: ----- 'principal_axes': sign corrected PCA axes @@ -299,63 +357,68 @@ def PCA_contour(x1, x2, fit, kwargs): 'sigma_param' : fit to _sig_fits """ - try: - x1 = np.array(x1) - except: - pass - try: - x2 = np.array(x2) - except: - pass - assert isinstance(x1, np.ndarray), 'x1 must be of type np.ndarray' - assert isinstance(x2, np.ndarray), 'x2 must be of type np.ndarray' + x1 = to_numeric_array(x1, "x1") + x2 = to_numeric_array(x2, "x2") + if not isinstance(x1, np.ndarray) or x1.ndim == 0: + raise TypeError(f"x1 must be a non-scalar array. Got: {type(x1)}") + if not isinstance(x2, np.ndarray) or x2.ndim == 0: + raise TypeError(f"x2 must be a non-scalar array. Got: {type(x2)}") + if len(x1) != len(x2): + raise ValueError("The lengths of x1 and x2 must be equal.") bin_size = kwargs.get("bin_size", 250) nb_steps = kwargs.get("nb_steps", 1000) return_fit = kwargs.get("return_fit", False) - assert isinstance(bin_size, int), 'bin_size must be of type int' - assert isinstance(nb_steps, int), 'nb_steps must be of type int' - assert isinstance(return_fit, bool), 'return_fit must be of type bool' + if not isinstance(bin_size, int): + raise TypeError(f"bin_size must be of type int. 
Got: {type(bin_size)}") + if not isinstance(nb_steps, int): + raise TypeError(f"nb_steps must be of type int. Got: {type(nb_steps)}") + if not isinstance(return_fit, bool): + raise TypeError(f"return_fit must be of type bool. Got: {type(return_fit)}") - if 'x1_fit' not in fit: + if "x1_fit" not in fit: pca_fit = _principal_component_analysis(x1, x2, bin_size=bin_size) for key in pca_fit: fit[key] = pca_fit[key] - x_quantile = fit['x_quantile'] - y_quantile = fit['y_quantile'] + x_quantile = fit["x_quantile"] + y_quantile = fit["y_quantile"] # Use the inverse of cdf to calculate component 1 values - component_1 = stats.invgauss.ppf(x_quantile, - mu=fit['x1_fit']['mu'], - loc=fit['x1_fit']['loc'], - scale=fit['x1_fit']['scale']) + component_1 = stats.invgauss.ppf( + x_quantile, + mu=fit["x1_fit"]["mu"], + loc=fit["x1_fit"]["loc"], + scale=fit["x1_fit"]["scale"], + ) # Find Component 2 mu using first order linear regression - mu_slope = fit['mu_fit'].slope - mu_intercept = fit['mu_fit'].intercept + mu_slope = fit["mu_fit"].slope + mu_intercept = fit["mu_fit"].intercept component_2_mu = mu_slope * component_1 + mu_intercept # Find Componenet 2 sigma using second order polynomial fit - sigma_polynomial_coeffcients = fit['sigma_fit'].x + sigma_polynomial_coeffcients = fit["sigma_fit"].x component_2_sigma = np.polyval(sigma_polynomial_coeffcients, component_1) # Use calculated mu and sigma values to calculate C2 along the contour - component_2 = stats.norm.ppf(y_quantile, - loc=component_2_mu, - scale=component_2_sigma) + component_2 = stats.norm.ppf( + y_quantile, loc=component_2_mu, scale=component_2_sigma + ) # Convert contours back to the original reference frame - principal_axes = fit['principal_axes'] - shift = fit['shift'] + principal_axes = fit["principal_axes"] + shift = fit["shift"] pa00 = principal_axes[0, 0] pa01 = principal_axes[0, 1] - x1_contour = ((pa00 * component_1 + pa01 * (component_2 - shift)) / - (pa01**2 + pa00**2)) - x2_contour = ((pa01 * 
component_1 - pa00 * (component_2 - shift)) / - (pa01**2 + pa00**2)) + x1_contour = (pa00 * component_1 + pa01 * (component_2 - shift)) / ( + pa01**2 + pa00**2 + ) + x2_contour = (pa01 * component_1 - pa00 * (component_2 - shift)) / ( + pa01**2 + pa00**2 + ) # Assign 0 value to any negative x1 contour values x1_contour = np.maximum(0, x1_contour) @@ -410,15 +473,18 @@ def _principal_component_analysis(x1, x2, bin_size=250): 'mu_param' : fit to _mu_fcn 'sigma_param' : fit to _sig_fits """ - assert isinstance(x1, np.ndarray), 'x1 must be of type np.ndarray' - assert isinstance(x2, np.ndarray), 'x2 must be of type np.ndarray' - assert isinstance(bin_size, int), 'bin_size must be of type int' + if not isinstance(x1, np.ndarray): + raise TypeError(f"x1 must be of type np.ndarray. Got: {type(x1)}") + if not isinstance(x2, np.ndarray): + raise TypeError(f"x2 must be of type np.ndarray. Got: {type(x2)}") + if not isinstance(bin_size, int): + raise TypeError(f"bin_size must be of type int. Got: {type(bin_size)}") + # Step 0: Perform Standard PCA mean_location = 0 x1_mean_centered = x1 - x1.mean(axis=0) x2_mean_centered = x2 - x2.mean(axis=0) - n_samples_by_n_features = np.column_stack((x1_mean_centered, - x2_mean_centered)) + n_samples_by_n_features = np.column_stack((x1_mean_centered, x2_mean_centered)) pca = skPCA(n_components=2) pca.fit(n_samples_by_n_features) principal_axes = pca.components_ @@ -444,29 +510,31 @@ def _principal_component_analysis(x1, x2, bin_size=250): x2_sorted = x2_components[x1_sorted_index] x1_fit_results = stats.invgauss.fit(x1_sorted, floc=mean_location) - x1_fit = {'mu': x1_fit_results[0], - 'loc': x1_fit_results[1], - 'scale': x1_fit_results[2]} + x1_fit = { + "mu": x1_fit_results[0], + "loc": x1_fit_results[1], + "scale": x1_fit_results[2], + } # Step 3: Bin Data & find order 1 linear relation between x1 & x2 means N = len(x1) - minimum_4_bins = np.floor(N*0.25) + minimum_4_bins = np.floor(N * 0.25) if bin_size > minimum_4_bins: bin_size = 
minimum_4_bins - msg = ('To allow for a minimum of 4 bins the bin size has been' + - f'set to {minimum_4_bins}') - print(msg) + msg = ( + "To allow for a minimum of 4 bins, the bin size has been " + + f"set to {minimum_4_bins}" + ) + warnings.warn(msg, UserWarning) - N_multiples = N // bin_size - max_N_multiples_index = N_multiples*bin_size + N_multiples = int(N // bin_size) + max_N_multiples_index = int(N_multiples * bin_size) x1_integer_multiples_of_bin_size = x1_sorted[0:max_N_multiples_index] x2_integer_multiples_of_bin_size = x2_sorted[0:max_N_multiples_index] - x1_bins = np.split(x1_integer_multiples_of_bin_size, - N_multiples) - x2_bins = np.split(x2_integer_multiples_of_bin_size, - N_multiples) + x1_bins = np.split(x1_integer_multiples_of_bin_size, N_multiples) + x2_bins = np.split(x2_integer_multiples_of_bin_size, N_multiples) x1_last_bin = x1_sorted[max_N_multiples_index:] x2_last_bin = x2_sorted[max_N_multiples_index:] @@ -487,29 +555,38 @@ def _principal_component_analysis(x1, x2, bin_size=250): # STEP 4: Find order 2 relation between x1_mean and x2 standard deviation sigma_polynomial_order = 2 - sig_0 = 0.1 * np.ones(sigma_polynomial_order+1) + sig_0 = 0.1 * np.ones(sigma_polynomial_order + 1) def _objective_function(sig_p, x1_means, x2_sigmas): return mean_squared_error(np.polyval(sig_p, x1_means), x2_sigmas) # Constraint Functions - def y_intercept_gt_0(sig_p): return (sig_p[2]) + def y_intercept_gt_0(sig_p): + return sig_p[2] def sig_polynomial_min_gt_0(sig_p): - return (sig_p[2] - (sig_p[1]**2) / (4 * sig_p[0])) - - constraints = ({'type': 'ineq', 'fun': y_intercept_gt_0}, - {'type': 'ineq', 'fun': sig_polynomial_min_gt_0}) - - sigma_fit = optim.minimize(_objective_function, x0=sig_0, - args=(x1_means, x2_sigmas), - method='SLSQP', constraints=constraints) - - PCA = {'principal_axes': principal_axes, - 'shift': shift, - 'x1_fit': x1_fit, - 'mu_fit': mu_fit, - 'sigma_fit': sigma_fit} + return sig_p[2] - (sig_p[1] ** 2) / (4 * sig_p[0]) + + 
constraints = ( + {"type": "ineq", "fun": y_intercept_gt_0}, + {"type": "ineq", "fun": sig_polynomial_min_gt_0}, + ) + + sigma_fit = optim.minimize( + _objective_function, + x0=sig_0, + args=(x1_means, x2_sigmas), + method="SLSQP", + constraints=constraints, + ) + + PCA = { + "principal_axes": principal_axes, + "shift": shift, + "x1_fit": x1_fit, + "mu_fit": mu_fit, + "sigma_fit": sigma_fit, + } return PCA @@ -541,37 +618,41 @@ def _iso_prob_and_quantile(sea_state_duration, return_period, nb_steps): 'y_quantile' - CDF of y-component """ - assert isinstance(sea_state_duration, (int, float) - ), 'sea_state_duration must be of type int or float' - assert isinstance(return_period, (int, float)), ( - 'return_period must be of type int or float') - - assert isinstance(nb_steps, int), 'nb_steps must be of type int' + if not isinstance(sea_state_duration, (int, float)): + raise TypeError( + f"sea_state_duration must be of type int or float. Got: {type(sea_state_duration)}" + ) + if not isinstance(return_period, (int, float)): + raise TypeError( + f"return_period must be of type int or float. Got: {type(return_period)}" + ) + if not isinstance(nb_steps, int): + raise TypeError(f"nb_steps must be of type int. 
Got: {type(nb_steps)}") dt_yrs = sea_state_duration / (3600 * 24 * 365) exceedance_probability = 1 / (return_period / dt_yrs) - iso_probability_radius = stats.norm.ppf((1 - exceedance_probability), - loc=0, scale=1) + iso_probability_radius = stats.norm.ppf( + (1 - exceedance_probability), loc=0, scale=1 + ) discretized_radians = np.linspace(0, 2 * np.pi, nb_steps) - x_component_iso_prob = iso_probability_radius * \ - np.cos(discretized_radians) - y_component_iso_prob = iso_probability_radius * \ - np.sin(discretized_radians) + x_component_iso_prob = iso_probability_radius * np.cos(discretized_radians) + y_component_iso_prob = iso_probability_radius * np.sin(discretized_radians) x_quantile = stats.norm.cdf(x_component_iso_prob, loc=0, scale=1) y_quantile = stats.norm.cdf(y_component_iso_prob, loc=0, scale=1) - results = {'exceedance_probability': exceedance_probability, - 'x_component_iso_prob': x_component_iso_prob, - 'y_component_iso_prob': y_component_iso_prob, - 'x_quantile': x_quantile, - 'y_quantile': y_quantile} + results = { + "exceedance_probability": exceedance_probability, + "x_component_iso_prob": x_component_iso_prob, + "y_component_iso_prob": y_component_iso_prob, + "x_quantile": x_quantile, + "y_quantile": y_quantile, + } return results -def _copula_parameters(x1, x2, min_bin_count, initial_bin_max_val, - bin_val_size): +def _copula_parameters(x1, x2, min_bin_count, initial_bin_max_val, bin_val_size): """ Returns an estimate of the Weibull and Lognormal distribution for x1 and x2 respectively. 
Additionally returns the estimates of the @@ -602,14 +683,22 @@ def _copula_parameters(x1, x2, min_bin_count, initial_bin_max_val, std_cond: array Estimate coefficients of the standard deviation of Ln(x2|x1) """ - assert isinstance(x1, np.ndarray), 'x1 must be of type np.ndarray' - assert isinstance(x2, np.ndarray), 'x2 must be of type np.ndarray' - assert isinstance(min_bin_count, int), ('min_bin_count must be of' - + 'type int') - assert isinstance(bin_val_size, (int, float)), ( - 'bin_val_size must be of type int or float') - assert isinstance(initial_bin_max_val, (int, float)), ( - 'initial_bin_max_val must be of type int or float') + if not isinstance(x1, np.ndarray): + raise TypeError(f"x1 must be of type np.ndarray. Got: {type(x1)}") + if not isinstance(x2, np.ndarray): + raise TypeError(f"x2 must be of type np.ndarray. Got: {type(x2)}") + if not isinstance(min_bin_count, int): + raise TypeError( + f"min_bin_count must be of type int. Got: {type(min_bin_count)}" + ) + if not isinstance(bin_val_size, (int, float)): + raise TypeError( + f"bin_val_size must be of type int or float. Got: {type(bin_val_size)}" + ) + if not isinstance(initial_bin_max_val, (int, float)): + raise TypeError( + f"initial_bin_max_val must be of type int or float. 
Got: {type(initial_bin_max_val)}" + ) # Binning x1_sorted_index = x1.argsort() @@ -634,10 +723,10 @@ def _copula_parameters(x1, x2, min_bin_count, initial_bin_max_val, bin_size_i = np.inf while bin_size_i >= min_bin_count: i += 1 - bin_i_max_val = initial_bin_max_val + bin_val_size*(i) + bin_i_max_val = initial_bin_max_val + bin_val_size * (i) N_vals_lt_limit = sum(x1_sorted <= bin_i_max_val) ind = np.append(ind, N_vals_lt_limit) - bin_size_i = ind[i]-ind[i-1] + bin_size_i = ind[i] - ind[i - 1] # Weibull distribution parameters for component 1 using MLE para_dist_1 = stats.exponweib.fit(x1_sorted, floc=0, fa=1) @@ -656,7 +745,7 @@ def _copula_parameters(x1, x2, min_bin_count, initial_bin_max_val, x2_lognormal_dist0 = stats.norm.fit(x2_log0) para_dist_cond.append(x2_lognormal_dist0) # mean of x1 (component 1 for zero bin) - x1_bin0 = x1_sorted[range(0, int(ind[0])-1)] + x1_bin0 = x1_sorted[range(0, int(ind[0]) - 1)] hss.append(np.mean(x1_bin0)) # Special case 2-bin lognormal Dist @@ -667,11 +756,11 @@ def _copula_parameters(x1, x2, min_bin_count, initial_bin_max_val, para_dist_cond.append(x2_lognormal_dist1) # mean of Hs (component 1 for bin 1) - hss.append(np.mean(x1_sorted[range(0, int(ind[1])-1)])) + hss.append(np.mean(x1_sorted[range(0, int(ind[1]) - 1)])) # lognormal Dist (lognormal dist over only 2 bins) for i in range(2, num): - ind_i = range(int(ind[i-2]), int(ind[i])) + ind_i = range(int(ind[i - 2]), int(ind[i])) x2_log_i = np.log(x2_sorted[ind_i]) x2_lognormal_dist_i = stats.norm.fit(x2_log_i) para_dist_cond.append(x2_lognormal_dist_i) @@ -680,7 +769,7 @@ def _copula_parameters(x1, x2, min_bin_count, initial_bin_max_val, # Estimate coefficient using least square solution (mean: 3rd order, # sigma: 2nd order) - ind_f = range(int(ind[num-2]), int(len(x1))) + ind_f = range(int(ind[num - 2]), int(len(x1))) x2_log_f = np.log(x2_sorted[ind_f]) x2_lognormal_dist_f = stats.norm.fit(x2_log_f) para_dist_cond.append(x2_lognormal_dist_f) # parameters for last bin @@ 
-692,17 +781,15 @@ def _copula_parameters(x1, x2, min_bin_count, initial_bin_max_val, hss = np.array(hss) # cubic in Hs: a + bx + cx**2 + dx**3 - phi_mean = np.column_stack((np.ones(num+1), hss, hss**2, hss**3)) + phi_mean = np.column_stack((np.ones(num + 1), hss, hss**2, hss**3)) # quadratic in Hs a + bx + cx**2 - phi_std = np.column_stack((np.ones(num+1), hss, hss**2)) + phi_std = np.column_stack((np.ones(num + 1), hss, hss**2)) # Estimate coefficients of mean of Ln(T|Hs)(vector 4x1) (cubic in Hs) - mean_cond = np.linalg.lstsq(phi_mean, para_dist_cond[:, 0], - rcond=None)[0] + mean_cond = np.linalg.lstsq(phi_mean, para_dist_cond[:, 0], rcond=None)[0] # Estimate coefficients of standard deviation of Ln(T|Hs) # (vector 3x1) (quadratic in Hs) - std_cond = np.linalg.lstsq(phi_std, para_dist_cond[:, 1], - rcond=None)[0] + std_cond = np.linalg.lstsq(phi_std, para_dist_cond[:, 1], rcond=None)[0] return para_dist_1, para_dist_2, mean_cond, std_cond @@ -753,36 +840,42 @@ def _gaussian_copula(x1, x2, fit, component_1, kwargs): x2 = np.array(x2) except: pass - assert isinstance(x1, np.ndarray), 'x1 must be of type np.ndarray' - assert isinstance(x2, np.ndarray), 'x2 must be of type np.ndarray' - assert isinstance(component_1, np.ndarray), ( - 'x2 must be of type np.ndarray') - + if not isinstance(x1, np.ndarray): + raise TypeError(f"x1 must be of type np.ndarray. Got: {type(x1)}") + if not isinstance(x2, np.ndarray): + raise TypeError(f"x2 must be of type np.ndarray. Got: {type(x2)}") + if not isinstance(component_1, np.ndarray): + raise TypeError( + f"component_1 must be of type np.ndarray. Got: {type(component_1)}" + ) return_fit = kwargs.get("return_fit", False) - assert isinstance(return_fit, bool), ( - 'If specified return_fit must be a bool') + if not isinstance(return_fit, bool): + raise TypeError( + f"If specified, return_fit must be of type bool. 
Got: {type(return_fit)}" + ) - x_component_iso_prob = fit['x_component_iso_prob'] - y_component_iso_prob = fit['y_component_iso_prob'] + x_component_iso_prob = fit["x_component_iso_prob"] + y_component_iso_prob = fit["y_component_iso_prob"] # Calculate Kendall's tau tau = stats.kendalltau(x2, x1)[0] - rho_gau = np.sin(tau*np.pi/2.) + rho_gau = np.sin(tau * np.pi / 2.0) - z2_Gauss = stats.norm.cdf(y_component_iso_prob*np.sqrt(1.-rho_gau**2.) - + rho_gau*x_component_iso_prob) + z2_Gauss = stats.norm.cdf( + y_component_iso_prob * np.sqrt(1.0 - rho_gau**2.0) + + rho_gau * x_component_iso_prob + ) - para_dist_2 = fit['para_dist_2'] + para_dist_2 = fit["para_dist_2"] s = para_dist_2[1] loc = 0 scale = np.exp(para_dist_2[0]) # lognormal inverse - component_2_Gaussian = stats.lognorm.ppf(z2_Gauss, s=s, loc=loc, - scale=scale) - fit['tau'] = tau - fit['rho'] = rho_gau - fit['z2'] = z2_Gauss + component_2_Gaussian = stats.lognorm.ppf(z2_Gauss, s=s, loc=loc, scale=scale) + fit["tau"] = tau + fit["rho"] = rho_gau + fit["z2"] = z2_Gauss if return_fit: return component_1, component_2_Gaussian, fit @@ -807,18 +900,20 @@ def _gumbel_density(u, alpha): Copula density function. 
""" - #Ignore divide by 0 warnings and resulting NaN warnings - np.seterr(all='ignore') + # Ignore divide by 0 warnings and resulting NaN warnings + np.seterr(all="ignore") v = -np.log(u) v = np.sort(v, axis=0) vmin = v[0, :] vmax = v[1, :] nlogC = vmax * (1 + (vmin / vmax) ** alpha) ** (1 / alpha) - y = (alpha - 1 + nlogC)*np.exp( - -nlogC+np.sum((alpha-1) * np.log(v)+v, axis=0) + - (1-2*alpha)*np.log(nlogC)) - np.seterr(all='warn') - return(y) + y = (alpha - 1 + nlogC) * np.exp( + -nlogC + + np.sum((alpha - 1) * np.log(v) + v, axis=0) + + (1 - 2 * alpha) * np.log(nlogC) + ) + np.seterr(all="warn") + return y def _gumbel_copula(x1, x2, fit, component_1, nb_steps, kwargs): @@ -869,24 +964,30 @@ def _gumbel_copula(x1, x2, fit, component_1, nb_steps, kwargs): x2 = np.array(x2) except: pass - assert isinstance(x1, np.ndarray), 'x1 must be of type np.ndarray' - assert isinstance(x2, np.ndarray), 'x2 must be of type np.ndarray' - assert isinstance(component_1, np.ndarray), 'x2 must be of type np.ndarray' - + if not isinstance(x1, np.ndarray): + raise TypeError(f"x1 must be of type np.ndarray. Got: {type(x1)}") + if not isinstance(x2, np.ndarray): + raise TypeError(f"x2 must be of type np.ndarray. Got: {type(x2)}") + if not isinstance(component_1, np.ndarray): + raise TypeError( + f"component_1 must be of type np.ndarray. Got: {type(component_1)}" + ) return_fit = kwargs.get("return_fit", False) - assert isinstance( - return_fit, bool), 'If specified return_fit must be a bool' + if not isinstance(return_fit, bool): + raise TypeError( + f"If specified, return_fit must be of type bool. 
Got: {type(return_fit)}" + ) - x_quantile = fit['x_quantile'] - y_quantile = fit['y_quantile'] - para_dist_2 = fit['para_dist_2'] + x_quantile = fit["x_quantile"] + y_quantile = fit["y_quantile"] + para_dist_2 = fit["para_dist_2"] # Calculate Kendall's tau tau = stats.kendalltau(x2, x1)[0] - theta_gum = 1./(1.-tau) + theta_gum = 1.0 / (1.0 - tau) min_limit_2 = 0 - max_limit_2 = np.ceil(np.amax(x2)*2) + max_limit_2 = np.ceil(np.amax(x2) * 2) Ndata = 1000 x = np.linspace(min_limit_2, max_limit_2, Ndata) @@ -895,21 +996,21 @@ def _gumbel_copula(x1, x2, fit, component_1, nb_steps, kwargs): scale = np.exp(para_dist_2[0]) z2 = stats.lognorm.cdf(x, s=s, loc=0, scale=scale) - fit['tau'] = tau - fit['theta'] = theta_gum - fit['z2'] = z2 + fit["tau"] = tau + fit["theta"] = theta_gum + fit["z2"] = z2 component_2_Gumbel = np.zeros(nb_steps) for k in range(nb_steps): - z1 = np.array([x_quantile[k]]*Ndata) + z1 = np.array([x_quantile[k]] * Ndata) Z = np.array((z1, z2)) Y = _gumbel_density(Z, theta_gum) Y = np.nan_to_num(Y) # pdf 2|1, f(comp_2|comp_1)=c(z1,z2)*f(comp_2) - p_x_x1 = Y*(stats.lognorm.pdf(x, s=s, loc=0, scale=scale)) + p_x_x1 = Y * (stats.lognorm.pdf(x, s=s, loc=0, scale=scale)) # Estimate CDF from PDF dum = np.cumsum(p_x_x1) - cdf = dum/(dum[Ndata-1]) + cdf = dum / (dum[Ndata - 1]) # Result of conditional CDF derived based on Gumbel copula table = np.array((x, cdf)) table = table.T @@ -918,7 +1019,7 @@ def _gumbel_copula(x1, x2, fit, component_1, nb_steps, kwargs): component_2_Gumbel[k] = min(table[:, 0]) break elif y_quantile[k] <= table[j, 1]: - component_2_Gumbel[k] = (table[j, 0]+table[j-1, 0])/2 + component_2_Gumbel[k] = (table[j, 0] + table[j - 1, 0]) / 2 break else: component_2_Gumbel[k] = table[:, 0].max() @@ -967,32 +1068,41 @@ def _clayton_copula(x1, x2, fit, component_1, kwargs): If return_fit=True. Dictionary with iso-probabilities passed with additional fit metrics from the copula method. 
""" - assert isinstance(x1, np.ndarray), 'x1 must be of type np.ndarray' - assert isinstance(x2, np.ndarray), 'x2 must be of type np.ndarray' - assert isinstance(component_1, np.ndarray), 'x2 must be of type np.ndarray' + if not isinstance(x1, np.ndarray): + raise TypeError(f"x1 must be of type np.ndarray. Got: {type(x1)}") + if not isinstance(x2, np.ndarray): + raise TypeError(f"x2 must be of type np.ndarray. Got: {type(x2)}") + if not isinstance(component_1, np.ndarray): + raise TypeError( + f"component_1 must be of type np.ndarray. Got: {type(component_1)}" + ) return_fit = kwargs.get("return_fit", False) - assert isinstance( - return_fit, bool), 'If specified return_fit must be a bool' + if not isinstance(return_fit, bool): + raise TypeError( + f"If specified, return_fit must be of type bool. Got: {type(return_fit)}" + ) - x_quantile = fit['x_quantile'] - y_quantile = fit['y_quantile'] - para_dist_2 = fit['para_dist_2'] + x_quantile = fit["x_quantile"] + y_quantile = fit["y_quantile"] + para_dist_2 = fit["para_dist_2"] # Calculate Kendall's tau tau = stats.kendalltau(x2, x1)[0] - theta_clay = (2.*tau)/(1.-tau) + theta_clay = (2.0 * tau) / (1.0 - tau) s = para_dist_2[1] scale = np.exp(para_dist_2[0]) - z2_Clay = ((1.-x_quantile**(-theta_clay)+x_quantile**(-theta_clay) / - y_quantile)**(theta_clay/(1.+theta_clay)))**(-1./theta_clay) + z2_Clay = ( + (1.0 - x_quantile ** (-theta_clay) + x_quantile ** (-theta_clay) / y_quantile) + ** (theta_clay / (1.0 + theta_clay)) + ) ** (-1.0 / theta_clay) # lognormal inverse component_2_Clayton = stats.lognorm.ppf(z2_Clay, s=s, loc=0, scale=scale) - fit['theta_clay'] = theta_clay - fit['tau'] = tau - fit['z2_Clay'] = z2_Clay + fit["theta_clay"] = theta_clay + fit["tau"] = tau + fit["z2_Clay"] = z2_Clay if return_fit: return component_1, component_2_Clayton, fit @@ -1047,36 +1157,47 @@ def _rosenblatt_copula(x1, x2, fit, component_1, kwargs): x2 = np.array(x2) except: pass - assert isinstance(x1, np.ndarray), 'x1 must be of type 
np.ndarray' - assert isinstance(x2, np.ndarray), 'x2 must be of type np.ndarray' - assert isinstance(component_1, np.ndarray), 'x2 must be of type np.ndarray' + if not isinstance(x1, np.ndarray): + raise TypeError(f"x1 must be of type np.ndarray. Got: {type(x1)}") + if not isinstance(x2, np.ndarray): + raise TypeError(f"x2 must be of type np.ndarray. Got: {type(x2)}") + if not isinstance(component_1, np.ndarray): + raise TypeError( + f"component_1 must be of type np.ndarray. Got: {type(component_1)}" + ) return_fit = kwargs.get("return_fit", False) - assert isinstance( - return_fit, bool), 'If specified return_fit must be a bool' + if not isinstance(return_fit, bool): + raise TypeError( + f"If specified, return_fit must be of type bool. Got: {type(return_fit)}" + ) - y_quantile = fit['y_quantile'] - mean_cond = fit['mean_cond'] - std_cond = fit['std_cond'] + y_quantile = fit["y_quantile"] + mean_cond = fit["mean_cond"] + std_cond = fit["std_cond"] # mean of Ln(T) as a function of x1 - lamda_cond = mean_cond[0]+mean_cond[1]*component_1 + \ - mean_cond[2]*component_1**2+mean_cond[3]*component_1**3 + lamda_cond = ( + mean_cond[0] + + mean_cond[1] * component_1 + + mean_cond[2] * component_1**2 + + mean_cond[3] * component_1**3 + ) # Standard deviation of Ln(x2) as a function of x1 - sigma_cond = std_cond[0]+std_cond[1]*component_1+std_cond[2]*component_1**2 + sigma_cond = std_cond[0] + std_cond[1] * component_1 + std_cond[2] * component_1**2 # lognormal inverse component_2_Rosenblatt = stats.lognorm.ppf( - y_quantile, s=sigma_cond, loc=0, scale=np.exp(lamda_cond)) + y_quantile, s=sigma_cond, loc=0, scale=np.exp(lamda_cond) + ) - fit['lamda_cond'] = lamda_cond - fit['sigma_cond'] = sigma_cond + fit["lamda_cond"] = lamda_cond + fit["sigma_cond"] = sigma_cond if return_fit: return component_1, component_2_Rosenblatt, fit return component_1, component_2_Rosenblatt -def _nonparametric_copula_parameters(x1, x2, max_x1=None, max_x2=None, - nb_steps=1000): +def 
_nonparametric_copula_parameters(x1, x2, max_x1=None, max_x2=None, nb_steps=1000): """ Calculates nonparametric copula parameters @@ -1102,15 +1223,20 @@ def _nonparametric_copula_parameters(x1, x2, max_x1=None, max_x2=None, nonpara_pdf_2: x2 points in KDE space and Nonparametric PDF for x2 """ - assert isinstance(x1, np.ndarray), 'x1 must be of type np.ndarray' - assert isinstance(x2, np.ndarray), 'x2 must be of type np.ndarray' + if not isinstance(x1, np.ndarray): + raise TypeError(f"x1 must be of type np.ndarray. Got: {type(x1)}") + if not isinstance(x2, np.ndarray): + raise TypeError(f"x2 must be of type np.ndarray. Got: {type(x2)}") if not max_x1: - max_x1 = x1.max()*2 + max_x1 = x1.max() * 2 if not max_x2: - max_x2 = x2.max()*2 - assert isinstance(max_x1, float), 'max_x1 must be of type float' - assert isinstance(max_x2, float), 'max_x2 must be of type float' - assert isinstance(nb_steps, int), 'nb_steps must be of type int' + max_x2 = x2.max() * 2 + if not isinstance(max_x1, float): + raise TypeError(f"max_x1 must be of type float. Got: {type(max_x1)}") + if not isinstance(max_x2, float): + raise TypeError(f"max_x2 must be of type float. Got: {type(max_x2)}") + if not isinstance(nb_steps, int): + raise TypeError(f"nb_steps must be of type int. 
Got: {type(nb_steps)}") # Binning x1_sorted_index = x1.argsort() @@ -1128,11 +1254,11 @@ def _nonparametric_copula_parameters(x1, x2, max_x1=None, max_x2=None, # Calculate optimal bandwidth for T and Hs sig = stats.median_abs_deviation(x2_sorted) num = float(len(x2_sorted)) - bwT = sig*(4.0/(3.0*num))**(1.0/5.0) + bwT = sig * (4.0 / (3.0 * num)) ** (1.0 / 5.0) sig = stats.median_abs_deviation(x1_sorted) num = float(len(x1_sorted)) - bwHs = sig*(4.0/(3.0*num))**(1.0/5.0) + bwHs = sig * (4.0 / (3.0 * num)) ** (1.0 / 5.0) # Nonparametric PDF for x2 temp = KDEUnivariate(x2_sorted) @@ -1143,11 +1269,11 @@ def _nonparametric_copula_parameters(x1, x2, max_x1=None, max_x2=None, temp = KDEUnivariate(x1_sorted) temp.fit(bw=bwHs) tempPDF = temp.evaluate(pts_x1) - F_x1 = tempPDF/sum(tempPDF) + F_x1 = tempPDF / sum(tempPDF) F_x1 = np.cumsum(F_x1) # Nonparametric CDF for x2 - F_x2 = f_x2/sum(f_x2) + F_x2 = f_x2 / sum(f_x2) F_x2 = np.cumsum(F_x2) nonpara_dist_1 = np.transpose(np.array([pts_x1, F_x1])) @@ -1176,7 +1302,8 @@ def _nonparametric_component(z, nonpara_dist, nb_steps): component: array nonparametic component values """ - assert isinstance(nb_steps, int), 'nb_steps must be of type int' + if not isinstance(nb_steps, int): + raise TypeError(f"nb_steps must be of type int. Got: {type(nb_steps)}") component = np.zeros(nb_steps) for k in range(0, nb_steps): @@ -1185,7 +1312,7 @@ def _nonparametric_component(z, nonpara_dist, nb_steps): component[k] = min(nonpara_dist[:, 0]) break elif z[k] <= nonpara_dist[j, 1]: - component[k] = (nonpara_dist[j, 0] + nonpara_dist[j-1, 0])/2 + component[k] = (nonpara_dist[j, 0] + nonpara_dist[j - 1, 0]) / 2 break else: component[k] = max(nonpara_dist[:, 0]) @@ -1223,48 +1350,51 @@ def _nonparametric_gaussian_copula(x1, x2, fit, nb_steps, kwargs): If return_fit=True. Dictionary with iso-probabilities passed with additional fit metrics from the copula method. 
""" - assert isinstance(x1, np.ndarray), 'x1 must be of type np.ndarray' - assert isinstance(x2, np.ndarray), 'x2 must be of type np.ndarray' - assert isinstance(nb_steps, int), 'nb_steps must be of type int' - + if not isinstance(x1, np.ndarray): + raise TypeError(f"x1 must be of type np.ndarray. Got: {type(x1)}") + if not isinstance(x2, np.ndarray): + raise TypeError(f"x2 must be of type np.ndarray. Got: {type(x2)}") + if not isinstance(nb_steps, int): + raise TypeError(f"nb_steps must be of type int. Got: {type(nb_steps)}") return_fit = kwargs.get("return_fit", False) - assert isinstance( - return_fit, bool), 'If specified return_fit must be a bool' + if not isinstance(return_fit, bool): + raise TypeError( + f"If specified, return_fit must be of type bool. Got: {type(return_fit)}" + ) - x_component_iso_prob = fit['x_component_iso_prob'] - y_component_iso_prob = fit['y_component_iso_prob'] - nonpara_dist_1 = fit['nonpara_dist_1'] - nonpara_dist_2 = fit['nonpara_dist_2'] + x_component_iso_prob = fit["x_component_iso_prob"] + y_component_iso_prob = fit["y_component_iso_prob"] + nonpara_dist_1 = fit["nonpara_dist_1"] + nonpara_dist_2 = fit["nonpara_dist_2"] # Calculate Kendall's tau tau = stats.kendalltau(x2, x1)[0] - rho_gau = np.sin(tau*np.pi/2.) + rho_gau = np.sin(tau * np.pi / 2.0) # Component 1 z1 = stats.norm.cdf(x_component_iso_prob) - z2 = stats.norm.cdf(y_component_iso_prob*np.sqrt(1. 
- - rho_gau**2.)+rho_gau*x_component_iso_prob) + z2 = stats.norm.cdf( + y_component_iso_prob * np.sqrt(1.0 - rho_gau**2.0) + + rho_gau * x_component_iso_prob + ) - comps = {1: {'z': z1, - 'nonpara_dist': nonpara_dist_1 - }, - 2: {'z': z2, - 'nonpara_dist': nonpara_dist_2 - } - } + comps = { + 1: {"z": z1, "nonpara_dist": nonpara_dist_1}, + 2: {"z": z2, "nonpara_dist": nonpara_dist_2}, + } for c in comps: - z = comps[c]['z'] - nonpara_dist = comps[c]['nonpara_dist'] - comps[c]['comp'] = _nonparametric_component(z, nonpara_dist, nb_steps) + z = comps[c]["z"] + nonpara_dist = comps[c]["nonpara_dist"] + comps[c]["comp"] = _nonparametric_component(z, nonpara_dist, nb_steps) - component_1_np = comps[1]['comp'] - component_2_np_gaussian = comps[2]['comp'] + component_1_np = comps[1]["comp"] + component_2_np_gaussian = comps[2]["comp"] - fit['tau'] = tau - fit['rho'] = rho_gau - fit['z1'] = z1 - fit['z2'] = z2 + fit["tau"] = tau + fit["rho"] = rho_gau + fit["z1"] = z1 + fit["z2"] = z2 if return_fit: return component_1_np, component_2_np_gaussian, fit @@ -1302,51 +1432,53 @@ def _nonparametric_clayton_copula(x1, x2, fit, nb_steps, kwargs): If return_fit=True. Dictionary with iso-probabilities passed with additional fit metrics from the copula method. """ - assert isinstance(x1, np.ndarray), 'x1 must be of type np.ndarray' - assert isinstance(x2, np.ndarray), 'x2 must be of type np.ndarray' - assert isinstance(nb_steps, int), 'nb_steps must be of type int' - + if not isinstance(x1, np.ndarray): + raise TypeError(f"x1 must be of type np.ndarray. Got: {type(x1)}") + if not isinstance(x2, np.ndarray): + raise TypeError(f"x2 must be of type np.ndarray. Got: {type(x2)}") + if not isinstance(nb_steps, int): + raise TypeError(f"nb_steps must be of type int. 
Got: {type(nb_steps)}") return_fit = kwargs.get("return_fit", False) - assert isinstance(return_fit, bool), ('If specified return_fit ' - + 'must be a bool') - - x_component_iso_prob = fit['x_component_iso_prob'] - x_quantile = fit['x_quantile'] - y_quantile = fit['y_quantile'] - nonpara_dist_1 = fit['nonpara_dist_1'] - nonpara_dist_2 = fit['nonpara_dist_2'] - nonpara_pdf_2 = fit['nonpara_pdf_2'] + if not isinstance(return_fit, bool): + raise TypeError( + f"If specified, return_fit must be of type bool. Got: {type(return_fit)}" + ) + + x_component_iso_prob = fit["x_component_iso_prob"] + x_quantile = fit["x_quantile"] + y_quantile = fit["y_quantile"] + nonpara_dist_1 = fit["nonpara_dist_1"] + nonpara_dist_2 = fit["nonpara_dist_2"] + nonpara_pdf_2 = fit["nonpara_pdf_2"] # Calculate Kendall's tau tau = stats.kendalltau(x2, x1)[0] - theta_clay = (2.*tau)/(1.-tau) + theta_clay = (2.0 * tau) / (1.0 - tau) # Component 1 (Hs) z1 = stats.norm.cdf(x_component_iso_prob) - z2_clay = ((1-x_quantile**(-theta_clay) - + x_quantile**(-theta_clay) - / y_quantile)**(theta_clay/(1.+theta_clay)))**(-1./theta_clay) - - comps = {1: {'z': z1, - 'nonpara_dist': nonpara_dist_1 - }, - 2: {'z': z2_clay, - 'nonpara_dist': nonpara_dist_2 - } - } + z2_clay = ( + (1 - x_quantile ** (-theta_clay) + x_quantile ** (-theta_clay) / y_quantile) + ** (theta_clay / (1.0 + theta_clay)) + ) ** (-1.0 / theta_clay) + + comps = { + 1: {"z": z1, "nonpara_dist": nonpara_dist_1}, + 2: {"z": z2_clay, "nonpara_dist": nonpara_dist_2}, + } for c in comps: - z = comps[c]['z'] - nonpara_dist = comps[c]['nonpara_dist'] - comps[c]['comp'] = _nonparametric_component(z, nonpara_dist, nb_steps) + z = comps[c]["z"] + nonpara_dist = comps[c]["nonpara_dist"] + comps[c]["comp"] = _nonparametric_component(z, nonpara_dist, nb_steps) - component_1_np = comps[1]['comp'] - component_2_np_clayton = comps[2]['comp'] + component_1_np = comps[1]["comp"] + component_2_np_clayton = comps[2]["comp"] - fit['tau'] = tau - fit['theta'] = 
theta_clay - fit['z1'] = z1 - fit['z2'] = z2_clay + fit["tau"] = tau + fit["theta"] = theta_clay + fit["z1"] = z1 + fit["z2"] = z2_clay if return_fit: return component_1_np, component_2_np_clayton, fit @@ -1384,25 +1516,29 @@ def _nonparametric_gumbel_copula(x1, x2, fit, nb_steps, kwargs): If return_fit=True. Dictionary with iso-probabilities passed with additional fit metrics from the copula method. """ - assert isinstance(x1, np.ndarray), 'x1 must be of type np.ndarray' - assert isinstance(x2, np.ndarray), 'x2 must be of type np.ndarray' - assert isinstance(nb_steps, int), 'nb_steps must be of type int' - + if not isinstance(x1, np.ndarray): + raise TypeError(f"x1 must be of type np.ndarray. Got: {type(x1)}") + if not isinstance(x2, np.ndarray): + raise TypeError(f"x2 must be of type np.ndarray. Got: {type(x2)}") + if not isinstance(nb_steps, int): + raise TypeError(f"nb_steps must be of type int. Got: {type(nb_steps)}") return_fit = kwargs.get("return_fit", False) - assert isinstance(return_fit, bool), ('If specified return_fit ' - + 'must be a bool') + if not isinstance(return_fit, bool): + raise TypeError( + f"If specified, return_fit must be a bool. 
Got: {type(return_fit)}" + ) Ndata = 1000 - x_quantile = fit['x_quantile'] - y_quantile = fit['y_quantile'] - nonpara_dist_1 = fit['nonpara_dist_1'] - nonpara_dist_2 = fit['nonpara_dist_2'] - nonpara_pdf_2 = fit['nonpara_pdf_2'] + x_quantile = fit["x_quantile"] + y_quantile = fit["y_quantile"] + nonpara_dist_1 = fit["nonpara_dist_1"] + nonpara_dist_2 = fit["nonpara_dist_2"] + nonpara_pdf_2 = fit["nonpara_pdf_2"] # Calculate Kendall's tau tau = stats.kendalltau(x2, x1)[0] - theta_gum = 1./(1.-tau) + theta_gum = 1.0 / (1.0 - tau) # Component 1 (Hs) z1 = x_quantile @@ -1414,15 +1550,15 @@ def _nonparametric_gumbel_copula(x1, x2, fit, nb_steps, kwargs): component_2_np_gumbel = np.zeros(nb_steps) for k in range(nb_steps): - z1 = np.array([x_quantile[k]]*Ndata) + z1 = np.array([x_quantile[k]] * Ndata) Z = np.array((z1.T, F_x2)) Y = _gumbel_density(Z, theta_gum) Y = np.nan_to_num(Y) # pdf 2|1 - p_x2_x1 = Y*f_x2 + p_x2_x1 = Y * f_x2 # Estimate CDF from PDF dum = np.cumsum(p_x2_x1) - cdf = dum/(dum[Ndata-1]) + cdf = dum / (dum[Ndata - 1]) table = np.array((pts_x2, cdf)) table = table.T for j in range(Ndata): @@ -1430,17 +1566,17 @@ def _nonparametric_gumbel_copula(x1, x2, fit, nb_steps, kwargs): component_2_np_gumbel[k] = min(table[:, 0]) break elif y_quantile[k] <= table[j, 1]: - component_2_np_gumbel[k] = (table[j, 0]+table[j-1, 0])/2 + component_2_np_gumbel[k] = (table[j, 0] + table[j - 1, 0]) / 2 break else: component_2_np_gumbel[k] = max(table[:, 0]) - fit['tau'] = tau - fit['theta'] = theta_gum - fit['z1'] = z1 - fit['pts_x2'] = pts_x2 - fit['f_x2'] = f_x2 - fit['F_x2'] = F_x2 + fit["tau"] = tau + fit["theta"] = theta_gum + fit["z1"] = z1 + fit["pts_x2"] = pts_x2 + fit["f_x2"] = f_x2 + fit["F_x2"] = F_x2 if return_fit: return component_1_np, component_2_np_gumbel, fit @@ -1466,7 +1602,7 @@ def _bivariate_KDE(x1, x2, bw, fit, nb_steps, Ndata_bivariate_KDE, kwargs): fit: Dictionay Dictionary of the iso-probability results nb_steps: int - number of points used to 
discritize KDE space + number of points used to discretize KDE space max_x1: float Defines the max value of x1 to discretize the KDE space max_x2: float @@ -1487,9 +1623,12 @@ def _bivariate_KDE(x1, x2, bw, fit, nb_steps, Ndata_bivariate_KDE, kwargs): If return_fit=True. Dictionary with iso-probabilities passed with additional fit metrics from the copula method. """ - assert isinstance(x1, np.ndarray), 'x1 must be of type np.ndarray' - assert isinstance(x2, np.ndarray), 'x2 must be of type np.ndarray' - assert isinstance(nb_steps, int), 'nb_steps must be of type int' + if not isinstance(x1, np.ndarray): + raise TypeError(f"x1 must be of type np.ndarray. Got: {type(x1)}") + if not isinstance(x2, np.ndarray): + raise TypeError(f"x2 must be of type np.ndarray. Got: {type(x2)}") + if not isinstance(nb_steps, int): + raise TypeError(f"nb_steps must be of type int. Got: {type(nb_steps)}") max_x1 = kwargs.get("max_x1", None) max_x2 = kwargs.get("max_x2", None) @@ -1497,17 +1636,23 @@ def _bivariate_KDE(x1, x2, bw, fit, nb_steps, Ndata_bivariate_KDE, kwargs): return_fit = kwargs.get("return_fit", False) if isinstance(max_x1, type(None)): - max_x1 = x1.max()*2 + max_x1 = x1.max() * 2 if isinstance(max_x2, type(None)): - max_x2 = x2.max()*2 - assert isinstance(max_x1, float), 'max_x1 must be of type float' - assert isinstance(max_x2, float), 'max_x2 must be of type float' - assert isinstance(log_transform, bool), ('If specified log_transform' - + 'must be a bool') - assert isinstance(return_fit, bool), ('If specified return_fit must ' - + 'be a bool') - - p_f = fit['exceedance_probability'] + max_x2 = x2.max() * 2 + if not isinstance(max_x1, float): + raise TypeError(f"max_x1 must be of type float. Got: {type(max_x1)}") + if not isinstance(max_x2, float): + raise TypeError(f"max_x2 must be of type float. Got: {type(max_x2)}") + if not isinstance(log_transform, bool): + raise TypeError( + f"If specified, log_transform must be of type bool. 
Got: {type(log_transform)}" + ) + if not isinstance(return_fit, bool): + raise TypeError( + f"If specified, return_fit must be of type bool. Got: {type(return_fit)}" + ) + + p_f = fit["exceedance_probability"] min_limit_1 = 0.01 min_limit_2 = 0.01 @@ -1535,10 +1680,10 @@ def _bivariate_KDE(x1, x2, bw, fit, nb_steps, Ndata_bivariate_KDE, kwargs): for i in range(0, m): ftemp = np.ones((n, 1)) for j in range(0, d): - z = (txi[j][i] - ty[j])/bw[j] + z = (txi[j][i] - ty[j]) / bw[j] fk = stats.norm.pdf(z) if log_transform: - fnew = fk*(1/np.transpose(xi[j][i])) + fnew = fk * (1 / np.transpose(xi[j][i])) else: fnew = fk fnew = np.reshape(fnew, (n, 1)) @@ -1551,27 +1696,39 @@ def _bivariate_KDE(x1, x2, bw, fit, nb_steps, Ndata_bivariate_KDE, kwargs): x1_bivariate_KDE = [] x2_bivariate_KDE = [] - for i, seg in enumerate(vals.allsegs[0]): + if mpl_version < (3, 8): # For versions before 3.8 + segments = vals.allsegs[0] + else: + segments = [path.vertices for path in vals.get_paths()] + + for seg in segments: x1_bivariate_KDE.append(seg[:, 1]) x2_bivariate_KDE.append(seg[:, 0]) x1_bivariate_KDE = np.transpose(np.asarray(x1_bivariate_KDE)[0]) x2_bivariate_KDE = np.transpose(np.asarray(x2_bivariate_KDE)[0]) - fit['mesh_pts_x1'] = mesh_pts_x1 - fit['mesh_pts_x2'] = mesh_pts_x2 - fit['ty'] = ty - fit['xi'] = xi - fit['contour_vals'] = vals + fit["mesh_pts_x1"] = mesh_pts_x1 + fit["mesh_pts_x2"] = mesh_pts_x2 + fit["ty"] = ty + fit["xi"] = xi + fit["contour_vals"] = vals if return_fit: return x1_bivariate_KDE, x2_bivariate_KDE, fit return x1_bivariate_KDE, x2_bivariate_KDE -### Sampling -def samples_full_seastate(x1, x2, points_per_interval, return_periods, - sea_state_duration, method="PCA", bin_size=250): +# Sampling +def samples_full_seastate( + x1, + x2, + points_per_interval, + return_periods, + sea_state_duration, + method="PCA", + bin_size=250, +): """ Sample a sea state between contours of specified return periods. 
@@ -1585,9 +1742,9 @@ def samples_full_seastate(x1, x2, points_per_interval, return_periods, Parameters ---------- - x1: np.array + x1: list, np.ndarray, pd.Series, xr.DataArray Component 1 data - x2: np.array + x2: list, np.ndarray, pd.Series, xr.DataArray Component 2 data points_per_interval : int Number of sample points to be calculated per contour interval. @@ -1612,21 +1769,29 @@ def samples_full_seastate(x1, x2, points_per_interval, return_periods, Vector of probabilistic weights for each sampling point to be used in risk calculations. """ - if method != 'PCA': + if method != "PCA": raise NotImplementedError( - "Full sea state sampling is currently only implemented using " + - "the 'PCA' method.") - assert isinstance(x1, np.ndarray), 'x1 must be of type np.ndarray' - assert isinstance(x2, np.ndarray), 'x2 must be of type np.ndarray' - assert isinstance(points_per_interval, - int), 'points_per_interval must be of int' - assert isinstance(return_periods, np.ndarray - ), 'return_periods must be of type np.ndarray' - assert isinstance(sea_state_duration, (int, float) - ), 'sea_state_duration must be of int or float' - assert isinstance(method, (str, list) - ), 'method must be of type string or list' - assert isinstance(bin_size, int), 'bin_size must be of int' + "Full sea state sampling is currently only implemented using " + + "the 'PCA' method." + ) + x1 = to_numeric_array(x1, "x1") + x2 = to_numeric_array(x2, "x2") + if not isinstance(points_per_interval, int): + raise TypeError( + f"points_per_interval must be of int. Got: {type(points_per_interval)}" + ) + if not isinstance(return_periods, np.ndarray): + raise TypeError( + f"return_periods must be of type np.ndarray. Got: {type(return_periods)}" + ) + if not isinstance(sea_state_duration, (int, float)): + raise TypeError( + f"sea_state_duration must be of int or float. Got: {type(sea_state_duration)}" + ) + if not isinstance(method, (str, list)): + raise TypeError(f"method must be of type string or list. 
Got: {type(method)}") + if not isinstance(bin_size, int): + raise TypeError(f"bin_size must be of int. Got: {type(bin_size)}") pca_fit = _principal_component_analysis(x1, x2, bin_size) @@ -1636,31 +1801,31 @@ def samples_full_seastate(x1, x2, points_per_interval, return_periods, h_zeroline = np.zeros(len(t_zeroline)) # Transform zero line into principal component space - coeff = pca_fit['principal_axes'] - shift = pca_fit['shift'] - comp_zeroline = np.dot(np.transpose(np.vstack([h_zeroline, t_zeroline])), - coeff) + coeff = pca_fit["principal_axes"] + shift = pca_fit["shift"] + comp_zeroline = np.dot(np.transpose(np.vstack([h_zeroline, t_zeroline])), coeff) comp_zeroline[:, 1] = comp_zeroline[:, 1] + shift - comp1 = pca_fit['x1_fit'] + comp1 = pca_fit["x1_fit"] c1_zeroline_prob = stats.invgauss.cdf( - comp_zeroline[:, 0], mu=comp1['mu'], loc=0, scale=comp1['scale']) + comp_zeroline[:, 0], mu=comp1["mu"], loc=0, scale=comp1["scale"] + ) - mu_slope = pca_fit['mu_fit'].slope - mu_intercept = pca_fit['mu_fit'].intercept + mu_slope = pca_fit["mu_fit"].slope + mu_intercept = pca_fit["mu_fit"].intercept mu_zeroline = mu_slope * comp_zeroline[:, 0] + mu_intercept - sigma_polynomial_coeffcients = pca_fit['sigma_fit'].x - sigma_zeroline = np.polyval( - sigma_polynomial_coeffcients, comp_zeroline[:, 0]) - c2_zeroline_prob = stats.norm.cdf(comp_zeroline[:, 1], - loc=mu_zeroline, scale=sigma_zeroline) + sigma_polynomial_coeffcients = pca_fit["sigma_fit"].x + sigma_zeroline = np.polyval(sigma_polynomial_coeffcients, comp_zeroline[:, 0]) + c2_zeroline_prob = stats.norm.cdf( + comp_zeroline[:, 1], loc=mu_zeroline, scale=sigma_zeroline + ) c1_normzeroline = stats.norm.ppf(c1_zeroline_prob, 0, 1) c2_normzeroline = stats.norm.ppf(c2_zeroline_prob, 0, 1) return_periods = np.asarray(return_periods) - contour_probs = 1 / (365*24*60*60/sea_state_duration * return_periods) + contour_probs = 1 / (365 * 24 * 60 * 60 / sea_state_duration * return_periods) # Reliability contour generation # 
Calculate reliability @@ -1686,12 +1851,11 @@ def samples_full_seastate(x1, x2, points_per_interval, return_periods, # Transform to polar coordinates theta_zeroline = np.arctan2(c2_normzeroline, c1_normzeroline) rho_zeroline = np.sqrt(c1_normzeroline**2 + c2_normzeroline**2) - theta_zeroline[theta_zeroline < 0] = theta_zeroline[ - theta_zeroline < 0] + 2 * np.pi + theta_zeroline[theta_zeroline < 0] = theta_zeroline[theta_zeroline < 0] + 2 * np.pi sample_alpha, sample_beta, weight_points = _generate_sample_data( - beta_lines, rho_zeroline, theta_zeroline, points_per_interval, - contour_probs) + beta_lines, rho_zeroline, theta_zeroline, points_per_interval, contour_probs + ) # Sample transformation to principal component space sample_u1 = sample_beta * np.cos(sample_alpha) @@ -1699,19 +1863,22 @@ def samples_full_seastate(x1, x2, points_per_interval, return_periods, comp1_sample = stats.invgauss.ppf( stats.norm.cdf(sample_u1, loc=0, scale=1), - mu=comp1['mu'], loc=0, scale=comp1['scale']) + mu=comp1["mu"], + loc=0, + scale=comp1["scale"], + ) mu_sample = mu_slope * comp1_sample + mu_intercept # Calculate sigma values at each point on the circle sigma_sample = np.polyval(sigma_polynomial_coeffcients, comp1_sample) # Use calculated mu and sigma values to calculate C2 along the contour - comp2_sample = stats.norm.ppf(stats.norm.cdf(sample_u2, loc=0, scale=1), - loc=mu_sample, scale=sigma_sample) + comp2_sample = stats.norm.ppf( + stats.norm.cdf(sample_u2, loc=0, scale=1), loc=mu_sample, scale=sigma_sample + ) # Sample transformation into Hs-T space - h_sample, t_sample = _princomp_inv( - comp1_sample, comp2_sample, coeff, shift) + h_sample, t_sample = _princomp_inv(comp1_sample, comp2_sample, coeff, shift) return h_sample, t_sample, weight_points @@ -1723,65 +1890,63 @@ def samples_contour(t_samples, t_contour, hs_contour): Parameters ---------- - t_samples : np.array + t_samples : list, np.ndarray, pd.Series, xr.DataArray Points for sampling along return contour - 
t_contour : np.array + t_contour : list, np.ndarray, pd.Series, xr.DataArray T values along contour - hs_contour : np.array + hs_contour : list, np.ndarray, pd.Series, xr.DataArray Hs values along contour Returns ------- - hs_samples : nparray + hs_samples : np.ndarray points sampled along return contour """ - assert isinstance( - t_samples, np.ndarray), 't_samples must be of type np.ndarray' - assert isinstance( - t_contour, np.ndarray), 't_contour must be of type np.ndarray' - assert isinstance( - hs_contour, np.ndarray), 'hs_contour must be of type np.ndarray' - - #finds minimum and maximum energy period values + t_samples = to_numeric_array(t_samples, "t_samples") + t_contour = to_numeric_array(t_contour, "t_contour") + hs_contour = to_numeric_array(hs_contour, "hs_contour") + + # finds minimum and maximum energy period values amin = np.argmin(t_contour) amax = np.argmax(t_contour) aamin = np.min([amin, amax]) aamax = np.max([amin, amax]) - #finds points along the contour + # finds points along the contour w1 = hs_contour[aamin:aamax] w2 = np.concatenate((hs_contour[aamax:], hs_contour[:aamin])) - if (np.max(w1) > np.max(w2)): + if np.max(w1) > np.max(w2): x1 = t_contour[aamin:aamax] y1 = hs_contour[aamin:aamax] else: x1 = np.concatenate((t_contour[aamax:], t_contour[:aamin])) y1 = np.concatenate((hs_contour[aamax:], hs_contour[:aamin])) - #sorts data based on the max and min energy period values + # sorts data based on the max and min energy period values ms = np.argsort(x1) x = x1[ms] y = y1[ms] - #interpolates the sorted data + # interpolates the sorted data si = interp.interp1d(x, y) - #finds the wave height based on the user specified energy period values + # finds the wave height based on the user specified energy period values hs_samples = si(t_samples) return hs_samples -def _generate_sample_data(beta_lines, rho_zeroline, theta_zeroline, - points_per_interval, contour_probs): +def _generate_sample_data( + beta_lines, rho_zeroline, theta_zeroline, 
points_per_interval, contour_probs +): """ Calculate radius, angle, and weight for each sample point Parameters ---------- - beta_lines: np.array + beta_lines: list, np.ndarray, pd.Series, xr.DataArray Array of mu fitting function parameters. - rho_zeroline: np.array + rho_zeroline: list, np.ndarray, pd.Series, xr.DataArray Array of radii - theta_zeroline: np.array + theta_zeroline: list, np.ndarray, pd.Series, xr.DataArray points_per_interval: int - contour_probs: np.array + contour_probs: list, np.ndarray, pd.Series, xr.DataArray Returns ------- @@ -1792,16 +1957,14 @@ def _generate_sample_data(beta_lines, rho_zeroline, theta_zeroline, weight_points: np.array Array of weights for each point. """ - assert isinstance( - beta_lines, np.ndarray), 'beta_lines must be of type np.ndarray' - assert isinstance( - rho_zeroline, np.ndarray), 'rho_zeroline must be of type np.ndarray' - assert isinstance(theta_zeroline, np.ndarray - ), 'theta_zeroline must be of type np.ndarray' - assert isinstance(points_per_interval, int - ), 'points_per_interval must be of type int' - assert isinstance( - contour_probs, np.ndarray), 'contour_probs must be of type np.ndarray' + beta_lines = to_numeric_array(beta_lines, "beta_lines") + rho_zeroline = to_numeric_array(rho_zeroline, "rho_zeroline") + theta_zeroline = to_numeric_array(theta_zeroline, "theta_zeroline") + contour_probs = to_numeric_array(contour_probs, "contour_probs") + if not isinstance(points_per_interval, int): + raise TypeError( + f"points_per_interval must be of type int. 
Got: {type(points_per_interval)}" + ) num_samples = (len(beta_lines) - 1) * points_per_interval alpha_bounds = np.zeros((len(beta_lines) - 1, 2)) @@ -1822,8 +1985,10 @@ def _generate_sample_data(beta_lines, rho_zeroline, theta_zeroline, left = np.amin(np.where(r < 0)) right = np.amax(np.where(r < 0)) # Save sampling bounds - alpha_bounds[i, :] = (theta_zeroline[left], theta_zeroline[right] - - 2 * np.pi) + alpha_bounds[i, :] = ( + theta_zeroline[left], + theta_zeroline[right] - 2 * np.pi, + ) else: alpha_bounds[i, :] = np.array((0, 2 * np.pi)) # Find the angular distance that will be covered by sampling the disc @@ -1834,23 +1999,27 @@ def _generate_sample_data(beta_lines, rho_zeroline, theta_zeroline, # areas to be sampled alpha[i, :] = np.arange( min(alpha_bounds[i]), - max(alpha_bounds[i]) + 0.1, angular_dist[i] / points_per_interval) + max(alpha_bounds[i]) + 0.1, + angular_dist[i] / points_per_interval, + ) # Calculate the weight of each point sampled per contour - weight[i] = ((contour_probs[i] - contour_probs[i + 1]) * - angular_ratio[i] / points_per_interval) + weight[i] = ( + (contour_probs[i] - contour_probs[i + 1]) + * angular_ratio[i] + / points_per_interval + ) for j in range(points_per_interval): # Generate sample radius by adding a randomly sampled distance to # the 'disc' lower bound - sample_beta[(i) * points_per_interval + j] = ( - beta_lines[i] + - np.random.random_sample() * (beta_lines[i + 1] - beta_lines[i]) - ) + sample_beta[(i) * points_per_interval + j] = beta_lines[ + i + ] + np.random.random_sample() * (beta_lines[i + 1] - beta_lines[i]) # Generate sample angle by adding a randomly sampled distance to # the lower bound of the angle defining a discrete portion of the # 'disc' - sample_alpha[(i) * points_per_interval + j] = ( - alpha[i, j] + - np.random.random_sample() * (alpha[i, j + 1] - alpha[i, j])) + sample_alpha[(i) * points_per_interval + j] = alpha[ + i, j + ] + np.random.random_sample() * (alpha[i, j + 1] - alpha[i, j]) # Save the 
weight for each sample point weight_points[i * points_per_interval + j] = weight[i] @@ -1880,20 +2049,28 @@ def _princomp_inv(princip_data1, princip_data2, coeff, shift): original2: np.array T values following rotation from principal component space. """ - assert isinstance( - princip_data1, np.ndarray), 'princip_data1 must be of type np.ndarray' - assert isinstance( - princip_data2, np.ndarray), 'princip_data2 must be of type np.ndarray' - assert isinstance(coeff, np.ndarray), 'coeff must be of type np.ndarray' - assert isinstance(shift, float), 'float must be of type float' + if not isinstance(princip_data1, np.ndarray): + raise TypeError( + f"princip_data1 must be of type np.ndarray. Got: {type(princip_data1)}" + ) + if not isinstance(princip_data2, np.ndarray): + raise TypeError( + f"princip_data2 must be of type np.ndarray. Got: {type(princip_data2)}" + ) + if not isinstance(coeff, np.ndarray): + raise TypeError(f"coeff must be of type np.ndarray. Got: {type(coeff)}") + if not isinstance(shift, float): + raise TypeError(f"shift must be of type float. 
Got: {type(shift)}") original1 = np.zeros(len(princip_data1)) original2 = np.zeros(len(princip_data1)) for i in range(len(princip_data2)): - original1[i] = (((coeff[0, 1] * (princip_data2[i] - shift)) + - (coeff[0, 0] * princip_data1[i])) / (coeff[0, 1]**2 + - coeff[0, 0]**2)) - original2[i] = (((coeff[0, 1] * princip_data1[i]) - - (coeff[0, 0] * (princip_data2[i] - shift))) / - (coeff[0, 1]**2 + coeff[0, 0]**2)) + original1[i] = ( + (coeff[0, 1] * (princip_data2[i] - shift)) + + (coeff[0, 0] * princip_data1[i]) + ) / (coeff[0, 1] ** 2 + coeff[0, 0] ** 2) + original2[i] = ( + (coeff[0, 1] * princip_data1[i]) + - (coeff[0, 0] * (princip_data2[i] - shift)) + ) / (coeff[0, 1] ** 2 + coeff[0, 0] ** 2) return original1, original2 diff --git a/mhkit/wave/graphics.py b/mhkit/wave/graphics.py index afb24016a..ba8e536ff 100644 --- a/mhkit/wave/graphics.py +++ b/mhkit/wave/graphics.py @@ -1,6 +1,6 @@ - from mhkit.river.resource import exceedance_probability from mhkit.river.graphics import _xy_plot +from mhkit.utils import convert_to_dataset import matplotlib.patheffects as pe import matplotlib.pyplot as plt from matplotlib import gridspec @@ -17,7 +17,7 @@ def plot_spectrum(S, ax=None): Parameters ------------ - S: pandas DataFrame + S: pandas Series, pandas DataFrame, xarray DataArray, or xarray Dataset Spectral density [m^2/Hz] indexed frequency [Hz] ax : matplotlib axes object Axes for plotting. If None, then a new figure is created. 
@@ -26,12 +26,19 @@ def plot_spectrum(S, ax=None): --------- ax : matplotlib pyplot axes """ - assert isinstance(S, pd.DataFrame), 'S must be of type pd.DataFrame' - - f = S.index - for key in S.keys(): - ax = _xy_plot(f*2*np.pi, S[key]/(2*np.pi), fmt='-', xlabel='omega [rad/s]', - ylabel='Spectral density [m$^2$s/rad]', ax=ax) + S = convert_to_dataset(S) + + frequency_dimension = list(S.dims)[0] + f = S[frequency_dimension] + for var in S.data_vars: + ax = _xy_plot( + f * 2 * np.pi, + S[var] / (2 * np.pi), + fmt="-", + xlabel="omega [rad/s]", + ylabel="Spectral density [m$^2$s/rad]", + ax=ax, + ) return ax @@ -42,7 +49,7 @@ def plot_elevation_timeseries(eta, ax=None): Parameters ---------- - eta: pandas DataFrame + eta: pandas Series, pandas DataFrame, xarray DataArray, or xarray Dataset Wave surface elevation [m] indexed by time [datetime or s] ax : matplotlib axes object Axes for plotting. If None, then a new figure is created. @@ -51,30 +58,24 @@ def plot_elevation_timeseries(eta, ax=None): ------- ax : matplotlib pyplot axes """ + eta = convert_to_dataset(eta) - assert isinstance(eta, pd.DataFrame), 'eta must be of type pd.DataFrame' + time_dimension = list(eta.dims)[0] + t = eta[time_dimension] - for key in eta.keys(): - ax = _xy_plot(eta.index, eta[key], fmt='-', xlabel='Time', - ylabel='$\eta$ [m]', ax=ax) + for var in eta.data_vars: + ax = _xy_plot(t, eta[var], fmt="-", xlabel="Time", ylabel="$\eta$ [m]", ax=ax) return ax -def plot_matrix( - M, - xlabel='Te', - ylabel='Hm0', - zlabel=None, - show_values=True, - ax=None - ): +def plot_matrix(M, xlabel="Te", ylabel="Hm0", zlabel=None, show_values=True, ax=None): """ Plots values in the matrix as a scatter diagram Parameters ------------ - M: pandas DataFrame + M: pandas Series, pandas DataFrame, xarray DataArray Matrix with numeric labels for x and y axis, and numeric entries. An example would be the average capture length matrix generated by mhkit.device.wave, or something similar. 
@@ -93,13 +94,18 @@ def plot_matrix( ax : matplotlib pyplot axes """ - assert isinstance(M, pd.DataFrame), 'M must be of type pd.DataFrame' + try: + M = pd.DataFrame(M) + except: + pass + if not isinstance(M, pd.DataFrame): + raise TypeError(f"M must be of type pd.DataFrame. Got: {type(M)}") if ax is None: plt.figure() ax = plt.gca() - im = ax.imshow(M, origin='lower', aspect='auto') + im = ax.imshow(M, origin="lower", aspect="auto") # Add colorbar cbar = plt.colorbar(im) @@ -114,8 +120,10 @@ def plot_matrix( if show_values: for i, col in enumerate(M.columns): for j, index in enumerate(M.index): - if not np.isnan(M.loc[index,col]): - ax.text(i, j, format(M.loc[index,col], '.2f'), ha="center", va="center") + if not np.isnan(M.loc[index, col]): + ax.text( + i, j, format(M.loc[index, col], ".2f"), ha="center", va="center" + ) # Reset x and y ticks ax.set_xticks(np.arange(len(M.columns))) @@ -162,11 +170,11 @@ def plot_chakrabarti(H, lambda_w, D, ax=None): Parameters ---------- - H: float or numpy array or pandas Series + H: int, float, numpy array, pandas Series, or xarray DataArray Wave height [m] - lambda_w: float or numpy array or pandas Series + lambda_w: int, float, numpy array, pandas Series, or xarray DataArray Wave length [m] - D: float or numpy array or pandas Series + D: int, float, numpy array, pandas Series, or xarray DataArray Characteristic length [m] ax : matplotlib axes object (optional) Axes for plotting. If None, then a new figure is created. 
@@ -175,46 +183,57 @@ def plot_chakrabarti(H, lambda_w, D, ax=None): ------- ax : matplotlib pyplot axes """ - assert isinstance(H, (np.ndarray, float, int, np.int64,pd.Series)), \ - 'H must be a real numeric type' - assert isinstance(lambda_w, (np.ndarray, float, int, np.int64,pd.Series)), \ - 'lambda_w must be a real numeric type' - assert isinstance(D, (np.ndarray, float, int, np.int64,pd.Series)), \ - 'D must be a real numeric type' - - if any([(isinstance(H, np.ndarray) or isinstance(H, pd.Series)), \ - (isinstance(lambda_w, np.ndarray) or isinstance(H, pd.Series)), \ - (isinstance(D, np.ndarray) or isinstance(H, pd.Series))\ - ]): - errMsg = 'D, H, and lambda_w must be same shape' + if not isinstance(H, (np.ndarray, float, int, np.int64, pd.Series, xr.DataArray)): + raise TypeError( + f"H must be of type float, int, np.int64, np.ndarray, pd.Series, or xr.DataArray. Got: {type(H)}" + ) + if not isinstance( + lambda_w, (np.ndarray, float, int, np.int64, pd.Series, xr.DataArray) + ): + raise TypeError( + f"lambda_w must be of type float, int, np.int64, np.ndarray, pd.Series, or xr.DataArray. Got: {type(lambda_w)}" + ) + if not isinstance(D, (np.ndarray, float, int, np.int64, pd.Series, xr.DataArray)): + raise TypeError( + f"D must be of type float, int, np.int64, np.ndarray, pd.Series, or xr.DataArray. 
Got: {type(D)}" + ) + + if any( + [ + isinstance(H, (np.ndarray, pd.Series, xr.DataArray)), + isinstance(lambda_w, (np.ndarray, pd.Series, xr.DataArray)), + isinstance(D, (np.ndarray, pd.Series, xr.DataArray)), + ] + ): n_H = H.squeeze().shape n_lambda_w = lambda_w.squeeze().shape n_D = D.squeeze().shape - assert n_H == n_lambda_w and n_H == n_D, errMsg + if not (n_H == n_lambda_w and n_H == n_D): + raise ValueError("D, H, and lambda_w must be same shape") if isinstance(H, np.ndarray): - mvals = pd.DataFrame(H.reshape(len(H),1), columns=['H']) - mvals['lambda_w'] = lambda_w - mvals['D'] = D - elif isinstance(H, pd.Series): + mvals = pd.DataFrame(H.reshape(len(H), 1), columns=["H"]) + mvals["lambda_w"] = lambda_w + mvals["D"] = D + elif isinstance(H, (pd.Series, xr.DataArray)): mvals = pd.DataFrame(H) - mvals['lambda_w'] = lambda_w - mvals['D'] = D + mvals["lambda_w"] = lambda_w + mvals["D"] = D else: H = np.array([H]) lambda_w = np.array([lambda_w]) D = np.array([D]) - mvals = pd.DataFrame(H.reshape(len(H),1), columns=['H']) - mvals['lambda_w'] = lambda_w - mvals['D'] = D + mvals = pd.DataFrame(H.reshape(len(H), 1), columns=["H"]) + mvals["lambda_w"] = lambda_w + mvals["D"] = D if ax is None: plt.figure() ax = plt.gca() - ax.set_xscale('log') - ax.set_yscale('log') + ax.set_xscale("log") + ax.set_yscale("log") for index, row in mvals.iterrows(): H = row.H @@ -222,103 +241,140 @@ def plot_chakrabarti(H, lambda_w, D, ax=None): lambda_w = row.lambda_w KC = H / D - Diffraction = np.pi*D / lambda_w - label = f'$H$ = {H:g}, $\lambda_w$ = {lambda_w:g}, $D$ = {D:g}' - ax.plot(Diffraction, KC, 'o', label=label) - - if np.any(KC>=10 or KC<=.02) or np.any(Diffraction>=50) or \ - np.any(lambda_w >= 1000) : - ax.autoscale(enable=True, axis='both', tight=True) + Diffraction = np.pi * D / lambda_w + label = f"$H$ = {H:g}, $\lambda_w$ = {lambda_w:g}, $D$ = {D:g}" + ax.plot(Diffraction, KC, "o", label=label) + + if ( + np.any(KC >= 10 or KC <= 0.02) + or np.any(Diffraction >= 50) + 
or np.any(lambda_w >= 1000) + ): + ax.autoscale(enable=True, axis="both", tight=True) else: ax.set_xlim((0.01, 10)) ax.set_ylim((0.01, 50)) graphScale = list(ax.get_xlim()) - if graphScale[0] >= .01: - graphScale[0] =.01 + if graphScale[0] >= 0.01: + graphScale[0] = 0.01 # deep water breaking limit (H/lambda_w = 0.14) - x = np.logspace(1,np.log10(graphScale[0]), 2) + x = np.logspace(1, np.log10(graphScale[0]), 2) y_breaking = 0.14 * np.pi / x - ax.plot(x, y_breaking, 'k-') + ax.plot(x, y_breaking, "k-") graphScale = list(ax.get_xlim()) - ax.text(1, 7, - 'wave\nbreaking\n$H/\lambda_w > 0.14$', - ha='center', va='center', fontstyle='italic', - fontsize='small',clip_on='True') + ax.text( + 1, + 7, + "wave\nbreaking\n$H/\lambda_w > 0.14$", + ha="center", + va="center", + fontstyle="italic", + fontsize="small", + clip_on="True", + ) # upper bound of low drag region ldv = 20 - y_small_drag = 20*np.ones_like(graphScale) + y_small_drag = 20 * np.ones_like(graphScale) graphScale[1] = 0.14 * np.pi / ldv - ax.plot(graphScale, y_small_drag,'k--') - ax.text(0.0125, 30, - 'drag', - ha='center', va='top', fontstyle='italic', - fontsize='small',clip_on='True') + ax.plot(graphScale, y_small_drag, "k--") + ax.text( + 0.0125, + 30, + "drag", + ha="center", + va="top", + fontstyle="italic", + fontsize="small", + clip_on="True", + ) # upper bound of small drag region sdv = 1.5 - y_small_drag = sdv*np.ones_like(graphScale) + y_small_drag = sdv * np.ones_like(graphScale) graphScale[1] = 0.14 * np.pi / sdv - ax.plot(graphScale, y_small_drag,'k--') - ax.text(0.02, 7, - 'inertia \n& drag', - ha='center', va='center', fontstyle='italic', - fontsize='small',clip_on='True') + ax.plot(graphScale, y_small_drag, "k--") + ax.text( + 0.02, + 7, + "inertia \n& drag", + ha="center", + va="center", + fontstyle="italic", + fontsize="small", + clip_on="True", + ) # upper bound of negligible drag region ndv = 0.25 graphScale[1] = 0.14 * np.pi / ndv - y_small_drag = ndv*np.ones_like(graphScale) - 
ax.plot(graphScale, y_small_drag,'k--') - ax.text(8e-2, 0.7, - 'large\ninertia', - ha='center', va='center', fontstyle='italic', - fontsize='small',clip_on='True') - - - ax.text(8e-2, 6e-2, - 'all\ninertia', - ha='center', va='center', fontstyle='italic', - fontsize='small', clip_on='True') + y_small_drag = ndv * np.ones_like(graphScale) + ax.plot(graphScale, y_small_drag, "k--") + ax.text( + 8e-2, + 0.7, + "large\ninertia", + ha="center", + va="center", + fontstyle="italic", + fontsize="small", + clip_on="True", + ) + + ax.text( + 8e-2, + 6e-2, + "all\ninertia", + ha="center", + va="center", + fontstyle="italic", + fontsize="small", + clip_on="True", + ) # left bound of diffraction region drv = 0.5 graphScale = list(ax.get_ylim()) graphScale[1] = 0.14 * np.pi / drv - x_diff_reg = drv*np.ones_like(graphScale) - ax.plot(x_diff_reg, graphScale, 'k--') - ax.text(2, 6e-2, - 'diffraction', - ha='center', va='center', fontstyle='italic', - fontsize='small',clip_on='True') - + x_diff_reg = drv * np.ones_like(graphScale) + ax.plot(x_diff_reg, graphScale, "k--") + ax.text( + 2, + 6e-2, + "diffraction", + ha="center", + va="center", + fontstyle="italic", + fontsize="small", + clip_on="True", + ) if index > 0: - ax.legend(fontsize='xx-small', ncol=2) + ax.legend(fontsize="xx-small", ncol=2) - ax.set_xlabel('Diffraction parameter, $\\frac{\\pi D}{\\lambda_w}$') - ax.set_ylabel('KC parameter, $\\frac{H}{D}$') + ax.set_xlabel("Diffraction parameter, $\\frac{\\pi D}{\\lambda_w}$") + ax.set_ylabel("KC parameter, $\\frac{H}{D}$") plt.tight_layout() def plot_environmental_contour(x1, x2, x1_contour, x2_contour, **kwargs): - ''' + """ Plots an overlay of the x1 and x2 variables to the calculate environmental contours. 
- + Parameters ---------- - x1: numpy array + x1: list, np.ndarray, pd.Series, xr.DataArray x-axis data - x2: numpy array + x2: list, np.ndarray, pd.Series, xr.DataArray x-axis data - x1_contour: numpy array or list + x1_contour: list, np.ndarray, pd.Series, xr.DataArray Calculated x1 contour values - x2_contour: numpy array or list + x2_contour: list, np.ndarray, pd.Series, xr.DataArray Calculated x2 contour values **kwargs : optional x_label: string (optional) @@ -336,74 +392,105 @@ def plot_environmental_contour(x1, x2, x1_contour, x2_contour, **kwargs): Default None. markers: string string or list of strings to use as marker types - + Returns ------- ax : matplotlib pyplot axes - ''' - try: x1 = x1.values - except: pass - try: x2 = x2.values - except: pass - assert isinstance(x1, np.ndarray), 'x1 must be of type np.ndarray' - assert isinstance(x2, np.ndarray), 'x2 must be of type np.ndarray' - assert isinstance(x1_contour, (np.ndarray,list)), ('x1_contour must be of ' - 'type np.ndarray or list') - assert isinstance(x2_contour, (np.ndarray,list)), ('x2_contour must be of ' - 'type np.ndarray or list') + """ + try: + x1 = x1.values + except: + pass + try: + x2 = x2.values + except: + pass + if not isinstance(x1, np.ndarray): + raise TypeError(f"x1 must be of type np.ndarray. Got: {type(x1)}") + if not isinstance(x2, np.ndarray): + raise TypeError(f"x2 must be of type np.ndarray. Got: {type(x2)}") + try: + x1_contour = x1_contour.values + except: + pass + try: + x2_contour = x2_contour.values + except: + pass + if not isinstance(x1_contour, (np.ndarray, list)): + raise TypeError( + f"x1_contour must be of type np.ndarray or list. Got: {type(x1_contour)}" + ) + if not isinstance(x2_contour, (np.ndarray, list)): + raise TypeError( + f"x2_contour must be of type np.ndarray or list. 
Got: {type(x2_contour)}" + ) + x_label = kwargs.get("x_label", None) y_label = kwargs.get("y_label", None) - data_label=kwargs.get("data_label", None) - contour_label=kwargs.get("contour_label", None) - ax=kwargs.get("ax", None) - markers=kwargs.get("markers", '-') - assert isinstance(data_label, (str,type(None))), 'data_label must be of type str' - assert isinstance(contour_label, (str,list, type(None))), ('contour_label be of ' - 'type str') - - if isinstance(markers, list): - assert all( [isinstance(marker, (str)) for marker in markers] ) - elif isinstance(markers, str): - markers=[markers] - assert all( [isinstance(marker, (str)) for marker in markers] ) - else: - assert isinstance(markers, (str,list)), ('markers must be of type str or list of strings') + data_label = kwargs.get("data_label", None) + contour_label = kwargs.get("contour_label", None) + ax = kwargs.get("ax", None) + markers = kwargs.get("markers", "-") + if not isinstance(data_label, (str, type(None))): + raise TypeError( + f"If specified, data_label must be of type str. Got: {type(data_label)}" + ) + if not isinstance(contour_label, (str, list, type(None))): + raise TypeError( + f"If specified, contour_label be of type str. Got: {type(contour_label)}" + ) - assert len(x2_contour) == len(x1_contour), ('contour must be of' - f'equal dimesion got {len(x2_contour)} and {len(x1_contour)}') + if isinstance(markers, str): + markers = [markers] + if not isinstance(markers, list) or not all( + [isinstance(marker, (str)) for marker in markers] + ): + raise TypeError( + f"markers must be of type str or list of strings. 
Got: {markers}" + ) + if not len(x2_contour) == len(x1_contour): + raise ValueError( + f"contour must be of equal dimension got {len(x2_contour)} and {len(x1_contour)}" + ) if isinstance(x1_contour, np.ndarray): - N_contours=1 - x2_contour = [x2_contour] + N_contours = 1 + x2_contour = [x2_contour] x1_contour = [x1_contour] elif isinstance(x1_contour, list): - N_contours=len(x1_contour) + N_contours = len(x1_contour) if contour_label != None: if isinstance(contour_label, str): contour_label = [contour_label] N_c_labels = len(contour_label) - assert N_c_labels == N_contours, ('If specified, the ' - 'number of contour lables must be equal to number the ' - f'number of contour years. Got {N_c_labels} and {N_contours}') + if not N_c_labels == N_contours: + raise ValueError( + "If specified, the number of contour labels must" + " be equal to number the number of contour years." + f" Got: {N_c_labels} and {N_contours}" + ) else: contour_label = [None] * N_contours - if len(markers)==1: - markers=markers*N_contours - assert len(markers) == N_contours, ('Markers must be same length' - f'as N contours specified. Got: {len(markers)} and {len(x1_contour)}') + if len(markers) == 1: + markers = markers * N_contours + if not len(markers) == N_contours: + raise ValueError( + "Markers must be same length as N contours specified." 
+ f"Got: {len(markers)} and {len(x1_contour)}" + ) for i in range(N_contours): contour1 = np.array(x1_contour[i]).T contour2 = np.array(x2_contour[i]).T - ax = _xy_plot(contour1, contour2, markers[i], - label=contour_label[i], ax=ax) + ax = _xy_plot(contour1, contour2, markers[i], label=contour_label[i], ax=ax) - plt.plot(x1, x2, 'bo', alpha=0.1, label=data_label) + plt.plot(x1, x2, "bo", alpha=0.1, label=data_label) - plt.legend(loc='lower right') + plt.legend(loc="lower right") plt.xlabel(x_label) plt.ylabel(y_label) plt.tight_layout() @@ -411,16 +498,16 @@ def plot_environmental_contour(x1, x2, x1_contour, x2_contour, **kwargs): def plot_avg_annual_energy_matrix( - Hm0, - Te, - J, - time_index=None, - Hm0_bin_size=None, - Te_bin_size=None, - Hm0_edges=None, - Te_edges=None - ): - ''' + Hm0, + Te, + J, + time_index=None, + Hm0_bin_size=None, + Te_bin_size=None, + Hm0_edges=None, + Te_edges=None, +): + """ Creates an average annual energy matrix with frequency of occurance. Parameters @@ -446,51 +533,53 @@ def plot_avg_annual_energy_matrix( ------- fig: Figure Average annual energy table plot - ''' + """ fig = plt.figure() if isinstance(time_index, type(None)): data = pd.DataFrame(dict(Hm0=Hm0, Te=Te, J=J)) else: - data= pd.DataFrame(dict(Hm0=Hm0, Te=Te, J=J), index=time_index) - years=data.index.year.unique() + data = pd.DataFrame(dict(Hm0=Hm0, Te=Te, J=J), index=time_index) + years = data.index.year.unique() if isinstance(Hm0_edges, type(None)): Hm0_max = data.Hm0.max() - Hm0_edges = np.arange(0,Hm0_max+Hm0_bin_size,Hm0_bin_size) + Hm0_edges = np.arange(0, Hm0_max + Hm0_bin_size, Hm0_bin_size) if isinstance(Te_edges, type(None)): Te_max = data.Te.max() - Te_edges = np.arange(0, Te_max+Te_bin_size,Te_bin_size) + Te_edges = np.arange(0, Te_max + Te_bin_size, Te_bin_size) # Dict for number of hours each sea state occurs - hist_counts={} - hist_J={} + hist_counts = {} + hist_J = {} # Create hist of counts, and weghted by J for each year for year in years: year_data 
= data.loc[str(year)].copy(deep=True) # Get the counts of each bin - counts, xedges, yedges= np.histogram2d( + counts, xedges, yedges = np.histogram2d( year_data.Te, year_data.Hm0, - bins = (Te_edges,Hm0_edges), + bins=(Te_edges, Hm0_edges), ) # Get centers for number of counts plot location - xcenters = xedges[:-1]+ np.diff(xedges) - ycenters = yedges[:-1]+ np.diff(yedges) + xcenters = xedges[:-1] + np.diff(xedges) + ycenters = yedges[:-1] + np.diff(yedges) - year_data['xbins'] = np.digitize(year_data.Te, xcenters) - year_data['ybins'] = np.digitize(year_data.Hm0, ycenters) + year_data["xbins"] = np.digitize(year_data.Te, xcenters) + year_data["ybins"] = np.digitize(year_data.Hm0, ycenters) total_year_J = year_data.J.sum() - H=counts.copy() + H = counts.copy() for i in range(len(xcenters)): for j in range(len(ycenters)): - bin_J = year_data[(year_data.xbins == i) & (year_data.ybins == j)].J.sum() + bin_J = year_data[ + (year_data.xbins == i) & (year_data.ybins == j) + ].J.sum() H[i][j] = bin_J / total_year_J # Save in results dict @@ -498,70 +587,82 @@ def plot_avg_annual_energy_matrix( hist_J[year] = H # Calculate avg annual - avg_annual_counts_hist = sum(hist_counts.values())/len(years) - avg_annual_J_hist = sum(hist_J.values())/len(years) + avg_annual_counts_hist = sum(hist_counts.values()) / len(years) + avg_annual_J_hist = sum(hist_J.values()) / len(years) # Create a mask of non-zero weights to hide from imshow - Hmasked = np.ma.masked_where(~(avg_annual_J_hist>0),avg_annual_J_hist) - plt.imshow(Hmasked.T, interpolation = 'none', vmin = 0.005, origin='lower', aspect='auto', - extent=[xedges[0], xedges[-1], yedges[0], yedges[-1]]) + Hmasked = np.ma.masked_where(~(avg_annual_J_hist > 0), avg_annual_J_hist) + plt.imshow( + Hmasked.T, + interpolation="none", + vmin=0.005, + origin="lower", + aspect="auto", + extent=[xedges[0], xedges[-1], yedges[0], yedges[-1]], + ) # Plot number of counts as text on the hist of annual avg J for xi in range(len(xcenters)): for yi 
in range(len(ycenters)): if avg_annual_counts_hist[xi][yi] != 0: plt.text( - xedges[xi], - yedges[yi], - int(np.ceil(avg_annual_counts_hist[xi][yi])), - fontsize=10, - color='white', - path_effects=[pe.withStroke(linewidth=1, foreground="k")] - ) - plt.xlabel('Wave Energy Period (s)') - plt.ylabel('Significant Wave Height (m)') - - cbar=plt.colorbar() - cbar.set_label('Mean Normalized Annual Energy') + xedges[xi], + yedges[yi], + int(np.ceil(avg_annual_counts_hist[xi][yi])), + fontsize=10, + color="white", + path_effects=[pe.withStroke(linewidth=1, foreground="k")], + ) + plt.xlabel("Wave Energy Period (s)") + plt.ylabel("Significant Wave Height (m)") + + cbar = plt.colorbar() + cbar.set_label("Mean Normalized Annual Energy") plt.tight_layout() return fig def monthly_cumulative_distribution(J): - ''' + """ Creates a cumulative distribution of energy flux as described in IEC TS 62600-101. Parameters ---------- - J: Series + J: pd.Series, xr.DataArray Energy Flux with DateTime index Returns ------- ax: axes Figure of monthly cumulative distribution - ''' - assert isinstance(J, pd.Series), 'J must be of type pd.Series' - cumSum={} - months=J.index.month.unique() + """ + J = pd.Series(J) + cumSum = {} + months = J.index.month.unique() for month in months: - F = exceedance_probability(J[J.index.month==month]) - cumSum[month] = 1-F/100 - cumSum[month].sort_values('F', inplace=True) - plt.figure(figsize=(12,8) ) + F = exceedance_probability(J[J.index.month == month]) + cumSum[month] = 1 - F / 100 + cumSum[month].sort_values("F", inplace=True) + plt.figure(figsize=(12, 8)) for month in months: - plt.semilogx(J.loc[cumSum[month].index], cumSum[month].F, '--', - label=calendar.month_abbr[month]) + plt.semilogx( + J.loc[cumSum[month].index], + cumSum[month].F, + "--", + label=calendar.month_abbr[month], + ) F = exceedance_probability(J) - F.sort_values('F', inplace=True) - ax = plt.semilogx(J.loc[F.index], 1-F['F']/100, 'k-', fillstyle='none', label='All') + 
F.sort_values("F", inplace=True) + ax = plt.semilogx( + J.loc[F.index], 1 - F["F"] / 100, "k-", fillstyle="none", label="All" + ) plt.grid() - plt.xlabel('Energy Flux') - plt.ylabel('Cumulative Distribution') + plt.xlabel("Energy Flux") + plt.ylabel("Cumulative Distribution") plt.legend() return ax @@ -577,11 +678,11 @@ def plot_compendium(Hs, Tp, Dp, buoy_title=None, ax=None): Parameters ---------- - Hs: pandas Series + Hs: pandas Series or xarray DataArray significant wave height - Tp: pandas Series + Tp: pandas Series or xarray DataArray significant wave height - Dp: pandas Series + Dp: pandas Series or xarray DataArray significant wave height buoy_title: string (optional) Buoy title from the CDIP THREDDS Server @@ -592,47 +693,54 @@ def plot_compendium(Hs, Tp, Dp, buoy_title=None, ax=None): ax : matplotlib pyplot axes """ - assert isinstance(Hs, pd.Series), 'Hs must be of type pd.Series' - assert isinstance(Tp, pd.Series), 'Tp must be of type pd.Series' - assert isinstance(Dp, pd.Series), 'Dp must be of type pd.Series' - assert isinstance(buoy_title, (str, type(None))), 'buoy_title must be of type string' + Hs = pd.Series(Hs) + Tp = pd.Series(Tp) + Dp = pd.Series(Dp) + if not isinstance(Hs, pd.Series): + raise TypeError(f"Hs must be of type pd.Series. Got: {type(Hs)}") + if not isinstance(Tp, pd.Series): + raise TypeError(f"Tp must be of type pd.Series. Got: {type(Tp)}") + if not isinstance(Dp, pd.Series): + raise TypeError(f"Dp must be of type pd.Series. Got: {type(Dp)}") + if not isinstance(buoy_title, (str, type(None))): + raise TypeError( + f"If specified, buoy_title must be of type string. 
Got: {type(buoy_title)}" + ) - f, (pHs, pTp, pDp) = plt.subplots(3, 1, sharex=True, figsize=(15,10)) + f, (pHs, pTp, pDp) = plt.subplots(3, 1, sharex=True, figsize=(15, 10)) - pHs.plot(Hs.index,Hs,'b') - pTp.plot(Tp.index,Tp,'b') - pDp.scatter(Dp.index,Dp,color='blue',s=5) + pHs.plot(Hs.index, Hs, "b") + pTp.plot(Tp.index, Tp, "b") + pDp.scatter(Dp.index, Dp, color="blue", s=5) - pHs.tick_params(axis='x', which='major', labelsize=12, top='off') - pHs.set_ylim(0,8) - pHs.tick_params(axis='y', which='major', labelsize=12, right='off') - pHs.set_ylabel('Hs [m]', fontsize=18) - pHs.grid(color='b', linestyle='--') + pHs.tick_params(axis="x", which="major", labelsize=12, top="off") + pHs.set_ylim(0, 8) + pHs.tick_params(axis="y", which="major", labelsize=12, right="off") + pHs.set_ylabel("Hs [m]", fontsize=18) + pHs.grid(color="b", linestyle="--") pHs2 = pHs.twinx() - pHs2.set_ylim(0,25) - pHs2.set_ylabel('Hs [ft]', fontsize=18) - + pHs2.set_ylim(0, 25) + pHs2.set_ylabel("Hs [ft]", fontsize=18) # Peak Period, Tp - pTp.set_ylim(0,28) - pTp.set_ylabel('Tp [s]', fontsize=18) - pTp.grid(color='b', linestyle='--') - + pTp.set_ylim(0, 28) + pTp.set_ylabel("Tp [s]", fontsize=18) + pTp.grid(color="b", linestyle="--") # Direction, Dp - pDp.set_ylim(0,360) - pDp.set_ylabel('Dp [deg]', fontsize=18) - pDp.grid(color='b', linestyle='--') - pDp.set_xlabel('Day', fontsize=18) + pDp.set_ylim(0, 360) + pDp.set_ylabel("Dp [deg]", fontsize=18) + pDp.grid(color="b", linestyle="--") + pDp.set_xlabel("Day", fontsize=18) # Set x-axis tick interval to every 5 days degrees = 70 days = matplotlib.dates.DayLocator(interval=5) - daysFmt = matplotlib.dates.DateFormatter('%Y-%m-%d') + daysFmt = matplotlib.dates.DateFormatter("%Y-%m-%d") plt.gca().xaxis.set_major_locator(days) plt.gca().xaxis.set_major_formatter(daysFmt) - plt.setp( pDp.xaxis.get_majorticklabels(), rotation=degrees ) + plt.setp(pDp.xaxis.get_majorticklabels(), rotation=degrees) # Set Titles month_name_start = 
Hs.index.month_name()[0][:3] @@ -641,7 +749,7 @@ def plot_compendium(Hs, Tp, Dp, buoy_title=None, ax=None): year_end = Hs.index.year[-1] plt.suptitle(buoy_title, fontsize=30) - plt.title(f'{Hs.index[0].date()} to {Hs.index[-1].date()}', fontsize=20) + plt.title(f"{Hs.index[0].date()} to {Hs.index[-1].date()}", fontsize=20) ax = f @@ -658,7 +766,7 @@ def plot_boxplot(Hs, buoy_title=None): Parameters ------------ - data: pandas DataFrame + Hs: pandas Series or xarray DataArray Spectral density [m^2/Hz] indexed frequency [Hz] buoy_title: string (optional) Buoy title from the CDIP THREDDS Server @@ -668,66 +776,82 @@ def plot_boxplot(Hs, buoy_title=None): --------- ax : matplotlib pyplot axes """ - assert isinstance(Hs, pd.Series), 'Hs must be of type pd.Series' - assert isinstance(buoy_title, (str, type(None))), 'buoy_title must be of type string' + Hs = pd.Series(Hs) + if not isinstance(Hs, pd.Series): + raise TypeError(f"Hs must be of type pd.Series. Got: {type(Hs)}") + if not isinstance(buoy_title, (str, type(None))): + raise TypeError( + f"If specified, buoy_title must be of type string. 
Got: {type(buoy_title)}" + ) months = Hs.index.month means = Hs.groupby(months).mean() monthlengths = Hs.groupby(months).count() - fig = plt.figure(figsize=(10,12)) - gs = gridspec.GridSpec(2,1, height_ratios=[4,1]) + fig = plt.figure(figsize=(10, 12)) + gs = gridspec.GridSpec(2, 1, height_ratios=[4, 1]) - boxprops = dict(color='k') - whiskerprops = dict(linestyle='--', color='k') - flierprops = dict(marker='+', color='r',markeredgecolor='r',markerfacecolor='r') - medianprops = dict(linewidth=2.5,color='firebrick') - meanprops = dict(linewidth=2.5, marker='_', markersize=25) + boxprops = dict(color="k") + whiskerprops = dict(linestyle="--", color="k") + flierprops = dict(marker="+", color="r", markeredgecolor="r", markerfacecolor="r") + medianprops = dict(linewidth=2.5, color="firebrick") + meanprops = dict(linewidth=2.5, marker="_", markersize=25) - bp = plt.subplot(gs[0,:]) + bp = plt.subplot(gs[0, :]) Hs_months = Hs.to_frame().groupby(months) - bp = Hs_months.boxplot(subplots=False, boxprops=boxprops, - whiskerprops=whiskerprops, flierprops=flierprops, - medianprops=medianprops, showmeans=True, meanprops=meanprops) + bp = Hs_months.boxplot( + subplots=False, + boxprops=boxprops, + whiskerprops=whiskerprops, + flierprops=flierprops, + medianprops=medianprops, + showmeans=True, + meanprops=meanprops, + ) # Add values of monthly means as text for i, mean in enumerate(means): - bp.annotate(np.round(mean,2), (means.index[i],mean),fontsize=12, - horizontalalignment='center',verticalalignment='bottom', - color='g') + bp.annotate( + np.round(mean, 2), + (means.index[i], mean), + fontsize=12, + horizontalalignment="center", + verticalalignment="bottom", + color="g", + ) # Create a second row of x-axis labels for top subplot newax = bp.twiny() - newax.tick_params(which='major', direction='in', pad=-18) + newax.tick_params(which="major", direction="in", pad=-18) newax.set_xlim(bp.get_xlim()) - newax.xaxis.set_ticks_position('top') - newax.xaxis.set_label_position('top') - 
newax.set_xticks(np.arange(1,13,1)) - newax.set_xticklabels(monthlengths,fontsize=10) - + newax.xaxis.set_ticks_position("top") + newax.xaxis.set_label_position("top") + newax.set_xticks(np.arange(1, 13, 1)) + newax.set_xticklabels(monthlengths, fontsize=10) # Sample 'legend' boxplot, to go underneath actual boxplot - bp_sample2 = np.random.normal(2.5,0.5,500) - bp2 = plt.subplot(gs[1,:]) - meanprops = dict(linewidth=2.5, marker='|', markersize=25) - bp2_example = bp2.boxplot(bp_sample2,vert=False,flierprops=flierprops, - medianprops=medianprops) - sample_mean=2.3 - bp2.scatter(sample_mean,1,marker="|",color='g',linewidths=1.0,s=200) - - for line in bp2_example['medians']: + bp_sample2 = np.random.normal(2.5, 0.5, 500) + bp2 = plt.subplot(gs[1, :]) + meanprops = dict(linewidth=2.5, marker="|", markersize=25) + bp2_example = bp2.boxplot( + bp_sample2, vert=False, flierprops=flierprops, medianprops=medianprops + ) + sample_mean = 2.3 + bp2.scatter(sample_mean, 1, marker="|", color="g", linewidths=1.0, s=200) + + for line in bp2_example["medians"]: xm, ym = line.get_xydata()[0] - for line in bp2_example['boxes']: + for line in bp2_example["boxes"]: xb, yb = line.get_xydata()[0] - for line in bp2_example['whiskers']: + for line in bp2_example["whiskers"]: xw, yw = line.get_xydata()[0] - bp2.annotate("Median",[xm-0.1,ym-0.3*ym],fontsize=10,color='firebrick') - bp2.annotate("Mean",[sample_mean-0.1,0.65],fontsize=10,color='g') - bp2.annotate("25%ile",[xb-0.05*xb,yb-0.15*yb],fontsize=10) - bp2.annotate("75%ile",[xb+0.26*xb,yb-0.15*yb],fontsize=10) - bp2.annotate("Outliers",[xw+0.3*xw,yw-0.3*yw],fontsize=10,color='r') + bp2.annotate("Median", [xm - 0.1, ym - 0.3 * ym], fontsize=10, color="firebrick") + bp2.annotate("Mean", [sample_mean - 0.1, 0.65], fontsize=10, color="g") + bp2.annotate("25%ile", [xb - 0.05 * xb, yb - 0.15 * yb], fontsize=10) + bp2.annotate("75%ile", [xb + 0.26 * xb, yb - 0.15 * yb], fontsize=10) + bp2.annotate("Outliers", [xw + 0.3 * xw, yw - 0.3 * yw], 
fontsize=10, color="r") if buoy_title: plt.suptitle(buoy_title, fontsize=30, y=0.97) @@ -735,14 +859,14 @@ def plot_boxplot(Hs, buoy_title=None): bp2.set_title("Sample Boxplot", fontsize=10, y=1.02) # Set axes labels and ticks - months_text = [ m[:3] for m in Hs.index.month_name().unique()] - bp.set_xticklabels(months_text,fontsize=12) - bp.set_ylabel('Significant Wave Height, Hs (m)', fontsize=14) - bp.tick_params(axis='y', which='major', labelsize=12, right='off') - bp.tick_params(axis='x', which='major', labelsize=12, top='off') + months_text = [m[:3] for m in Hs.index.month_name().unique()] + bp.set_xticklabels(months_text, fontsize=12) + bp.set_ylabel("Significant Wave Height, Hs (m)", fontsize=14) + bp.tick_params(axis="y", which="major", labelsize=12, right="off") + bp.tick_params(axis="x", which="major", labelsize=12, top="off") # Plot horizontal gridlines onto top subplot - bp.grid(axis='x', color='b', linestyle='-', alpha=0.25) + bp.grid(axis="x", color="b", linestyle="-", alpha=0.25) # Remove tickmarks from bottom subplot bp2.axes.get_xaxis().set_visible(False) @@ -754,13 +878,13 @@ def plot_boxplot(Hs, buoy_title=None): def plot_directional_spectrum( - spectrum, - min=None, - fill=True, - nlevels=11, - name="Elevation Variance", - units="m^2" - ): + spectrum, + color_level_min=None, + fill=True, + nlevels=11, + name="Elevation Variance", + units="m^2", +): """ Create a contour polar plot of a directional spectrum. @@ -768,8 +892,8 @@ def plot_directional_spectrum( ------------ spectrum: xarray.DataArray Spectral data indexed frequency [Hz] and wave direction [deg]. - min: float (optional) - Minimum value to plot. + color_level_min: float (optional) + Minimum color bar level. fill: bool Whether to use `contourf` (filled) instead of `contour` (lines). 
nlevels: int @@ -783,27 +907,38 @@ def plot_directional_spectrum( --------- ax : matplotlib pyplot axes """ - assert isinstance(spectrum, xr.DataArray), 'spectrum must be a DataArray' - if min is not None: - assert isinstance(min, float), 'min must be a float' - assert isinstance(fill, bool), 'fill must be a bool' - assert isinstance(nlevels, int), 'nlevels must be an int' - assert isinstance(name, str), 'name must be a string' - assert isinstance(units, str), 'units must be a string' - - a,f = np.meshgrid(np.deg2rad(spectrum.direction), spectrum.frequency) - _, ax = plt.subplots(subplot_kw=dict(projection='polar')) - tmp = np.floor(np.min(spectrum.data)*10)/10 - min = tmp if (min is None) else min - max = np.ceil(np.max(spectrum.data)*10)/10 - levels = np.linspace(min, max, nlevels) + if not isinstance(spectrum, xr.DataArray): + raise TypeError(f"spectrum must be of type xr.DataArray. Got: {type(spectrum)}") + if not isinstance(color_level_min, (type(None), float)): + raise TypeError( + f"If specified, color_level_min must be of type float. Got: {type(color_level_min)}" + ) + if not isinstance(fill, bool): + raise TypeError(f"If specified, fill must be of type bool. Got: {type(fill)}") + if not isinstance(nlevels, int): + raise TypeError( + f"If specified, nlevels must be of type int. Got: {type(nlevels)}" + ) + if not isinstance(name, str): + raise TypeError(f"If specified, name must be of type string. Got: {type(name)}") + if not isinstance(units, str): + raise TypeError( + f"If specified, units must be of type string. 
Got: {type(units)}" + ) + + a, f = np.meshgrid(np.deg2rad(spectrum.direction), spectrum.frequency) + _, ax = plt.subplots(subplot_kw=dict(projection="polar")) + tmp = np.floor(np.min(spectrum.data) * 10) / 10 + color_level_min = tmp if (color_level_min is None) else color_level_min + color_level_max = np.ceil(np.max(spectrum.data) * 10) / 10 + levels = np.linspace(color_level_min, color_level_max, nlevels) if fill: c = ax.contourf(a, f, spectrum, levels=levels) else: c = ax.contour(a, f, spectrum, levels=levels) cbar = plt.colorbar(c) - cbar.set_label(f'Spectrum [{units}/Hz/deg]', rotation=270, labelpad=20) - ax.set_title(f'{name} Spectrum') + cbar.set_label(f"Spectrum [{units}/Hz/deg]", rotation=270, labelpad=20) + ax.set_title(f"{name} Spectrum") ylabels = ax.get_yticklabels() ylabels = [ilabel.get_text() for ilabel in ax.get_yticklabels()] ylabels = [ilabel + "Hz" for ilabel in ylabels] diff --git a/mhkit/wave/io/__init__.py b/mhkit/wave/io/__init__.py index f6ad3f71f..2e966e752 100644 --- a/mhkit/wave/io/__init__.py +++ b/mhkit/wave/io/__init__.py @@ -2,4 +2,4 @@ from mhkit.wave.io import wecsim from mhkit.wave.io import cdip from mhkit.wave.io import swan -from mhkit.wave.io import hindcast \ No newline at end of file +from mhkit.wave.io import hindcast diff --git a/mhkit/wave/io/cdip.py b/mhkit/wave/io/cdip.py index a5cf2451b..5fb6e34f3 100644 --- a/mhkit/wave/io/cdip.py +++ b/mhkit/wave/io/cdip.py @@ -1,323 +1,408 @@ -from datetime import timezone +import os import pandas as pd import numpy as np import datetime import netCDF4 -import time import pytz +from mhkit.utils.cache import handle_caching +from mhkit.utils import convert_nested_dict_and_pandas + def _validate_date(date_text): - ''' + """ Checks date format to ensure YYYY-MM-DD format and return date in datetime format. 
- + Parameters ---------- date_text: string Date string format to check - + Returns ------- dt: datetime - ''' - assert isinstance(date_text, str), (f'date_text must be' / - 'of type string') + """ + + if not isinstance(date_text, str): + raise ValueError("date_text must be of type string. Got: {date_text}") + try: - dt = datetime.datetime.strptime(date_text, '%Y-%m-%d') + dt = datetime.datetime.strptime(date_text, "%Y-%m-%d") except ValueError: raise ValueError("Incorrect data format, should be YYYY-MM-DD") else: - dt = dt.replace(tzinfo=timezone.utc) - + dt = dt.replace(tzinfo=datetime.timezone.utc) + return dt def _start_and_end_of_year(year): - ''' + """ Returns a datetime start and end for a given year - + Parameters ---------- year: int Year to get start and end dates - + Returns ------- start_year: datetime object start of the year end_year: datetime object - end of the year - ''' - - assert isinstance(year, (type(None),int,list)), 'year must be of type int' - + end of the year + """ + + if not isinstance(year, (type(None), int, list)): + raise ValueError("year must be of type int, list, or None. Got: {type(year)}") + try: year = str(year) - start_year = datetime.datetime.strptime(year, '%Y') - except ValueError: - raise ValueError("Incorrect years format, should be YYYY") - else: - next_year = datetime.datetime.strptime(f'{int(year)+1}', '%Y') + start_year = datetime.datetime.strptime(year, "%Y") + except ValueError as exc: + raise ValueError("Incorrect years format, should be YYYY") from exc + else: + next_year = datetime.datetime.strptime(f"{int(year)+1}", "%Y") end_year = next_year - datetime.timedelta(days=1) return start_year, end_year def _dates_to_timestamp(nc, start_date=None, end_date=None): - ''' - Returns timestamps from dates. - + """ + Returns timestamps from dates. 
+ Parameters ---------- nc: netCDF Object - netCDF data for the given station number and data type - start_date: string + netCDF data for the given station number and data type + start_date: string Start date in YYYY-MM-DD, e.g. '2012-04-01' - end_date: string - End date in YYYY-MM-DD, e.g. '2012-04-30' - + end_date: string + End date in YYYY-MM-DD, e.g. '2012-04-30' + Returns ------- start_stamp: float - seconds since the Epoch to start_date + seconds since the Epoch to start_date end_stamp: float seconds since the Epoch to end_date - ''' - - assert isinstance(start_date, (str, type(None))), ('start_date' / - 'must be of type str') - assert isinstance(end_date, (str, type(None))), ('end_date must be' / - 'of type str') - - time_all = nc.variables['waveTime'][:].compressed() - t_i=(datetime.datetime.fromtimestamp(time_all[0]) - .astimezone(pytz.timezone('UTC'))) - t_f=(datetime.datetime.fromtimestamp(time_all[-1]) - .astimezone(pytz.timezone('UTC'))) + """ + + if start_date and not isinstance(start_date, datetime.datetime): + raise ValueError( + f"start_date must be of type datetime.datetime or None. Got: {type(start_date)}" + ) + + if end_date and not isinstance(end_date, datetime.datetime): + raise ValueError( + f"end_date must be of type datetime.datetime or None. 
Got: {type(end_date)}" + ) + + time_all = nc.variables["waveTime"][:].compressed() + t_i = datetime.datetime.fromtimestamp(time_all[0]).astimezone(pytz.timezone("UTC")) + t_f = datetime.datetime.fromtimestamp(time_all[-1]).astimezone(pytz.timezone("UTC")) time_range_all = [t_i, t_f] - - if start_date: - start_datetime = _validate_date(start_date) - if end_date: - end_datetime = _validate_date(end_date) - if start_datetime > end_datetime: - raise Exception(f'start_date ({start_datetime}) must be'+ - f'before end_date ({end_datetime})') - elif start_datetime == end_datetime: - raise Exception(f'start_date ({start_datetime}) cannot be'+ - f'the same as end_date ({end_datetime})') - - def to_timestamp(time): - stamp = (pd.to_datetime(time) - .astimezone(pytz.timezone('UTC')) - .timestamp()) - return stamp - + if start_date: - if start_datetime > time_range_all[0] and start_datetime < time_range_all[1]: - start_stamp = start_datetime.astimezone(pytz.timezone('UTC')).timestamp() + start_date = start_date.astimezone(pytz.UTC) + if start_date > time_range_all[0] and start_date < time_range_all[1]: + start_stamp = start_date.timestamp() else: - print(f'WARNING: Provided start_date ({start_datetime}) is ' - f'not in the returned data range {time_range_all} \n' - f'Setting start_date to the earliest date in range ' - f'{time_range_all[0]}') - start_stamp = to_timestamp(time_range_all[0]) - + print( + f"WARNING: Provided start_date ({start_date}) is " + f"not in the returned data range {time_range_all} \n" + f"Setting start_date to the earliest date in range " + f"{time_range_all[0]}" + ) + start_stamp = time_range_all[0].timestamp() + if end_date: - if end_datetime > time_range_all[0] and end_datetime < time_range_all[1]: - end_stamp = end_datetime.astimezone(pytz.timezone('UTC')).timestamp() + end_date = end_date.astimezone(pytz.UTC) + if end_date > time_range_all[0] and end_date < time_range_all[1]: + end_stamp = end_date.timestamp() else: - print(f'WARNING: Provided 
end_date ({end_datetime}) is ' - f'not in the returned data range {time_range_all} \n' - f'Setting end_date to the latest date in range ' - f'{time_range_all[1]}') - end_stamp = to_timestamp(time_range_all[1]) - - + print( + f"WARNING: Provided end_date ({end_date}) is " + f"not in the returned data range {time_range_all} \n" + f"Setting end_date to the latest date in range " + f"{time_range_all[1]}" + ) + end_stamp = time_range_all[1].timestamp() + if start_date and not end_date: - end_stamp = to_timestamp(time_range_all[1]) + end_stamp = time_range_all[1].timestamp() elif end_date and not start_date: - start_stamp = to_timestamp(time_range_all[0]) - + start_stamp = time_range_all[0].timestamp() + if not start_date: - start_stamp = to_timestamp(time_range_all[0]) + start_stamp = time_range_all[0].timestamp() if not end_date: - end_stamp = to_timestamp(time_range_all[1]) + end_stamp = time_range_all[1].timestamp() + + return start_stamp, end_stamp - return start_stamp, end_stamp - def request_netCDF(station_number, data_type): - ''' + """ Returns historic or realtime data from CDIP THREDDS server - + Parameters ---------- station_number: string CDIP station number of interest data_type: string 'historic' or 'realtime' - + Returns ------- - nc: netCDF Object + nc: xarray Dataset netCDF data for the given station number and data type - ''' - assert isinstance(station_number, str), (f'station_number must be ' + - f'of type string. Got: {station_number}') - assert isinstance(data_type, str), (f'data_type must be' / - 'of type string') - assert data_type in ['historic', 'realtime'], ('data_type must be'\ - f' "historic" or "realtime". 
Got: {data_type}') - if data_type == 'historic': - cdip_archive= 'http://thredds.cdip.ucsd.edu/thredds/dodsC/cdip/archive' - data_url = f'{cdip_archive}/{station_number}p1/{station_number}p1_historic.nc' - elif data_type == 'realtime': - cdip_realtime = 'http://thredds.cdip.ucsd.edu/thredds/dodsC/cdip/realtime' - data_url = f'{cdip_realtime}/{station_number}p1_rt.nc' - + """ + + if not isinstance(station_number, (str, type(None))): + raise ValueError( + f"station_number must be of type string. Got: {type(station_number)}" + ) + + if not isinstance(data_type, str): + raise ValueError(f"data_type must be of type string. Got: {type(data_type)}") + + if data_type not in ["historic", "realtime"]: + raise ValueError('data_type must be "historic" or "realtime". Got: {data_type}') + + BASE_URL = "http://thredds.cdip.ucsd.edu/thredds/dodsC/cdip/" + + if data_type == "historic": + data_url = ( + f"{BASE_URL}archive/{station_number}p1/{station_number}p1_historic.nc" + ) + else: # data_type == 'realtime' + data_url = f"{BASE_URL}realtime/{station_number}p1_rt.nc" + nc = netCDF4.Dataset(data_url) - + return nc - -def request_parse_workflow(nc=None, station_number=None, parameters=None, - years=None, start_date=None, end_date=None, - data_type='historic', all_2D_variables=False): - ''' - Parses a passed CDIP netCDF file or requests a station number - from http://cdip.ucsd.edu/) and parses. This function can return specific + +def request_parse_workflow( + nc=None, + station_number=None, + parameters=None, + years=None, + start_date=None, + end_date=None, + data_type="historic", + all_2D_variables=False, + silent=False, + to_pandas=True, +): + """ + Parses a passed CDIP netCDF file or requests a station number + from http://cdip.ucsd.edu/) and parses. This function can return specific parameters is passed. Years may be non-consecutive e.g. [2001, 2010]. Time may be sliced by dates (start_date or end date in YYYY-MM-DD). 
data_type defaults to historic but may also be set to 'realtime'. By default 2D variables are not parsed if all 2D varaibles are needed. See - the MHKiT CDiP example Jupyter notbook for information on available parameters. - - + the MHKiT CDiP example Jupyter notbook for information on available parameters. + + Parameters ---------- nc: netCDF Object - netCDF data for the given station number and data type. Can be the output of - request_netCDF + netCDF data for the given station number and data type. Can be the output of + request_netCDF station_number: string Station number of CDIP wave buoy - parameters: string or list of stings + parameters: string or list of strings Parameters to return. If None will return all varaibles except - 2D-variables. + 2D-variables. years: int or list of int - Year date, e.g. 2001 or [2001, 2010] - start_date: string + Year date, e.g. 2001 or [2001, 2010] + start_date: string Start date in YYYY-MM-DD, e.g. '2012-04-01' - end_date: string + end_date: string End date in YYYY-MM-DD, e.g. '2012-04-30' data_type: string - Either 'historic' or 'realtime' + Either 'historic' or 'realtime' all_2D_variables: boolean - Will return all 2D data. Enabling this will add significant + Will return all 2D data. Enabling this will add significant processing time. If all 2D variables are not needed it is - recomended to pass 2D parameters of interest using the + recomended to pass 2D parameters of interest using the 'parameters' keyword and leave this set to False. Default False. - + silent: boolean + Set to True to prevent the print statement that announces when 2D + variable processing begins. Default False. + to_pandas: bool (optional) + Flag to output a dictionary of pandas objects instead of a dictionary + of xarray objects. Default = True. 
+ + Returns ------- data: dictionary - 'vars1D': DataFrame - 1D variables indexed by time + 'data': dictionary of variables + 'vars': pandas DataFrame or xarray Dataset + 1D variables indexed by time + 'vars2D': dictionary of DataFrames or Datasets, optional + If 2D-vars are passed in the 'parameters key' or if run + with all_2D_variables=True, then this key will appear + with a dictonary of DataFrames of 2D variables. 'metadata': dictionary Anything not of length time - 'vars2D': dictionary of DataFrames, optional - If 2D-vars are passed in the 'parameters key' or if run - with all_2D_variables=True, then this key will appear - with a dictonary of DataFrames of 2D variables. - ''' - assert isinstance(station_number, (str, type(None))), (f'station_number must be '+ - 'of type string') - assert isinstance(parameters, (str, type(None), list)), ('parameters' / - 'must be of type str or list of strings') - assert isinstance(start_date, (str, type(None))), ('start_date' / - 'must be of type str') - assert isinstance(end_date, (str, type(None))), ('end_date must be' / - 'of type str') - assert isinstance(years, (type(None),int,list)), ('years must be of'/ - 'type int or list of ints') - assert isinstance(data_type, str), (f'data_type must be' / - 'of type string') - assert data_type in ['historic', 'realtime'], 'data_type must be'\ - f' "historic" or "realtime". Got: {data_type}' - - + """ + if not isinstance(station_number, (str, type(None))): + raise TypeError( + f"station_number must be of type string. Got: {type(station_number)}" + ) + + if not isinstance(parameters, (str, type(None), list)): + raise TypeError( + f"parameters must be of type str or list of strings. 
Got: {type(parameters)}" + ) + + if start_date is not None: + if isinstance(start_date, str): + try: + start_date = datetime.datetime.strptime(start_date, "%Y-%m-%d") + start_date = start_date.replace(tzinfo=pytz.UTC) + except ValueError as exc: + raise ValueError("Incorrect data format, should be YYYY-MM-DD") from exc + else: + raise TypeError(f"start_date must be of type str. Got: {type(start_date)}") + + if end_date is not None: + if isinstance(end_date, str): + try: + end_date = datetime.datetime.strptime(end_date, "%Y-%m-%d") + end_date = end_date.replace(tzinfo=pytz.UTC) + except ValueError as exc: + raise ValueError("Incorrect data format, should be YYYY-MM-DD") from exc + else: + raise TypeError(f"end_date must be of type str. Got: {type(end_date)}") + + if not isinstance(years, (type(None), int, list)): + raise TypeError( + f"years must be of type int or list of ints. Got: {type(years)}" + ) + + if not isinstance(data_type, str): + raise TypeError(f"data_type must be of type string. Got: {type(data_type)}") + + if data_type not in ["historic", "realtime"]: + raise ValueError( + f'data_type must be "historic" or "realtime". Got: {data_type}' + ) + if not any([nc, station_number]): - raise Exception('Must provide either a CDIP netCDF file or a station '+ - 'number') - + raise ValueError("Must provide either a CDIP netCDF file or a station number.") + + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. 
Got: {type(to_pandas)}") + if not nc: nc = request_netCDF(station_number, data_type) - - buoy_name = nc.variables['metaStationName'][:].compressed().tobytes().decode("utf-8") - - - multiyear=False + + # Define the path to the cache directory + cache_dir = os.path.join(os.path.expanduser("~"), ".cache", "mhkit", "cdip") + + buoy_name = ( + nc.variables["metaStationName"][:].compressed().tobytes().decode("utf-8") + ) + + multiyear = False if years: - if isinstance(years,int): - start_date = f'{years}-01-01' - end_date = f'{years+1}-01-01' - elif isinstance(years,list): - if len(years)==1: - start_date = f'{years[0]}-01-01' - end_date = f'{years[0]+1}-01-01' + if isinstance(years, int): + start_date = datetime.datetime(years, 1, 1, tzinfo=pytz.UTC) + end_date = datetime.datetime(years + 1, 1, 1, tzinfo=pytz.UTC) + elif isinstance(years, list): + if len(years) == 1: + start_date = datetime.datetime(years[0], 1, 1, tzinfo=pytz.UTC) + end_date = datetime.datetime(years[0] + 1, 1, 1, tzinfo=pytz.UTC) else: - multiyear=True - + multiyear = True if not multiyear: - data = get_netcdf_variables(nc, - start_date=start_date, end_date=end_date, - parameters=parameters, - all_2D_variables=all_2D_variables) - - elif multiyear: - data={'data':{},'metadata':{}} - multiyear_data={} - multiyear_data_2D={} - for year in years: - start_date = f'{year}-01-01' - end_date = f'{year+1}-01-01' - - year_data = get_netcdf_variables(nc, - start_date=start_date, end_date=end_date, - parameters=parameters, - all_2D_variables=all_2D_variables) - multiyear_data[year] = year_data['data'] - - for data_key in year_data['data'].keys(): - if data_key.endswith('2D'): - data['data'][data_key]={} - for data_key2D in year_data['data'][data_key].keys(): - data_list=[] - for year in years: + # Check the cache first + hash_params = f"{station_number}-{parameters}-{start_date}-{end_date}" + data = handle_caching(hash_params, cache_dir) + + if data[:2] == (None, None): + data = get_netcdf_variables( + nc, + 
start_date=start_date, + end_date=end_date, + parameters=parameters, + all_2D_variables=all_2D_variables, + silent=silent, + ) + handle_caching(hash_params, cache_dir, data=data) + else: + data = data[0] + + else: + data = {"data": {}, "metadata": {}} + multiyear_data = {} + for year in years: + start_date = datetime.datetime(year, 1, 1, tzinfo=pytz.UTC) + end_date = datetime.datetime(year + 1, 1, 1, tzinfo=pytz.UTC) + + # Check the cache for each individual year + hash_params = f"{station_number}-{parameters}-{start_date}-{end_date}" + year_data = handle_caching(hash_params, cache_dir) + if year_data[:2] == (None, None): + year_data = get_netcdf_variables( + nc, + start_date=start_date, + end_date=end_date, + parameters=parameters, + all_2D_variables=all_2D_variables, + silent=silent, + ) + # Cache the individual year's data + handle_caching(hash_params, cache_dir, data=year_data) + else: + year_data = year_data[0] + multiyear_data[year] = year_data["data"] + + for data_key in year_data["data"].keys(): + if data_key.endswith("2D"): + data["data"][data_key] = {} + for data_key2D in year_data["data"][data_key].keys(): + data_list = [] + for year in years: data2D = multiyear_data[year][data_key][data_key2D] data_list.append(data2D) - data['data'][data_key][data_key2D]=pd.concat(data_list) - else: + data["data"][data_key][data_key2D] = pd.concat(data_list) + else: data_list = [multiyear_data[year][data_key] for year in years] - data['data'][data_key] = pd.concat(data_list) + data["data"][data_key] = pd.concat(data_list) + if buoy_name: + try: + data.setdefault("metadata", {})["name"] = buoy_name + except: + pass - - - data['metadata'] = year_data['metadata'] - data['metadata']['name'] = buoy_name + if not to_pandas: + data = convert_nested_dict_and_pandas(data) return data - - -def get_netcdf_variables(nc, start_date=None, end_date=None, - parameters=None, all_2D_variables=False): - ''' + + +def get_netcdf_variables( + nc, + start_date=None, + end_date=None, + 
parameters=None, + all_2D_variables=False, + silent=False, + to_pandas=True, +): + """ Iterates over and extracts variables from CDIP bouy data. See - the MHKiT CDiP example Jupyter notbook for information on available - parameters. - - + the MHKiT CDiP example Jupyter notbook for information on available + parameters. + Parameters ---------- nc: netCDF Object @@ -325,152 +410,221 @@ def get_netcdf_variables(nc, start_date=None, end_date=None, start_stamp: float Data of interest start in seconds since epoch end_stamp: float - Data of interest end in seconds since epoch - parameters: string or list of stings + Data of interest end in seconds since epoch + parameters: string or list of strings Parameters to return. If None will return all varaibles except 2D-variables. Default None. all_2D_variables: boolean - Will return all 2D data. Enabling this will add significant + Will return all 2D data. Enabling this will add significant processing time. If all 2D variables are not needed it is - recomended to pass 2D parameters of interest using the + recomended to pass 2D parameters of interest using the 'parameters' keyword and leave this set to False. Default False. + silent: boolean + Set to True to prevent the print statement that announces when 2D + variable processing begins. Default False. + to_pandas: bool (optional) + Flag to output a dictionary of pandas objects instead of a dictionary + of xarray objects. Default = True. + Returns ------- results: dictionary - 'vars1D': DataFrame - 1D variables indexed by time + 'data': dictionary of variables + 'vars': pandas DataFrame or xarray Dataset + 1D variables indexed by time + 'vars2D': dictionary of DataFrames or Datasets, optional + If 2D-vars are passed in the 'parameters key' or if run + with all_2D_variables=True, then this key will appear + with a dictonary of DataFrames/Datasets of 2D variables. 
'metadata': dictionary Anything not of length time - 'vars2D': dictionary of DataFrames, optional - If 2D-vars are passed in the 'parameters key' or if run - with all_2D_variables=True, then this key will appear - with a dictonary of DataFrames of 2D variables. - ''' - - assert isinstance(nc, netCDF4.Dataset), 'nc must be netCDF4 dataset' - assert isinstance(start_date, (str, type(None))), ('start_date' / - 'must be of type str') - assert isinstance(end_date, (str, type(None))), ('end_date must be' / - 'of type str') - assert isinstance(parameters, (str, type(None), list)), ('parameters' / - 'must be of type str or list of strings') - assert isinstance(all_2D_variables, bool), ('all_2D_variables'/ - 'must be a boolean') + """ + + if not isinstance(nc, netCDF4.Dataset): + raise TypeError("nc must be netCDF4 dataset. Got: {type(nc)}") + + if start_date and isinstance(start_date, str): + start_date = datetime.datetime.strptime(start_date, "%Y-%m-%d") + + if end_date and isinstance(end_date, str): + end_date = datetime.datetime.strptime(end_date, "%Y-%m-%d") + + if not isinstance(parameters, (str, type(None), list)): + raise TypeError( + "parameters must be of type str or list of strings. Got: {type(parameters)}" + ) + + if not isinstance(all_2D_variables, bool): + raise TypeError( + "all_2D_variables must be a boolean. Got: {type(all_2D_variables)}" + ) if parameters: - if isinstance(parameters,str): - parameters = [parameters] - assert all([isinstance(param , str) for param in parameters]), ('All'/ - 'elements of parameters must be strings') + if isinstance(parameters, str): + parameters = [parameters] + for param in parameters: + if not isinstance(param, str): + raise TypeError("All elements of parameters must be strings.") + + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. 
Got: {type(to_pandas)}") + buoy_name = ( + nc.variables["metaStationName"][:].compressed().tobytes().decode("utf-8") + ) - buoy_name = nc.variables['metaStationName'][:].compressed().tobytes().decode("utf-8") allVariables = [var for var in nc.variables] - - include_2D_variables=False - twoDimensionalVars = [ 'waveEnergyDensity', 'waveMeanDirection', - 'waveA1Value', 'waveB1Value', 'waveA2Value', - 'waveB2Value', 'waveCheckFactor', 'waveSpread', - 'waveM2Value', 'waveN2Value'] - + allVariableSet = set(allVariables) + + twoDimensionalVars = [ + "waveEnergyDensity", + "waveMeanDirection", + "waveA1Value", + "waveB1Value", + "waveA2Value", + "waveB2Value", + "waveCheckFactor", + "waveSpread", + "waveM2Value", + "waveN2Value", + ] + twoDimensionalVarsSet = set(twoDimensionalVars) + + # If parameters are provided, convert them into a set if parameters: params = set(parameters) - include_params = params.intersection(set(allVariables)) - if params != include_params: - not_found = params.difference(include_params) - print(f'WARNING: {not_found} was not found in data.\n' \ - f'Possible parameters are:\n {allVariables}') - - include_params_2D = include_params.intersection( - set(twoDimensionalVars)) - include_params = include_params.difference(include_params_2D) - - if include_params_2D: - include_2D_variables=True - include_params.add('waveFrequency') - include_2D_vars = sorted(include_params_2D) - - include_vars = sorted(include_params) - else: - include_vars = allVariables - - for var in twoDimensionalVars: - include_vars.remove(var) - - if all_2D_variables: - include_2D_variables=True - include_2D_vars = twoDimensionalVars - - - start_stamp, end_stamp =_dates_to_timestamp(nc, start_date=start_date, - end_date=end_date) - - variables_by_type={} - prefixs = ['wave', 'sst', 'gps', 'dwr', 'meta'] - remainingVariables = set(include_vars) - for prefix in prefixs: - variables_by_type[prefix] = [var for var in include_vars - if var.startswith(prefix)] - remainingVariables -= 
set(variables_by_type[prefix]) - if not variables_by_type[prefix]: - del variables_by_type[prefix] - - results={'data':{}, 'metadata':{}} + params = set() + + # If all_2D_variables is True, add all 2D variables to params + if all_2D_variables: + params.update(twoDimensionalVarsSet) + + include_params = params & allVariableSet + if params != include_params: + not_found = params - include_params + print( + f"WARNING: {not_found} was not found in data.\n" + f"Possible parameters are:\n {allVariables}" + ) + + include_params_2D = include_params & twoDimensionalVarsSet + include_params -= include_params_2D + + include_2D_variables = bool(include_params_2D) + if include_2D_variables: + include_params.add("waveFrequency") + + include_vars = include_params + + # when parameters is None and all_2D_variables is False + if not parameters and not all_2D_variables: + include_vars = allVariableSet - twoDimensionalVarsSet + + start_stamp, end_stamp = _dates_to_timestamp( + nc, start_date=start_date, end_date=end_date + ) + + prefixs = ["wave", "sst", "gps", "dwr", "meta"] + variables_by_type = { + prefix: [var for var in include_vars if var.startswith(prefix)] + for prefix in prefixs + } + variables_by_type = { + prefix: vars for prefix, vars in variables_by_type.items() if vars + } + + results = {"data": {}, "metadata": {}} for prefix in variables_by_type: - var_results={} - time_variables={} - metadata={} - - if prefix != 'meta': - prefixTime = nc.variables[f'{prefix}Time'][:] - - masked_time = np.ma.masked_outside(prefixTime, start_stamp, - end_stamp) - mask = masked_time.mask - var_time = masked_time.compressed() + time_variables = {} + metadata = {} + + if prefix != "meta": + prefixTime = nc.variables[f"{prefix}Time"][:] + + masked_time = np.ma.masked_outside(prefixTime, start_stamp, end_stamp) + mask = masked_time.mask + var_time = masked_time.compressed() N_time = masked_time.size - else: - N_time= np.nan - - for var in variables_by_type[prefix]: - variable = 
np.ma.filled(nc.variables[var]) - if variable.size == N_time: - variable = np.ma.masked_array(variable, mask).astype(float) - time_variables[var] = variable.compressed() - else: - metadata[var] = nc.variables[var][:].compressed() - - time_slice = pd.to_datetime(var_time, unit='s') - data = pd.DataFrame(time_variables, index=time_slice) - - if prefix != 'meta': - results['data'][prefix] = data - results['data'][prefix].name = buoy_name - results['metadata'][prefix] = metadata - - if (prefix == 'wave') and (include_2D_variables): - - print('Processing 2D Variables:') - vars2D={} - columns=metadata['waveFrequency'] - N_time= len(time_slice) + + for var in variables_by_type[prefix]: + variable = np.ma.filled(nc.variables[var]) + if variable.size == N_time: + variable = np.ma.masked_array(variable, mask).astype(float) + time_variables[var] = variable.compressed() + else: + metadata[var] = nc.variables[var][:].compressed() + + time_slice = pd.to_datetime(var_time, unit="s") + data = pd.DataFrame(time_variables, index=time_slice) + results["data"][prefix] = data + results["data"][prefix].name = buoy_name + + results["metadata"][prefix] = metadata + + if (prefix == "wave") and (include_2D_variables): + if not silent: + print("Processing 2D Variables:") + + vars2D = {} + columns = metadata["waveFrequency"] + N_time = len(time_slice) N_frequency = len(columns) try: l = len(mask) except: mask = np.array([False] * N_time) - - mask2D= np.tile(mask, (len(columns),1)).T - for var in include_2D_vars: + + mask2D = np.tile(mask, (len(columns), 1)).T + for var in include_params_2D: variable2D = nc.variables[var][:].data variable2D = np.ma.masked_array(variable2D, mask2D) - variable2D = variable2D.compressed().reshape(N_time, N_frequency) - variable = pd.DataFrame(variable2D,index=time_slice, - columns=columns) + variable2D = variable2D.compressed().reshape(N_time, N_frequency) + variable = pd.DataFrame(variable2D, index=time_slice, columns=columns) vars2D[var] = variable - 
results['data']['wave2D'] = vars2D - results['metadata']['name'] = buoy_name - + results["data"]["wave2D"] = vars2D + results["metadata"]["name"] = buoy_name + + if not to_pandas: + results = convert_nested_dict_and_pandas(results) + return results + + +def _process_multiyear_data(nc, years, parameters, all_2D_variables): + """ + A helper function to process multiyear data. + + Parameters + ---------- + nc : netCDF4.Dataset + netCDF file containing the data + years : list of int + A list of years to process + parameters : list of str + A list of parameters to return + all_2D_variables : bool + Whether to return all 2D variables + + Returns + ------- + data : dict + A dictionary containing the processed data + """ + + data = {} + for year in years: + start_date = datetime.datetime(year, 1, 1) + end_date = datetime.datetime(year + 1, 1, 1) + + year_data = get_netcdf_variables( + nc, + start_date=start_date, + end_date=end_date, + parameters=parameters, + all_2D_variables=all_2D_variables, + ) + data[year] = year_data + + return data diff --git a/mhkit/wave/io/hindcast/__init__.py b/mhkit/wave/io/hindcast/__init__.py index 5d6507b9e..2e6057131 100644 --- a/mhkit/wave/io/hindcast/__init__.py +++ b/mhkit/wave/io/hindcast/__init__.py @@ -1,8 +1,11 @@ from mhkit.wave.io.hindcast import wind_toolkit + try: from mhkit.wave.io.hindcast import hindcast except ImportError: - print("WARNING: Wave WPTO hindcast functions not imported from" - "MHKiT-Python. If you are using Windows and calling from" - "MHKiT-MATLAB this is expected.") + print( + "WARNING: Wave WPTO hindcast functions not imported from" + "MHKiT-Python. If you are using Windows and calling from" + "MHKiT-MATLAB this is expected." 
+ ) pass diff --git a/mhkit/wave/io/hindcast/hindcast.py b/mhkit/wave/io/hindcast/hindcast.py index 81b83548f..5922edbc7 100644 --- a/mhkit/wave/io/hindcast/hindcast.py +++ b/mhkit/wave/io/hindcast/hindcast.py @@ -24,17 +24,24 @@ - xarray - numpy - rex.MultiYearWaveX, rex.WaveX + +Author: rpauly, aidanbharath, ssolson +Date: 2023-09-26 """ + +import os import sys from time import sleep import pandas as pd import xarray as xr import numpy as np from rex import MultiYearWaveX, WaveX +from mhkit.utils.cache import handle_caching +from mhkit.utils.type_handling import convert_to_dataset def region_selection(lat_lon): - ''' + """ Returns the name of the predefined region in which the given coordinates reside. Can be used to check if the passed lat/lon pair is within the WPTO hindcast dataset. @@ -48,39 +55,31 @@ def region_selection(lat_lon): ------- region : string Name of predefined region for given coordinates - ''' + """ if not isinstance(lat_lon, (list, tuple)): - raise TypeError('lat_lon must be of type list or tuple') + raise TypeError(f"lat_lon must be of type list or tuple. Got: {type(lat_lon)}") if not all(isinstance(coord, (float, int)) for coord in lat_lon): - raise TypeError('lat_lon values must be of type float or int') + raise TypeError( + f"lat_lon values must be of type float or int. 
Got: {type(lat_lon[0])}" + ) regions = { - 'Hawaii': { - 'lat': [15.0, 27.000002], - 'lon': [-164.0, -151.0] - }, - 'West_Coast': { - 'lat': [30.0906, 48.8641], - 'lon': [-130.072, -116.899] - }, - 'Atlantic': { - 'lat': [24.382, 44.8247], - 'lon': [-81.552, -65.721] - }, + "Hawaii": {"lat": [15.0, 27.000002], "lon": [-164.0, -151.0]}, + "West_Coast": {"lat": [30.0906, 48.8641], "lon": [-130.072, -116.899]}, + "Atlantic": {"lat": [24.382, 44.8247], "lon": [-81.552, -65.721]}, } def region_search(lat_lon, region, regions): return all( regions[region][dk][0] <= d <= regions[region][dk][1] - for dk, d in {'lat': lat_lon[0], 'lon': lat_lon[1]}.items() + for dk, d in {"lat": lat_lon[0], "lon": lat_lon[1]}.items() ) - region = [region for region in regions if region_search( - lat_lon, region, regions)] + region = [region for region in regions if region_search(lat_lon, region, regions)] if not region: - raise ValueError('ERROR: coordinates out of bounds') + raise ValueError("ERROR: coordinates out of bounds.") return region[0] @@ -95,18 +94,18 @@ def request_wpto_point_data( str_decode=True, hsds=True, path=None, - as_xarray=False, + to_pandas=True, ): """ Returns data from the WPTO wave hindcast hosted on AWS at the specified latitude and longitude point(s), or the closest available point(s). - Visit https://registry.opendata.aws/wpto-pds-us-wave/ for more - information about the dataset and available locations and years. + Visit https://registry.opendata.aws/wpto-pds-us-wave/ for more + information about the dataset and available locations and years. Note: To access the WPTO hindcast data, you will need to configure - h5pyd for data access on HSDS. Please see the WPTO_hindcast_example - notebook for more information. + h5pyd for data access on HSDS. Please see the WPTO_hindcast_example + notebook for setup instructions. 
Parameters ---------- @@ -115,22 +114,22 @@ def request_wpto_point_data( Options: '3-hour' '1-hour' parameter : string or list of strings Dataset parameter to be downloaded - 3-hour dataset options: 'directionality_coefficient', + 3-hour dataset options: 'directionality_coefficient', 'energy_period', 'maximum_energy_direction' 'mean_absolute_period', 'mean_zero-crossing_period', 'omni-directional_wave_power', 'peak_period' - 'significant_wave_height', 'spectral_width', 'water_depth' - 1-hour dataset options: 'directionality_coefficient', + 'significant_wave_height', 'spectral_width', 'water_depth' + 1-hour dataset options: 'directionality_coefficient', 'energy_period', 'maximum_energy_direction' 'mean_absolute_period', 'mean_zero-crossing_period', 'omni-directional_wave_power', 'peak_period', - 'significant_wave_height', 'spectral_width', + 'significant_wave_height', 'spectral_width', 'water_depth', 'maximim_energy_direction', 'mean_wave_direction', 'frequency_bin_edges' lat_lon : tuple or list of tuples - Latitude longitude pairs at which to extract data - years : list - Year(s) to be accessed. The years 1979-2010 available. + Latitude longitude pairs at which to extract data + years : list + Year(s) to be accessed. The years 1979-2010 available. Examples: [1996] or [2004,2006,2007] tree : str | cKDTree (optional) cKDTree or path to .pkl file containing pre-computed tree @@ -144,112 +143,143 @@ def request_wpto_point_data( Default = True hsds : bool (optional) Boolean flag to use h5pyd to handle .h5 'files' hosted on AWS - behind HSDS. Setting to False will indicate to look for files on + behind HSDS. Setting to False will indicate to look for files on local machine, not AWS. Default = True path : string (optional) Optionally override with a custom .h5 filepath. Useful when setting - `hsds=False`. - as_xarray : bool (optional) - Boolean flag to return data as an xarray Dataset. Default = False + `hsds=False`. 
+ to_pandas: bool (optional) + Flag to output pandas instead of xarray. Default = True. Returns --------- - data: DataFrame - Data indexed by datetime with columns named for parameter - and cooresponding metadata index - meta: DataFrame - Location metadata for the requested data location + data: pandas DataFrame or xarray Dataset + Data indexed by datetime with columns named for parameter + and cooresponding metadata index + meta: DataFrame + Location metadata for the requested data location """ - assert isinstance(parameter, (str, list) - ), 'parameter must be of type string or list' - assert isinstance(lat_lon, (list, tuple) - ), 'lat_lon must be of type list or tuple' - assert isinstance(data_type, str), 'data_type must be a string' - assert isinstance(years, list), 'years must be a list' - assert isinstance(tree, (str, type(None))), 'tree must be a string' - assert isinstance(unscale, bool), 'unscale must be bool type' - assert isinstance(str_decode, bool), 'str_decode must be bool type' - assert isinstance(hsds, bool), 'hsds must be bool type' - assert isinstance(path, (str, type(None))), 'path must be a string' - assert isinstance(as_xarray, bool), 'as_xarray must be bool type' - - if 'directional_wave_spectrum' in parameter: - sys.exit('This function does not support directional_wave_spectrum output') - - # Check for multiple region selection - if isinstance(lat_lon[0], float): - region = region_selection(lat_lon) + if not isinstance(parameter, (str, list)): + raise TypeError( + f"parameter must be of type string or list. Got: {type(parameter)}" + ) + if not isinstance(lat_lon, (list, tuple)): + raise TypeError(f"lat_lon must be of type list or tuple. Got: {type(lat_lon)}") + if not isinstance(data_type, str): + raise TypeError(f"data_type must be a string. Got: {type(data_type)}") + if not isinstance(years, list): + raise TypeError(f"years must be a list. 
Got: {type(years)}") + if not isinstance(tree, (str, type(None))): + raise TypeError(f"If specified, tree must be a string. Got: {type(tree)}") + if not isinstance(unscale, bool): + raise TypeError( + f"If specified, unscale must be bool type. Got: {type(unscale)}" + ) + if not isinstance(str_decode, bool): + raise TypeError( + f"If specified, str_decode must be bool type. Got: {type(str_decode)}" + ) + if not isinstance(hsds, bool): + raise TypeError(f"If specified, hsds must be bool type. Got: {type(hsds)}") + if not isinstance(path, (str, type(None))): + raise TypeError(f"If specified, path must be a string. Got: {type(path)}") + if not isinstance(to_pandas, bool): + raise TypeError( + f"If specified, to_pandas must be bool type. Got: {type(to_pandas)}" + ) + + # Attempt to load data from cache + # Construct a string representation of the function parameters + hash_params = f"{data_type}_{parameter}_{lat_lon}_{years}_{tree}_{unscale}_{str_decode}_{hsds}_{path}_{to_pandas}" + cache_dir = _get_cache_dir() + data, meta, _ = handle_caching(hash_params, cache_dir) + + if data is not None: + return data, meta else: - region_list = [] - for loc in lat_lon: - region_list.append(region_selection(loc)) - if region_list.count(region_list[0]) == len(lat_lon): - region = region_list[0] + if "directional_wave_spectrum" in parameter: + sys.exit("This function does not support directional_wave_spectrum output") + + # Check for multiple region selection + if isinstance(lat_lon[0], float): + region = region_selection(lat_lon) else: - sys.exit('Coordinates must be within the same region!') - - if path: - wave_path = path - elif data_type == '3-hour': - wave_path = f'/nrel/US_wave/{region}/{region}_wave_*.h5' - elif data_type == '1-hour': - wave_path = f'/nrel/US_wave/virtual_buoy/{region}/{region}_virtual_buoy_*.h5' - else: - print('ERROR: invalid data_type') + region_list = [] + for loc in lat_lon: + region_list.append(region_selection(loc)) + if region_list.count(region_list[0]) 
== len(lat_lon): + region = region_list[0] + else: + sys.exit("Coordinates must be within the same region!") + + if path: + wave_path = path + elif data_type == "3-hour": + wave_path = f"/nrel/US_wave/{region}/{region}_wave_*.h5" + elif data_type == "1-hour": + wave_path = ( + f"/nrel/US_wave/virtual_buoy/{region}/{region}_virtual_buoy_*.h5" + ) + else: + print("ERROR: invalid data_type") + + wave_kwargs = { + "tree": tree, + "unscale": unscale, + "str_decode": str_decode, + "hsds": hsds, + "years": years, + } + data_list = [] + + with MultiYearWaveX(wave_path, **wave_kwargs) as rex_waves: + if isinstance(parameter, list): + for param in parameter: + temp_data = rex_waves.get_lat_lon_df(param, lat_lon) + gid = rex_waves.lat_lon_gid(lat_lon) + cols = temp_data.columns[:] + for i, col in zip(range(len(cols)), cols): + temp = f"{param}_{gid}" + temp_data = temp_data.rename(columns={col: temp}) - wave_kwargs = { - 'tree': tree, - 'unscale': unscale, - 'str_decode': str_decode, - 'hsds': hsds, - 'years': years - } - data_list = [] - - with MultiYearWaveX(wave_path, **wave_kwargs) as rex_waves: - if isinstance(parameter, list): - for param in parameter: - temp_data = rex_waves.get_lat_lon_df(param, lat_lon) - gid = rex_waves.lat_lon_gid(lat_lon) - cols = temp_data.columns[:] - for i, col in zip(range(len(cols)), cols): - temp = f'{param}_{gid}' - temp_data = temp_data.rename(columns={col: temp}) + data_list.append(temp_data) + data = pd.concat(data_list, axis=1) - data_list.append(temp_data) - data = pd.concat(data_list, axis=1) + else: + data = rex_waves.get_lat_lon_df(parameter, lat_lon) + cols = data.columns[:] - else: - data = rex_waves.get_lat_lon_df(parameter, lat_lon) - cols = data.columns[:] + for i, col in zip(range(len(cols)), cols): + temp = f"{parameter}_{i}" + data = data.rename(columns={col: temp}) - for i, col in zip(range(len(cols)), cols): - temp = f'{parameter}_{i}' - data = data.rename(columns={col: temp}) + meta = rex_waves.meta.loc[cols, :] + meta = 
meta.reset_index(drop=True) + gid = rex_waves.lat_lon_gid(lat_lon) + meta["gid"] = gid - meta = rex_waves.meta.loc[cols, :] - meta = meta.reset_index(drop=True) - gid = rex_waves.lat_lon_gid(lat_lon) - meta['gid'] = gid + if not to_pandas: + data = convert_to_dataset(data) + data["time_index"] = pd.to_datetime(data.time_index) - if as_xarray: - data = data.to_xarray() - data['time_index'] = pd.to_datetime(data.time_index) + if isinstance(parameter, list): + param_coords = [f"{param}_{gid}" for param in parameter] + data.coords["parameter"] = xr.DataArray( + param_coords, dims="parameter" + ) - if isinstance(parameter, list): - param_coords = [f'{param}_{gid}' for param in parameter] - data.coords['parameter'] = xr.DataArray( - param_coords, dims='parameter') + data.coords["year"] = xr.DataArray(years, dims="year") - data.coords['year'] = xr.DataArray(years, dims='year') + meta_ds = meta.to_xarray() + data = xr.merge([data, meta_ds]) - meta_ds = meta.to_xarray() - data = xr.merge([data, meta_ds]) + # Remove the 'index' coordinate + data = data.drop_vars("index") - # Remove the 'index' coordinate - data = data.drop_vars('index') + # save_to_cache(hash_params, data, meta) + handle_caching(hash_params, cache_dir, data, meta) - return data, meta + return data, meta def request_wpto_directional_spectrum( @@ -267,13 +297,13 @@ def request_wpto_directional_spectrum( or the closest available point(s). The data is returned as an xarray Dataset with keys indexed by a graphical identifier (gid). `gid`s are integers which represent a lat, long on which data is - stored. Requesting an array of `lat_lons` will return a dataset - with multiple `gids` representing the data closest to each requested + stored. Requesting an array of `lat_lons` will return a dataset + with multiple `gids` representing the data closest to each requested `lat`, `lon`. Visit https://registry.opendata.aws/wpto-pds-us-wave/ for more information about the dataset and available - locations and years. 
+ locations and years. Note: To access the WPTO hindcast data, you will need to configure h5pyd for data access on HSDS. @@ -302,23 +332,34 @@ def request_wpto_directional_spectrum( local machine, not AWS. Default = True path : string (optional) Optionally override with a custom .h5 filepath. Useful when setting - `hsds=False` + `hsds=False` Returns --------- - data: xarray + data: xarray Dataset Coordinates as datetime, frequency, and direction for data at specified location(s) meta: DataFrame Location metadata for the requested data location """ - assert isinstance(lat_lon, (list, tuple) - ), 'lat_lon must be of type list or tuple' - assert isinstance(year, str), 'years must be a string' - assert isinstance(tree, (str, type(None))), 'tree must be a sring' - assert isinstance(unscale, bool), 'unscale must be bool type' - assert isinstance(str_decode, bool), 'str_decode must be bool type' - assert isinstance(hsds, bool), 'hsds must be bool type' + if not isinstance(lat_lon, (list, tuple)): + raise TypeError(f"lat_lon must be of type list or tuple. Got: {type(lat_lon)}") + if not isinstance(year, str): + raise TypeError(f"year must be a string. Got: {type(year)}") + if not isinstance(tree, (str, type(None))): + raise TypeError(f"If specified, tree must be a string. Got: {type(tree)}") + if not isinstance(unscale, bool): + raise TypeError( + f"If specified, unscale must be bool type. Got: {type(unscale)}" + ) + if not isinstance(str_decode, bool): + raise TypeError( + f"If specified, str_decode must be bool type. Got: {type(str_decode)}" + ) + if not isinstance(hsds, bool): + raise TypeError(f"If specified, hsds must be bool type. Got: {type(hsds)}") + if not isinstance(path, (str, type(None))): + raise TypeError(f"If specified, path must be a string. 
Got: {type(path)}") # check for multiple region selection if isinstance(lat_lon[0], float): @@ -328,17 +369,25 @@ def request_wpto_directional_spectrum( if reglist.count(reglist[0]) == len(lat_lon): region = reglist[0] else: - sys.exit('Coordinates must be within the same region!') + sys.exit("Coordinates must be within the same region!") + + # Attempt to load data from cache + hash_params = f"{lat_lon}_{year}_{tree}_{unscale}_{str_decode}_{hsds}_{path}" + cache_dir = _get_cache_dir() + data, meta, _ = handle_caching(hash_params, cache_dir) + + if data is not None: + return data, meta wave_path = path or ( - f'/nrel/US_wave/virtual_buoy/{region}/{region}_virtual_buoy_{year}.h5' + f"/nrel/US_wave/virtual_buoy/{region}/{region}_virtual_buoy_{year}.h5" ) - parameter = 'directional_wave_spectrum' + parameter = "directional_wave_spectrum" wave_kwargs = { - 'tree': tree, - 'unscale': unscale, - 'str_decode': str_decode, - 'hsds': hsds + "tree": tree, + "unscale": unscale, + "str_decode": str_decode, + "hsds": hsds, } with WaveX(wave_path, **wave_kwargs) as rex_waves: @@ -348,33 +397,32 @@ def request_wpto_directional_spectrum( # Setup index and columns columns = [gid] if isinstance(gid, (int, np.integer)) else gid time_index = rex_waves.time_index - frequency = rex_waves['frequency'] - direction = rex_waves['direction'] + frequency = rex_waves["frequency"] + direction = rex_waves["direction"] index = pd.MultiIndex.from_product( [time_index, frequency, direction], - names=['time_index', 'frequency', 'direction'] + names=["time_index", "frequency", "direction"], ) # Create bins for multiple smaller API dataset requests N = 6 length = len(rex_waves) quotient, remainder = divmod(length, N) - bins = [i*quotient for i in range(N+1)] + bins = [i * quotient for i in range(N + 1)] bins[-1] += remainder - index_bins = (np.array(bins)*len(frequency)*len(direction)).tolist() + index_bins = (np.array(bins) * len(frequency) * len(direction)).tolist() # Request multiple datasets and 
add to dictionary datas = {} - for i in range(len(bins)-1): - idx = index[index_bins[i]:index_bins[i+1]] + for i in range(len(bins) - 1): + idx = index[index_bins[i] : index_bins[i + 1]] # Request with exponential back off wait time sleep_time = 2 num_retries = 4 for _ in range(num_retries): try: - data_array = rex_waves[parameter, - bins[i]:bins[i+1], :, :, gid] + data_array = rex_waves[parameter, bins[i] : bins[i + 1], :, :, gid] str_error = None except Exception as err: str_error = str(err) @@ -388,51 +436,57 @@ def request_wpto_directional_spectrum( ax1 = np.product(data_array.shape[:3]) ax2 = data_array.shape[-1] if len(data_array.shape) == 4 else 1 datas[i] = pd.DataFrame( - data_array.reshape(ax1, ax2), - columns=columns, - index=idx + data_array.reshape(ax1, ax2), columns=columns, index=idx ) data_raw = pd.concat(datas.values()) data = data_raw.to_xarray() - data['time_index'] = pd.to_datetime(data.time_index) + data["time_index"] = pd.to_datetime(data.time_index) # Get metadata meta = rex_waves.meta.loc[columns, :] meta = meta.reset_index(drop=True) - meta['gid'] = gid + meta["gid"] = gid # Convert gid to integer or list of integers - # gid_list = [int(g) for g in gid] if isinstance(gid, list) else [int(gid)] - # gid_list = [int(g) for g in gid] if isinstance(gid, list) else [int(gid)] - gid_list = [int(g) for g in gid] if isinstance( - gid, (list, np.ndarray)) else [int(gid)] + gid_list = ( + [int(g) for g in gid] if isinstance(gid, (list, np.ndarray)) else [int(gid)] + ) - data_var_concat = xr.concat([data[g] for g in gid_list], dim='gid') + data_var_concat = xr.concat([data[g] for g in gid_list], dim="gid") # Create a new DataArray with the correct dimensions and coordinates spectral_density = xr.DataArray( - data_var_concat.data.reshape(-1, len(frequency), - len(direction), len(gid_list)), - dims=['time_index', 'frequency', 'direction', 'gid'], + data_var_concat.data.reshape( + -1, len(frequency), len(direction), len(gid_list) + ), + 
dims=["time_index", "frequency", "direction", "gid"], coords={ - 'time_index': data['time_index'], - 'frequency': data['frequency'], - 'direction': data['direction'], - 'gid': gid_list - } + "time_index": data["time_index"], + "frequency": data["frequency"], + "direction": data["direction"], + "gid": gid_list, + }, ) # Create the new dataset data = xr.Dataset( - { - 'spectral_density': spectral_density - }, + {"spectral_density": spectral_density}, coords={ - 'time_index': data['time_index'], - 'frequency': data['frequency'], - 'direction': data['direction'], - 'gid': gid_list - } + "time_index": data["time_index"], + "frequency": data["frequency"], + "direction": data["direction"], + "gid": gid_list, + }, ) + + handle_caching(hash_params, cache_dir, data, meta) + return data, meta + + +def _get_cache_dir(): + """ + Returns the path to the cache directory. + """ + return os.path.join(os.path.expanduser("~"), ".cache", "mhkit", "hindcast") diff --git a/mhkit/wave/io/hindcast/wind_toolkit.py b/mhkit/wave/io/hindcast/wind_toolkit.py index 3adb083c5..f945089b3 100644 --- a/mhkit/wave/io/hindcast/wind_toolkit.py +++ b/mhkit/wave/io/hindcast/wind_toolkit.py @@ -1,63 +1,219 @@ +""" +Wind Toolkit Data Utility Functions +=================================== + +This module contains a collection of utility functions designed to facilitate +the extraction, caching, and visualization of wind data from the WIND Toolkit +hindcast dataset hosted on AWS. This dataset includes offshore wind hindcast data +with various parameters like wind speed, direction, temperature, and pressure. + +Key Functions: +-------------- +- `region_selection`: Determines which predefined wind region a given latitude + and longitude fall within. + +- `get_region_data`: Retrieves latitude and longitude data points for a specified + wind region. Uses caching to speed up repeated requests. 
+ +- `plot_region`: Plots the geographical extent of a specified wind region and + can overlay a given latitude-longitude point. + +- `elevation_to_string`: Converts a parameter (e.g., 'windspeed') and elevation + values (e.g., [20, 40, 120]) to the formatted strings used in the WIND Toolkit. + +- `request_wtk_point_data`: Fetches specified wind data parameters for given + latitude-longitude points and years from the WIND Toolkit hindcast dataset. + Supports caching for faster repeated data retrieval. + +Dependencies: +------------- +- rex: Library to handle renewable energy datasets. +- pandas: Data manipulation and analysis. +- os, hashlib, pickle: Used for caching functionality. +- matplotlib: Used for plotting. + +Notes: +------ +- To access the WIND Toolkit hindcast data, users need to configure `h5pyd` + for data access on HSDS (see the metocean_example or WPTO_hindcast_example + notebook for more details). + +- While some functions perform basic checks (e.g., verifying that latitude + and longitude are within a predefined region), it's essential to understand + the boundaries of each region and the available parameters and elevations in the dataset. + +Author: +------- +akeeste +ssolson + +Date: +----- +2023-09-26 + +""" + +import os +import hashlib +import pickle import pandas as pd + from rex import MultiYearWindX import matplotlib.pyplot as plt +from mhkit.utils.cache import handle_caching +from mhkit.utils.type_handling import convert_to_dataset -def region_selection(lat_lon, preferred_region=''): - ''' +def region_selection(lat_lon, preferred_region=""): + """ Returns the name of the predefined region in which the given coordinates reside. - Can be used to check if the passed lat/lon pair is within the WIND Toolkit hindcast dataset. + Can be used to check if the passed lat/lon pair is within the WIND Toolkit hindcast dataset. 
Parameters ---------- lat_lon : tuple Latitude and longitude coordinates as floats or integers - + preferred_region : string (optional) Latitude and longitude coordinates as floats or integers - + Returns ------- region : string Name of predefined region for given coordinates - ''' - assert isinstance(lat_lon, tuple), 'lat_lon must be of type list or tuple' - assert len(lat_lon)==2, 'lat_lon must be of length 2' - assert isinstance(lat_lon[0], (float,int)), 'lat_lon values must be of type float or int' - assert isinstance(lat_lon[1], (float,int)), 'lat_lon values must be of type float or int' - assert isinstance(preferred_region, str), 'preferred_region must be of type string' - - # Note that this check is fast, but not robust because region are not + """ + if not isinstance(lat_lon, tuple): + raise TypeError(f"lat_lon must be of type tuple, got {type(lat_lon).__name__}") + + if len(lat_lon) != 2: + raise ValueError(f"lat_lon must be of length 2, got length {len(lat_lon)}") + + if not isinstance(lat_lon[0], (float, int)): + raise TypeError( + f"lat_lon values must be floats or ints, got {type(lat_lon[0]).__name__}" + ) + + if not isinstance(lat_lon[1], (float, int)): + raise TypeError( + f"lat_lon values must be floats or ints, got {type(lat_lon[1]).__name__}" + ) + + if not isinstance(preferred_region, str): + raise TypeError( + f"preferred_region must be a string, got {type(preferred_region).__name__}" + ) + + # Note that this check is fast, but not robust because region are not # rectangular on a lat-lon grid rDict = { - 'CA_NWP_overlap':{'lat':[41.213, 42.642], 'lon':[-129.090, -121.672]}, - 'Offshore_CA':{ 'lat':[31.932, 42.642], 'lon':[-129.090, -115.806]}, - 'Hawaii':{ 'lat':[15.565, 26.221], 'lon':[-164.451, -151.278]}, - 'NW_Pacific':{ 'lat':[41.213, 49.579], 'lon':[-130.831, -121.672]}, - 'Mid_Atlantic':{ 'lat':[37.273, 42.211], 'lon':[-76.427, -64.800]}, + "CA_NWP_overlap": {"lat": [41.213, 42.642], "lon": [-129.090, -121.672]}, + "Offshore_CA": {"lat": 
[31.932, 42.642], "lon": [-129.090, -115.806]}, + "Hawaii": {"lat": [15.565, 26.221], "lon": [-164.451, -151.278]}, + "NW_Pacific": {"lat": [41.213, 49.579], "lon": [-130.831, -121.672]}, + "Mid_Atlantic": {"lat": [37.273, 42.211], "lon": [-76.427, -64.800]}, } - region_search = lambda x: all( ( True if rDict[x][dk][0] <= d <= rDict[x][dk][1] else False - for dk, d in {'lat':lat_lon[0],'lon':lat_lon[1]}.items() ) ) + def region_search(x): + return all( + ( + True if rDict[x][dk][0] <= d <= rDict[x][dk][1] else False + for dk, d in {"lat": lat_lon[0], "lon": lat_lon[1]}.items() + ) + ) + region = [key for key in rDict if region_search(key)] - - if region[0] == 'CA_NWP_overlap': - if preferred_region == 'Offshore_CA': - region[0] = 'Offshore_CA' - elif preferred_region == 'NW_Pacific': - region[0] = 'NW_Pacific' + + if region[0] == "CA_NWP_overlap": + if preferred_region == "Offshore_CA": + region[0] = "Offshore_CA" + elif preferred_region == "NW_Pacific": + region[0] = "NW_Pacific" else: - raise TypeError(f"Preferred_region ({preferred_region}) must be 'Offshore_CA' or 'NW_Pacific' when lat_lon {lat_lon} falls in the overlap region") - - if len(region)==0: - raise TypeError(f'Coordinates {lat_lon} out of bounds. Must be within {rDict}') + raise TypeError( + f"Preferred_region ({preferred_region}) must be 'Offshore_CA' or 'NW_Pacific' when lat_lon {lat_lon} falls in the overlap region" + ) + + if len(region) == 0: + raise TypeError(f"Coordinates {lat_lon} out of bounds. Must be within {rDict}") else: return region[0] -def plot_region(region,lat_lon=None,ax=None): - ''' - Visualizes the area that a given region covers. Can help users understand +def get_region_data(region): + """ + Retrieves the latitude and longitude data points for the specified region + from the cache if available; otherwise, fetches the data and caches it for + subsequent calls. 
+ + The function forms a unique identifier from the `region` parameter and checks + whether the corresponding data is available in the cache. If the data is found, + it's loaded and returned. If not, the data is fetched, cached, and then returned. + + Parameters + ---------- + region : str + Name of the predefined region in the WIND Toolkit for which to + retrieve latitude and longitude data points. It is case-sensitive. + Examples: 'Offshore_CA','Hawaii','Mid_Atlantic','NW_Pacific' + + Returns + ------- + lats : numpy.ndarray + A 1D array containing the latitude coordinates of data points + in the specified region. + + lons : numpy.ndarray + A 1D array containing the longitude coordinates of data points + in the specified region. + + Example + ------- + >>> lats, lons = get_region_data('Offshore_CA') + """ + if not isinstance(region, str): + raise TypeError("region must be of type string") + # Define the path to the cache directory + cache_dir = os.path.join(os.path.expanduser("~"), ".cache", "mhkit", "hindcast") + + # Create a unique identifier for this function call + hash_id = hashlib.md5(region.encode()).hexdigest() + + # Create cache directory if it doesn't exist + os.makedirs(cache_dir, exist_ok=True) + + # Create a path to the cache file for this function call + cache_file = os.path.join(cache_dir, f"{hash_id}.pkl") + + if os.path.isfile(cache_file): + # If the cache file exists, load the data from the cache + with open(cache_file, "rb") as f: + lats, lons = pickle.load(f) + return lats, lons + else: + wind_path = "/nrel/wtk/" + region.lower() + "/" + region + "_*.h5" + windKwargs = { + "tree": None, + "unscale": True, + "str_decode": True, + "hsds": True, + "years": [2019], + } + + # Get the latitude and longitude list from the region in rex + rex_wind = MultiYearWindX(wind_path, **windKwargs) + lats = rex_wind.lat_lon[:, 0] + lons = rex_wind.lat_lon[:, 1] + + # Save data to cache + with open(cache_file, "wb") as f: + pickle.dump((lats, lons), f) + + 
return lats, lons + + +def plot_region(region, lat_lon=None, ax=None): + """ + Visualizes the area that a given region covers. Can help users understand the extent of a region since they are not all rectangular. Parameters @@ -66,48 +222,47 @@ def plot_region(region,lat_lon=None,ax=None): Name of predefined region in the WIND Toolkit Options: 'Offshore_CA','Hawaii','Mid_Atlantic','NW_Pacific' lat_lon : couple (optional) - Latitude and longitude pair to plot on top of the chosen region. Useful + Latitude and longitude pair to plot on top of the chosen region. Useful to inform accurate latitude-longitude selection for data analysis. ax : matplotlib axes object (optional) Axes for plotting. If None, then a new figure is created. - + Returns --------- - ax : matplotlib pyplot axes - ''' - assert isinstance(region, str), 'region must be of type string' - assert region in ['Offshore_CA','Hawaii','Mid_Atlantic','NW_Pacific'], f'{region} not in list of supported regions' - - wind_path = '/nrel/wtk/'+region.lower()+'/'+region+'_*.h5' - windKwargs = {'tree':None, 'unscale':True, 'str_decode':True, 'hsds':True, - 'years':[2019]} - - # Get the latitude and longitude list from the region in rex - rex_wind = MultiYearWindX(wind_path, **windKwargs) - lats = rex_wind.lat_lon[:,0] - lons = rex_wind.lat_lon[:,1] - + ax : matplotlib pyplot axes + """ + if not isinstance(region, str): + raise TypeError("region must be of type string") + + supported_regions = ["Offshore_CA", "Hawaii", "Mid_Atlantic", "NW_Pacific"] + if region not in supported_regions: + raise ValueError( + f'{region} not in list of supported regions: {", ".join(supported_regions)}' + ) + + lats, lons = get_region_data(region) + # Plot the latitude longitude pairs if ax is None: fig, ax = plt.subplots() - ax.plot(lons,lats,'o',label=f'{region} region') + ax.plot(lons, lats, "o", label=f"{region} region") if lat_lon is not None: - ax.plot(lat_lon[1],lat_lon[0],'o',label='Specified lat-lon point') - 
ax.set_xlabel('Longitude (deg)') - ax.set_ylabel('Latitude (deg)') + ax.plot(lat_lon[1], lat_lon[0], "o", label="Specified lat-lon point") + ax.set_xlabel("Longitude (deg)") + ax.set_ylabel("Latitude (deg)") ax.grid() - ax.set_title(f'Extent of the WIND Toolkit {region} region') + ax.set_title(f"Extent of the WIND Toolkit {region} region") ax.legend() - + return ax def elevation_to_string(parameter, elevations): - """ - Takes in a parameter (e.g. 'windspeed') and elevations (e.g. [20, 40, 120]) + """ + Takes in a parameter (e.g. 'windspeed') and elevations (e.g. [20, 40, 120]) and returns the formatted strings that are input to WIND Toolkit (e.g. windspeed_10m). Does not check parameter against the elevation levels. This is done in request_wtk_point_data. - + Parameters ---------- parameter: string @@ -116,40 +271,57 @@ def elevation_to_string(parameter, elevations): elevations : list List of elevations (float). Values can range from approxiamtely 20 to 200 in increments of 20, depending - on the parameter in question. See Documentation for request_wtk_point_data + on the parameter in question. See Documentation for request_wtk_point_data for the full list of available parameters. 
Returns --------- parameter_list: list Formatted List of WIND Toolkit parameter strings - + """ - - assert isinstance(parameter,str) - assert isinstance(elevations,(float,list)) - assert parameter in ['windspeed','winddirection','temperature','pressure'] - + + if not isinstance(parameter, str): + raise TypeError(f"parameter must be a string, got {type(parameter)}") + + if not isinstance(elevations, (float, list)): + raise TypeError(f"elevations must be a float or list, got {type(elevations)}") + + if parameter not in ["windspeed", "winddirection", "temperature", "pressure"]: + raise ValueError(f"Invalid parameter: {parameter}") + parameter_list = [] for e in elevations: - parameter_list.append(parameter+'_'+str(e)+'m') - + parameter_list.append(parameter + "_" + str(e) + "m") + return parameter_list -def request_wtk_point_data(time_interval, parameter, lat_lon, years, preferred_region='', - tree=None, unscale=True, str_decode=True,hsds=True): - """ - Returns data from the WIND Toolkit offshore wind hindcast hosted on AWS at the specified latitude and longitude point(s), - or the closest available point(s). - Visit https://registry.opendata.aws/nrel-pds-wtk/ for more information about the dataset and available - locations and years. - - Calls with multiple parameters must have the same time interval. Calls - with multiple locations must use the same region (use the plot_region function). - - Note: To access the WIND Toolkit hindcast data, you will need to configure h5pyd for data access on HSDS. - Please see the WTK_hindcast_example notebook for more information. 
+def request_wtk_point_data( + time_interval, + parameter, + lat_lon, + years, + preferred_region="", + tree=None, + unscale=True, + str_decode=True, + hsds=True, + clear_cache=False, + to_pandas=True, +): + """ + Returns data from the WIND Toolkit offshore wind hindcast hosted on + AWS at the specified latitude and longitude point(s), or the closest + available point(s).Visit https://registry.opendata.aws/nrel-pds-wtk/ + for more information about the dataset and available locations and years. + + Calls with multiple parameters must have the same time interval. Calls + with multiple locations must use the same region (use the plot_region function). + + Note: To access the WIND Toolkit hindcast data, you will need to + configure h5pyd for data access on HSDS. Please see the + metocean_example or WPTO_hindcast_example notebook for more information. Parameters ---------- @@ -159,33 +331,33 @@ def request_wtk_point_data(time_interval, parameter, lat_lon, years, preferred_r parameter : string or list of strings Dataset parameter to be downloaded. Other parameters may be available. This list is limited to those available at both 5-minute and 1-hour - time intervals for all regions. 
- Options: - 'precipitationrate_0m', 'inversemoninobukhovlength_2m', - 'relativehumidity_2m', 'surface_sea_temperature', - 'pressure_0m', 'pressure_100m', 'pressure_200m', - 'temperature_10m', 'temperature_20m', 'temperature_40m', - 'temperature_60m', 'temperature_80m', 'temperature_100m', - 'temperature_120m', 'temperature_140m', 'temperature_160m', - 'temperature_180m', 'temperature_200m', - 'winddirection_10m', 'winddirection_20m', 'winddirection_40m', - 'winddirection_60m', 'winddirection_80m', 'winddirection_100m', - 'winddirection_120m', 'winddirection_140m', 'winddirection_160m', - 'winddirection_180m', 'winddirection_200m', - 'windspeed_10m', 'windspeed_20m', 'windspeed_40m', - 'windspeed_60m', 'windspeed_80m', 'windspeed_100m', - 'windspeed_120m', 'windspeed_140m', 'windspeed_160m', + time intervals for all regions. + Options: + 'precipitationrate_0m', 'inversemoninobukhovlength_2m', + 'relativehumidity_2m', 'surface_sea_temperature', + 'pressure_0m', 'pressure_100m', 'pressure_200m', + 'temperature_10m', 'temperature_20m', 'temperature_40m', + 'temperature_60m', 'temperature_80m', 'temperature_100m', + 'temperature_120m', 'temperature_140m', 'temperature_160m', + 'temperature_180m', 'temperature_200m', + 'winddirection_10m', 'winddirection_20m', 'winddirection_40m', + 'winddirection_60m', 'winddirection_80m', 'winddirection_100m', + 'winddirection_120m', 'winddirection_140m', 'winddirection_160m', + 'winddirection_180m', 'winddirection_200m', + 'windspeed_10m', 'windspeed_20m', 'windspeed_40m', + 'windspeed_60m', 'windspeed_80m', 'windspeed_100m', + 'windspeed_120m', 'windspeed_140m', 'windspeed_160m', 'windspeed_180m', 'windspeed_200m' lat_lon : tuple or list of tuples - Latitude longitude pairs at which to extract data. Use plot_region() or + Latitude longitude pairs at which to extract data. Use plot_region() or region_selection() to see the corresponding region for a given location. - years : list - Year(s) to be accessed. 
The years 2000-2019 available (up to 2020 + years : list + Year(s) to be accessed. The years 2000-2019 available (up to 2020 for Mid-Atlantic). Examples: [2015] or [2004,2006,2007] preferred_region : string (optional) Region that the lat_lon belongs to ('Offshore_CA' or 'NW_Pacific'). Required when a lat_lon point falls in both the Offshore California - and NW Pacific regions. Overlap region defined by + and NW Pacific regions. Overlap region defined by latitude = (41.213, 42.642) and longitude = (-129.090, -121.672). Default = '' tree : str | cKDTree (optional) @@ -200,69 +372,116 @@ def request_wtk_point_data(time_interval, parameter, lat_lon, years, preferred_r Default = True hsds : bool (optional) Boolean flag to use h5pyd to handle .h5 'files' hosted on AWS - behind HSDS. Setting to False will indicate to look for files on + behind HSDS. Setting to False will indicate to look for files on local machine, not AWS. Default = True + clear_cache : bool (optional) + Boolean flag to clear the cache related to this specific request. + Default is False. + to_pandas: bool (optional) + Flag to output pandas instead of xarray. Default = True. 
Returns --------- - data: DataFrame - Data indexed by datetime with columns named for parameter and cooresponding metadata index - meta: DataFrame - Location metadata for the requested data location + data: DataFrame + Data indexed by datetime with columns named for parameter and + cooresponding metadata index + meta: DataFrame + Location metadata for the requested data location """ - - assert isinstance(parameter, (str, list)), 'parameter must be of type string or list' - assert isinstance(lat_lon, (list,tuple)), 'lat_lon must be of type list or tuple' - assert isinstance(time_interval, str), 'time_interval must be a string' - assert isinstance(years,list), 'years must be a list' - assert isinstance(preferred_region, str), 'preferred_region must be a string' - assert isinstance(tree,(str,type(None))), 'tree must be a string' - assert isinstance(unscale,bool), 'unscale must be bool type' - assert isinstance(str_decode,bool), 'str_decode must be bool type' - assert isinstance(hsds,bool), 'hsds must be bool type' - - # check for multiple region selection - if isinstance(lat_lon[0], float): - region = region_selection(lat_lon, preferred_region) + + if not isinstance(parameter, (str, list)): + raise TypeError("parameter must be of type string or list") + if not isinstance(lat_lon, (list, tuple)): + raise TypeError("lat_lon must be of type list or tuple") + if not isinstance(time_interval, str): + raise TypeError("time_interval must be a string") + if not isinstance(years, list): + raise TypeError("years must be a list") + if not isinstance(preferred_region, str): + raise TypeError("preferred_region must be a string") + if not isinstance(tree, (str, type(None))): + raise TypeError("tree must be a string or None") + if not isinstance(unscale, bool): + raise TypeError("unscale must be bool type") + if not isinstance(str_decode, bool): + raise TypeError("str_decode must be bool type") + if not isinstance(hsds, bool): + raise TypeError("hsds must be bool type") + if not 
isinstance(clear_cache, bool): + raise TypeError("clear_cache must be of type bool") + + # Define the path to the cache directory + cache_dir = os.path.join(os.path.expanduser("~"), ".cache", "mhkit", "hindcast") + + # Construct a string representation of the function parameters + hash_params = f"{time_interval}_{parameter}_{lat_lon}_{years}_{preferred_region}_{tree}_{unscale}_{str_decode}_{hsds}" + + # Use handle_caching to manage caching. + data, meta, _ = handle_caching(hash_params, cache_dir, clear_cache_file=clear_cache) + + if data is not None and meta is not None: + if not to_pandas: + data = convert_to_dataset(data) + data.attrs = meta + + return data, meta # Return cached data and meta if available else: - reglist = [] - for loc in lat_lon: - reglist.append(region_selection(loc)) - if reglist.count(reglist[0]) == len(lat_lon): - region = reglist[0] + # check for multiple region selection + if isinstance(lat_lon[0], float): + region = region_selection(lat_lon, preferred_region) else: - raise TypeError('Coordinates must be within the same region!') - - if time_interval == '1-hour': - wind_path = f'/nrel/wtk/'+region.lower()+'/'+region+'_*.h5' - elif time_interval == '5-minute': - wind_path = f'/nrel/wtk/'+region.lower()+'-5min/'+region+'_*.h5' - else: - raise TypeError(f"Invalid time_interval '{time_interval}', must be '1-hour' or '5-minute'") - windKwargs = {'tree':tree,'unscale':unscale,'str_decode':str_decode, 'hsds':hsds, - 'years':years} - data_list = [] - - with MultiYearWindX(wind_path, **windKwargs) as rex_wind: - if isinstance(parameter, list): - for p in parameter: - temp_data = rex_wind.get_lat_lon_df(p,lat_lon) - col = temp_data.columns[:] - for i,c in zip(range(len(col)),col): - temp = f'{p}_{i}' - temp_data = temp_data.rename(columns={c:temp}) - - data_list.append(temp_data) - data= pd.concat(data_list, axis=1) - + reglist = [] + for loc in lat_lon: + reglist.append(region_selection(loc)) + if reglist.count(reglist[0]) == len(lat_lon): + region 
= reglist[0] + else: + raise TypeError("Coordinates must be within the same region!") + + if time_interval == "1-hour": + wind_path = f"/nrel/wtk/{region.lower()}/{region}_*.h5" + elif time_interval == "5-minute": + wind_path = f"/nrel/wtk/{region.lower()}-5min/{region}_*.h5" else: - data = rex_wind.get_lat_lon_df(parameter,lat_lon) - col = data.columns[:] + raise TypeError( + f"Invalid time_interval '{time_interval}', must be '1-hour' or '5-minute'" + ) + windKwargs = { + "tree": tree, + "unscale": unscale, + "str_decode": str_decode, + "hsds": hsds, + "years": years, + } + data_list = [] + with MultiYearWindX(wind_path, **windKwargs) as rex_wind: + if isinstance(parameter, list): + for p in parameter: + temp_data = rex_wind.get_lat_lon_df(p, lat_lon) + col = temp_data.columns[:] + for i, c in zip(range(len(col)), col): + temp = f"{p}_{i}" + temp_data = temp_data.rename(columns={c: temp}) + + data_list.append(temp_data) + data = pd.concat(data_list, axis=1) + + else: + data = rex_wind.get_lat_lon_df(parameter, lat_lon) + col = data.columns[:] + + for i, c in zip(range(len(col)), col): + temp = f"{parameter}_{i}" + data = data.rename(columns={c: temp}) + + meta = rex_wind.meta.loc[col, :] + meta = meta.reset_index(drop=True) + + # Save the retrieved data and metadata to cache. 
+ handle_caching(hash_params, cache_dir, data=data, metadata=meta) - for i,c in zip(range(len(col)),col): - temp = f'{parameter}_{i}' - data = data.rename(columns={c:temp}) + if not to_pandas: + data = convert_to_dataset(data) + data.attrs = meta - meta = rex_wind.meta.loc[col,:] - meta = meta.reset_index(drop=True) - return data, meta + return data, meta diff --git a/mhkit/wave/io/ndbc.py b/mhkit/wave/io/ndbc.py index 019481bc8..268c3390e 100644 --- a/mhkit/wave/io/ndbc.py +++ b/mhkit/wave/io/ndbc.py @@ -1,3 +1,4 @@ +import os from collections import OrderedDict as _OrderedDict from collections import defaultdict as _defaultdict from io import BytesIO @@ -11,9 +12,15 @@ import xarray as xr from bs4 import BeautifulSoup +from mhkit.utils.cache import handle_caching +from mhkit.utils import ( + convert_to_dataset, + convert_to_dataarray, + convert_nested_dict_and_pandas, +) -def read_file(file_name, missing_values=['MM', 9999, 999, 99]): +def read_file(file_name, missing_values=["MM", 9999, 999, 99], to_pandas=True): """ Reads a NDBC wave buoy data file (from https://www.ndbc.noaa.gov). @@ -36,23 +43,31 @@ def read_file(file_name, missing_values=['MM', 9999, 999, 99]): missing_value: list of values List of values that denote missing data + to_pandas: bool (optional) + Flag to output pandas instead of xarray. Default = True. + Returns --------- - data: pandas DataFrame + data: pandas DataFrame or xarray Dataset Data indexed by datetime with columns named according to header row metadata: dict or None Dictionary with {column name: units} key value pairs when the NDBC file contains unit information, otherwise None is returned """ - assert isinstance(file_name, str), 'file_name must be of type str' - assert isinstance( - missing_values, list), 'missing_values must be of type list' + if not isinstance(file_name, str): + raise TypeError(f"file_name must be of type str. 
Got: {type(file_name)}") + if not isinstance(missing_values, list): + raise TypeError( + f"If specified, missing_values must be of type list. Got: {type(missing_values)}" + ) + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. Got: {type(to_pandas)}") # Open file and get header rows f = open(file_name, "r") header = f.readline().rstrip().split() # read potential headers - units = f.readline().rstrip().split() # read potential units + units = f.readline().rstrip().split() # read potential units f.close() # If first line is commented, remove comment sign # @@ -70,31 +85,38 @@ def read_file(file_name, missing_values=['MM', 9999, 999, 99]): # Check if the time stamp contains minutes, and create list of column names # to parse for date - if header[4] == 'mm': + if header[4] == "mm": parse_vals = header[0:5] - date_format = '%Y %m %d %H %M' + date_format = "%Y %m %d %H %M" units = units[5:] # remove date columns from units else: parse_vals = header[0:4] - date_format = '%Y %m %d %H' + date_format = "%Y %m %d %H" units = units[4:] # remove date columns from units # If first line is commented, manually feed in column names if header_commented: - data = pd.read_csv(file_name, sep='\s+', header=None, names=header, - comment="#", parse_dates=[parse_vals]) + data = pd.read_csv( + file_name, + sep="\s+", + header=None, + names=header, + comment="#", + parse_dates=[parse_vals], + ) # If first line is not commented, then the first row can be used as header else: - data = pd.read_csv(file_name, sep='\s+', header=0, - comment="#", parse_dates=[parse_vals]) + data = pd.read_csv( + file_name, sep="\s+", header=0, comment="#", parse_dates=[parse_vals] + ) # Convert index to datetime date_column = "_".join(parse_vals) - data['Time'] = pd.to_datetime(data[date_column], format=date_format) - data.index = data['Time'].values + data["Time"] = pd.to_datetime(data[date_column], format=date_format) + data.index = data["Time"].values # Remove date columns 
del data[date_column] - del data['Time'] + del data["Time"] # If there was a row of units, convert to dictionary if units_exist: @@ -104,7 +126,7 @@ def read_file(file_name, missing_values=['MM', 9999, 999, 99]): # Convert columns to numeric data if possible, otherwise leave as string for column in data: - data[column] = pd.to_numeric(data[column], errors='ignore') + data[column] = pd.to_numeric(data[column], errors="ignore") # Convert column names to float if possible (handles frequency headers) # if there is non-numeric name, just leave all as strings. @@ -116,12 +138,17 @@ def read_file(file_name, missing_values=['MM', 9999, 999, 99]): # Replace indicated missing values with nan data.replace(missing_values, np.nan, inplace=True) + if not to_pandas: + data = convert_to_dataset(data) + return data, metadata -def available_data(parameter, buoy_number=None, proxy=None): - ''' - For a given parameter this will return a DataFrame of years, +def available_data( + parameter, buoy_number=None, proxy=None, clear_cache=False, to_pandas=True +): + """ + For a given parameter this will return a DataFrame or Dataset of years, station IDs and file names that contain that parameter data. Parameters @@ -142,58 +169,95 @@ def available_data(parameter, buoy_number=None, proxy=None): Proxy dict passed to python requests, (e.g. proxy_dict= {"http": 'http:wwwproxy.yourProxy:80/'}) + to_pandas: bool (optional) + Flag to output pandas instead of xarray. Default = True. + Returns ------- - available_data: DataFrame + available_data: pandas DataFrame or xarray Dataset DataFrame with station ID, years, and NDBC file names. 
- ''' - assert isinstance(parameter, str), 'parameter must be a string' - assert isinstance(buoy_number, (str, type(None), list)), ('If ' - 'specified the buoy number must be a string or list of strings') - assert isinstance(proxy, (dict, type(None)) - ), 'If specified proxy must be a dict' - supported = _supported_params(parameter) + """ + if not isinstance(parameter, str): + raise TypeError(f"parameter must be a string. Got: {type(parameter)}") + if not isinstance(buoy_number, (str, type(None), list)): + raise TypeError( + f"If specified, buoy_number must be a string or list of strings. Got: {type(buoy_number)}" + ) + if not isinstance(proxy, (dict, type(None))): + raise TypeError(f"If specified, proxy must be a dict. Got: {type(proxy)}") + _supported_params(parameter) if isinstance(buoy_number, str): - assert len(buoy_number) == 5, ('Buoy must be 5-character' - f'alpha-numeric station identifier got: {buoy_number}') + if not len(buoy_number) == 5: + raise ValueError( + "buoy_number must be 5-character" + f"alpha-numeric station identifier. Got: {buoy_number}" + ) elif isinstance(buoy_number, list): for buoy in buoy_number: - assert len(buoy) == 5, ('Each buoy must be a 5-character' - f'alpha-numeric station identifier got: {buoy}') - ndbc_data = f'https://www.ndbc.noaa.gov/data/historical/{parameter}/' - if proxy == None: - response = requests.get(ndbc_data) + if not len(buoy) == 5: + raise ValueError( + "Each value in the buoy_number list must be a 5-character" + f"alpha-numeric station identifier. Got: {buoy_number}" + ) + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. 
Got: {type(to_pandas)}") + + # Generate a unique hash_params based on the function parameters + hash_params = f"parameter:{parameter}_buoy_number:{buoy_number}_proxy:{proxy}" + cache_dir = os.path.join(os.path.expanduser("~"), ".cache", "mhkit", "ndbc") + + # Check the cache before making the request + data, _, _ = handle_caching(hash_params, cache_dir, clear_cache_file=clear_cache) + + # no coverage bc in coverage runs we have already cached the data/ run this code + if data is None: # pragma: no cover + ndbc_data = f"https://www.ndbc.noaa.gov/data/historical/{parameter}/" + + try: + response = requests.get(ndbc_data, proxies=proxy, timeout=30) + response.raise_for_status() + + except requests.exceptions.Timeout: + print("The request timed out") + response = None + + except requests.exceptions.RequestException as error: + print(f"An error occurred: {error}") + response = None + + if response and response.status_code != 200: + msg = f"request.get({ndbc_data}) failed by returning code of {response.status_code}" + raise Exception(msg) + + filenames = pd.read_html(response.text)[0].Name.dropna() + buoys = _parse_filenames(parameter, filenames) + + available_data = buoys.copy(deep=True) + + # Set year to numeric (makes year key non-unique) + available_data["year"] = available_data.year.str.strip("b") + available_data["year"] = pd.to_numeric(available_data.year.str.strip("_old")) + + if isinstance(buoy_number, str): + available_data = available_data[available_data.id == buoy_number] + elif isinstance(buoy_number, list): + available_data = available_data[available_data.id == buoy_number[0]] + for i in range(1, len(buoy_number)): + data = available_data[available_data.id == buoy_number[i]] + available_data = available_data.append(data) + # Cache the result + handle_caching(hash_params, cache_dir, data=available_data) else: - response = requests.get(ndbc_data, proxies=proxy) + available_data = data - status = response.status_code - if status != 200: - msg = 
f"request.get{ndbc_data} failed by returning code of {status}" - raise Exception(msg) - - filenames = pd.read_html(response.text)[0].Name.dropna() - buoys = _parse_filenames(parameter, filenames) - - available_data = buoys.copy(deep=True) - - # Set year to numeric (makes year key non-unique) - available_data['year'] = available_data.year.str.strip('b') - available_data['year'] = pd.to_numeric( - available_data.year.str.strip('_old')) - - if isinstance(buoy_number, str): - available_data = available_data[available_data.id == buoy_number] - elif isinstance(buoy_number, list): - available_data = available_data[available_data.id == buoy_number[0]] - for i in range(1, len(buoy_number)): - data = available_data[available_data.id == buoy_number[i]] - available_data = available_data.append(data) + if not to_pandas: + available_data = convert_to_dataset(available_data) return available_data def _parse_filenames(parameter, filenames): - ''' + """ Takes a list of available filenames as a series from NDBC then parses out the station ID and year from the file name. @@ -215,37 +279,38 @@ def _parse_filenames(parameter, filenames): ------- buoys: DataFrame DataFrame with keys=['id','year','file_name'] - ''' - assert isinstance( - filenames, pd.Series), 'filenames must be of type pd.Series' - assert isinstance(parameter, str), 'parameter must be a string' + """ + if not isinstance(filenames, pd.Series): + raise TypeError(f"filenames must be of type pd.Series. Got: {type(filenames)}") + if not isinstance(parameter, str): + raise TypeError(f"parameter must be a string. 
Got: {type(parameter)}") supported = _supported_params(parameter) file_seps = { - 'swden': 'w', - 'swdir': 'd', - 'swdir2': 'i', - 'swr1': 'j', - 'swr2': 'k', - 'stdmet': 'h', - 'cwind': 'c' + "swden": "w", + "swdir": "d", + "swdir2": "i", + "swr1": "j", + "swr2": "k", + "stdmet": "h", + "cwind": "c", } file_sep = file_seps[parameter] - filenames = filenames[filenames.str.contains('.txt.gz')] - buoy_id_year_str = filenames.str.split('.', expand=True)[0] + filenames = filenames[filenames.str.contains(".txt.gz")] + buoy_id_year_str = filenames.str.split(".", expand=True)[0] buoy_id_year = buoy_id_year_str.str.split(file_sep, n=1, expand=True) - buoys = buoy_id_year.rename(columns={0: 'id', 1: 'year'}) + buoys = buoy_id_year.rename(columns={0: "id", 1: "year"}) expected_station_id_length = 5 buoys = buoys[buoys.id.str.len() == expected_station_id_length] - buoys['filename'] = filenames + buoys["filename"] = filenames return buoys -def request_data(parameter, filenames, proxy=None): - ''' - Requests data by filenames and returns a dictionary of DataFrames +def request_data(parameter, filenames, proxy=None, clear_cache=False, to_pandas=True): + """ + Requests data by filenames and returns a dictionary of DataFrames or dictionary of Datasets for each filename passed. If filenames for a single buoy are passed then the yearly DataFrames in the returned dictionary (ndbc_data) are indexed by year (e.g. ndbc_data['2014']). If multiple buoy ids are @@ -263,74 +328,107 @@ def request_data(parameter, filenames, proxy=None): 'stdmet': 'Standard Meteorological Current Year Historical Data' 'cwind' : 'Continuous Winds Current Year Historical Data' - filenames: pandas Series or DataFrame + filenames: pandas Series, pandas DataFrame, xarray DataArray, or xarray Dataset Data filenames on https://www.ndbc.noaa.gov/data/historical/{parameter}/ proxy: dict Proxy dict passed to python requests, (e.g. 
proxy_dict= {"http": 'http:wwwproxy.yourProxy:80/'}) + to_pandas: bool (optional) + Flag to output a dictionary of pandas objects instead of a dictionary + of xarray objects. Default = True. + Returns ------- ndbc_data: dict - Dictionary of DataFrames indexed by buoy and year. - ''' - assert isinstance(filenames, (pd.Series, pd.DataFrame)), ( - 'filenames must be of type pd.Series') - assert isinstance(parameter, str), 'parameter must be a string' - assert isinstance(proxy, (dict, type(None))), ('If specified proxy' - 'must be a dict') - - supported = _supported_params(parameter) - if isinstance(filenames, pd.DataFrame): - filenames = pd.Series(filenames.squeeze()) - assert len(filenames) > 0, "At least 1 filename must be passed" + Dictionary of DataFrames/Datasets indexed by buoy and year. + """ + filenames = convert_to_dataarray(filenames) + filenames = pd.Series(filenames) + if not isinstance(parameter, str): + raise TypeError(f"parameter must be a string. Got: {type(parameter)}") + if not isinstance(proxy, (dict, type(None))): + raise TypeError(f"If specified, proxy must be a dict. Got: {type(proxy)}") + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. 
Got: {type(to_pandas)}") + + _supported_params(parameter) + if not len(filenames) > 0: + raise ValueError("At least 1 filename must be passed") + + # Define the path to the cache directory + cache_dir = os.path.join(os.path.expanduser("~"), ".cache", "mhkit", "ndbc") buoy_data = _parse_filenames(parameter, filenames) - parameter_url = f'https://www.ndbc.noaa.gov/data/historical/{parameter}' ndbc_data = _defaultdict(dict) - for buoy_id in buoy_data['id'].unique(): - buoy = buoy_data[buoy_data['id'] == buoy_id] + for buoy_id in buoy_data["id"].unique(): + buoy = buoy_data[buoy_data["id"] == buoy_id] years = buoy.year filenames = buoy.filename for year, filename in zip(years, filenames): - file_url = f'{parameter_url}/{filename}' + # Create a unique filename based on the function parameters for caching + hash_params = f"{buoy_id}_{parameter}_{year}_{filename}" + cached_data, _, _ = handle_caching( + hash_params, cache_dir, clear_cache_file=clear_cache + ) + + if cached_data is not None: + ndbc_data[buoy_id][year] = cached_data + continue + file_url = ( + f"https://www.ndbc.noaa.gov/data/historical/{parameter}/{filename}" + ) if proxy == None: response = requests.get(file_url) else: response = requests.get(file_url, proxies=proxy) try: - data = zlib.decompress(response.content, 16+zlib.MAX_WBITS) - df = pd.read_csv(BytesIO(data), sep='\s+', low_memory=False) + data = zlib.decompress(response.content, 16 + zlib.MAX_WBITS) + df = pd.read_csv(BytesIO(data), sep="\s+", low_memory=False) # catch when units are included below the header - firstYear = df['MM'][0] - if isinstance(firstYear, str) and firstYear == 'mo': - df = pd.read_csv(BytesIO(data), sep='\s+', - low_memory=False, skiprows=[1]) + firstYear = df["MM"][0] + if isinstance(firstYear, str) and firstYear == "mo": + df = pd.read_csv( + BytesIO(data), sep="\s+", low_memory=False, skiprows=[1] + ) except zlib.error: - msg = (f'Issue decompressing the NDBC file {filename}' - f'(id: {buoy_id}, year: {year}). 
Please request ' - 'the data again.') + msg = ( + f"Issue decompressing the NDBC file {filename}" + f"(id: {buoy_id}, year: {year}). Please request " + "the data again." + ) print(msg) except pandas.errors.EmptyDataError: - msg = (f'The NDBC buoy {buoy_id} for year {year} with ' - f'filename {filename} is empty or missing ' - 'data. Please omit this file from your data ' - 'request in the future.') + msg = ( + f"The NDBC buoy {buoy_id} for year {year} with " + f"filename {filename} is empty or missing " + "data. Please omit this file from your data " + "request in the future." + ) print(msg) else: ndbc_data[buoy_id][year] = df - if len(ndbc_data) == 1: + # Cache the data after processing it if it exists + if year in ndbc_data[buoy_id]: + handle_caching( + hash_params, cache_dir, data=ndbc_data[buoy_id][year] + ) + + if buoy_id and len(ndbc_data) == 1: ndbc_data = ndbc_data[buoy_id] + if not to_pandas: + ndbc_data = convert_nested_dict_and_pandas(ndbc_data) + return ndbc_data -def to_datetime_index(parameter, ndbc_data): - ''' +def to_datetime_index(parameter, ndbc_data, to_pandas=True): + """ Converts the NDBC date and time information reported in separate columns into a DateTime index and removed the NDBC date & time columns. @@ -346,39 +444,55 @@ def to_datetime_index(parameter, ndbc_data): 'stdmet': 'Standard Meteorological Current Year Historical Data' 'cwind': 'Continuous Winds Current Year Historical Data' - ndbc_data: DataFrame + ndbc_data: pandas DataFrame or xarray Dataset NDBC data in dataframe with date and time columns to be converted + to_pandas: bool (optional) + Flag to output pandas instead of xarray. Default = True. 
+ Returns ------- - df_datetime: DataFrame + df_datetime: pandas DataFrame or xarray Dataset Dataframe with NDBC date columns removed, and datetime index - ''' + """ - assert isinstance(parameter, str), 'parameter must be a string' - assert isinstance( - ndbc_data, pd.DataFrame), 'ndbc_data must be of type pd.DataFrame' + if not isinstance(parameter, str): + raise TypeError(f"parameter must be a string. Got: {type(parameter)}") + if isinstance(ndbc_data, xr.Dataset): + ndbc_data = ndbc_data.to_pandas() + if not isinstance(ndbc_data, pd.DataFrame): + raise TypeError( + f"ndbc_data must be of type pd.DataFrame. Got: {type(ndbc_data)}" + ) + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. Got: {type(to_pandas)}") df_datetime = ndbc_data.copy(deep=True) - df_datetime['date'], ndbc_date_cols = dates_to_datetime( - df_datetime, return_date_cols=True) + df_datetime["date"], ndbc_date_cols = dates_to_datetime( + df_datetime, return_date_cols=True + ) df_datetime = df_datetime.drop(ndbc_date_cols, axis=1) - df_datetime = df_datetime.set_index('date') - if parameter in ['swden', 'swdir', 'swdir2', 'swr1', 'swr2']: + df_datetime = df_datetime.set_index("date") + if parameter in ["swden", "swdir", "swdir2", "swr1", "swr2"]: df_datetime.columns = df_datetime.columns.astype(float) + if not to_pandas: + df_datetime = convert_to_dataset(df_datetime) + return df_datetime -def dates_to_datetime(data, return_date_cols=False, return_as_dataframe=False): - ''' - Takes a DataFrame and converts the NDBC date columns - (e.g. "#YY MM DD hh mm") to datetime. Returns a DataFrame with the +def dates_to_datetime( + data, return_date_cols=False, return_as_dataframe=False, to_pandas=True +): + """ + Takes a DataFrame/Dataset and converts the NDBC date columns + (e.g. "#YY MM DD hh mm") to datetime. Returns a DataFrame/Dataset with the removed NDBC date columns a new ['date'] columns with DateTime Format. 
Parameters ---------- - data: DataFrame + data: pandas DataFrame or xarray Dataset Dataframe with headers (e.g. ['YY', 'MM', 'DD', 'hh', {'mm'}]) return_date_col: Bool (optional) @@ -387,52 +501,62 @@ def dates_to_datetime(data, return_date_cols=False, return_as_dataframe=False): return_as_dataFrame: bool Results returned as a DataFrame (useful for MHKiT-MATLAB) + to_pandas: bool (optional) + Flag to output pandas instead of xarray. Default = True. + Returns ------- - date: Series + date: pandas Series or xarray DataArray Series with NDBC dates dropped and new ['date'] column in DateTime format ndbc_date_cols: list (optional) - List of the DataFrame columns headers for dates as provided by + List of the DataFrame/Dataset columns headers for dates as provided by NDBC - ''' - assert isinstance(data, pd.DataFrame), 'data must be of type pd.DataFrame' - assert isinstance(return_date_cols, - bool), 'return_date_cols must be of type bool' + """ + if isinstance(data, xr.Dataset): + data = pd.DataFrame(data) + if not isinstance(data, pd.DataFrame): + raise TypeError(f"data must be of type pd.DataFrame. Got: {type(data)}") + if not isinstance(return_date_cols, bool): + raise TypeError( + f"return_date_cols must be of type bool. Got: {type(return_date_cols)}" + ) + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. 
Got: {type(to_pandas)}") df = data.copy(deep=True) cols = df.columns.values.tolist() try: - minutes_loc = cols.index('mm') + minutes_loc = cols.index("mm") minutes = True except: - df['mm'] = np.zeros(len(df)).astype(int).astype(str) + df["mm"] = np.zeros(len(df)).astype(int).astype(str) minutes = False row_0_is_units = False - year_string = [col for col in cols if col.startswith('Y')] + year_string = [col for col in cols if col.startswith("Y")] if not year_string: - year_string = [col for col in cols if col.startswith('#')] + year_string = [col for col in cols if col.startswith("#")] if not year_string: - print(f'ERROR: Could Not Find Year Column in {cols}') + print(f"ERROR: Could Not Find Year Column in {cols}") year_string = year_string[0] - year_fmt = '%Y' - if str(df[year_string][0]).startswith('#'): + year_fmt = "%Y" + if str(df[year_string][0]).startswith("#"): row_0_is_units = True df = df.drop(df.index[0]) - elif year_string[0] == 'YYYY': + elif year_string[0] == "YYYY": year_string = year_string[0] - year_fmt = '%Y' - elif year_string[0] == 'YY': + year_fmt = "%Y" + elif year_string[0] == "YY": year_string = year_string[0] - year_fmt = '%y' + year_fmt = "%y" - parse_columns = [year_string, 'MM', 'DD', 'hh', 'mm'] + parse_columns = [year_string, "MM", "DD", "hh", "mm"] df = _date_string_to_datetime(df, parse_columns, year_fmt) - date = df['date'] + date = df["date"] if row_0_is_units: date = pd.concat([pd.Series([np.nan]), date]) @@ -440,18 +564,23 @@ def dates_to_datetime(data, return_date_cols=False, return_as_dataframe=False): if return_as_dataframe: date = pd.DataFrame(date) + if not to_pandas: + date = convert_to_dataset(date) + elif not to_pandas: + date = convert_to_dataarray(date) + if return_date_cols: if minutes: - ndbc_date_cols = [year_string, 'MM', 'DD', 'hh', 'mm'] + ndbc_date_cols = [year_string, "MM", "DD", "hh", "mm"] else: - ndbc_date_cols = [year_string, 'MM', 'DD', 'hh'] + ndbc_date_cols = [year_string, "MM", "DD", "hh"] return date, 
ndbc_date_cols return date def _date_string_to_datetime(df, columns, year_fmt): - ''' + """ Takes a NDBC df and creates a datetime from multiple columns headers by combining each column into a single string. Then the datetime method is applied given the expected format. @@ -473,28 +602,31 @@ def _date_string_to_datetime(df, columns, year_fmt): ------- df: DataFrame The passed df with a new column ['date'] with the datetime format - ''' - assert isinstance(df, pd.DataFrame), 'df must be of type pd.DataFrame' - assert isinstance(columns, list), 'Columns must be a list' - assert isinstance(year_fmt, str), 'year_fmt must be a string' + """ + if not isinstance(df, pd.DataFrame): + raise TypeError(f"df must be of type pd.DataFrame. Got: {type(df)}") + if not isinstance(columns, list): + raise TypeError(f"columns must be a list. Got: {type(columns)}") + if not isinstance(year_fmt, str): + raise TypeError(f"year_fmt must be a string. Got: {type(year_fmt)}") # Convert to str and zero pad for key in columns: df[key] = df[key].astype(str).str.zfill(2) - df['date_string'] = df[columns[0]] + df["date_string"] = df[columns[0]] for column in columns[1:]: - df['date_string'] = df[['date_string', column]].apply( - lambda x: ''.join(x), axis=1) - df['date'] = pd.to_datetime( - df['date_string'], format=f'{year_fmt}%m%d%H%M') - del df['date_string'] + df["date_string"] = df[["date_string", column]].apply( + lambda x: "".join(x), axis=1 + ) + df["date"] = pd.to_datetime(df["date_string"], format=f"{year_fmt}%m%d%H%M") + del df["date_string"] return df -def parameter_units(parameter=''): - ''' +def parameter_units(parameter=""): + """ Returns an ordered dictionary of NDBC parameters with unit values. If no parameter is passed then an ordered dictionary of all NDBC parameterz specified unites is returned. 
If a parameter is specified @@ -530,163 +662,175 @@ def parameter_units(parameter=''): ------- units: dict Dictionary of parameter units - ''' - - assert isinstance(parameter, str), 'parameter must be a string' - - if parameter == 'adcp': - units = {'DEP01': 'm', - 'DIR01': 'deg', - 'SPD01': 'cm/s', - } - elif parameter == 'cwind': - units = {'WDIR': 'degT', - 'WSPD': 'm/s', - 'GDR': 'degT', - 'GST': 'm/s', - 'GTIME': 'hhmm' - } - elif parameter == 'dart': - units = {'T': '-', - 'HEIGHT': 'm', - } - elif parameter == 'derived2': - units = {'CHILL': 'degC', - 'HEAT': 'degC', - 'ICE': 'cm/hr', - 'WSPD10': 'm/s', - 'WSPD20': 'm/s' - } - elif parameter == 'ocean': - units = {'DEPTH': 'm', - 'OTMP': 'degC', - 'COND': 'mS/cm', - 'SAL': 'psu', - 'O2%': '%', - 'O2PPM': 'ppm', - 'CLCON': 'ug/l', - 'TURB': 'FTU', - 'PH': '-', - 'EH': 'mv', - } - elif parameter == 'rain': - units = {'ACCUM': 'mm', - } - elif parameter == 'rain10': - units = {'RATE': 'mm/h', - } - elif parameter == 'rain24': - units = {'RATE': 'mm/h', - 'PCT': '%', - 'SDEV': '-', - } - elif parameter == 'realtime2': - units = {'WVHT': 'm', - 'SwH': 'm', - 'SwP': 'sec', - 'WWH': 'm', - 'WWP': 'sec', - 'SwD': '-', - 'WWD': 'degT', - 'STEEPNESS': '-', - 'APD': 'sec', - 'MWD': 'degT', - } - elif parameter == 'srad': - units = {'SRAD1': 'w/m2', - 'SRAD2': 'w/m2', - 'SRAD3': 'w/m2', - } - elif parameter == 'stdmet': - units = {'WDIR': 'degT', - 'WSPD': 'm/s', - 'GST': 'm/s', - 'WVHT': 'm', - 'DPD': 'sec', - 'APD': 'sec', - 'MWD': 'degT', - 'PRES': 'hPa', - 'ATMP': 'degC', - 'WTMP': 'degC', - 'DEWP': 'degC', - 'VIS': 'nmi', - 'PTDY': 'hPa', - 'TIDE': 'ft'} - elif parameter == 'supl': - units = {'PRES': 'hPa', - 'PTIME': 'hhmm', - 'WSPD': 'm/s', - 'WDIR': 'degT', - 'WTIME': 'hhmm' - } - elif parameter == 'swden': - units = {'swden': '(m*m)/Hz'} - elif parameter == 'swdir': - units = {'swdir': 'deg'} - elif parameter == 'swdir2': - units = {'swdir2': 'deg'} - elif parameter == 'swr1': - units = {'swr1': ''} - elif 
parameter == 'swr2': - units = {'swr2': ''} + """ + + if not isinstance(parameter, str): + raise TypeError(f"parameter must be a string. Got: {type(parameter)}") + + if parameter == "adcp": + units = { + "DEP01": "m", + "DIR01": "deg", + "SPD01": "cm/s", + } + elif parameter == "cwind": + units = { + "WDIR": "degT", + "WSPD": "m/s", + "GDR": "degT", + "GST": "m/s", + "GTIME": "hhmm", + } + elif parameter == "dart": + units = { + "T": "-", + "HEIGHT": "m", + } + elif parameter == "derived2": + units = { + "CHILL": "degC", + "HEAT": "degC", + "ICE": "cm/hr", + "WSPD10": "m/s", + "WSPD20": "m/s", + } + elif parameter == "ocean": + units = { + "DEPTH": "m", + "OTMP": "degC", + "COND": "mS/cm", + "SAL": "psu", + "O2%": "%", + "O2PPM": "ppm", + "CLCON": "ug/l", + "TURB": "FTU", + "PH": "-", + "EH": "mv", + } + elif parameter == "rain": + units = { + "ACCUM": "mm", + } + elif parameter == "rain10": + units = { + "RATE": "mm/h", + } + elif parameter == "rain24": + units = { + "RATE": "mm/h", + "PCT": "%", + "SDEV": "-", + } + elif parameter == "realtime2": + units = { + "WVHT": "m", + "SwH": "m", + "SwP": "sec", + "WWH": "m", + "WWP": "sec", + "SwD": "-", + "WWD": "degT", + "STEEPNESS": "-", + "APD": "sec", + "MWD": "degT", + } + elif parameter == "srad": + units = { + "SRAD1": "w/m2", + "SRAD2": "w/m2", + "SRAD3": "w/m2", + } + elif parameter == "stdmet": + units = { + "WDIR": "degT", + "WSPD": "m/s", + "GST": "m/s", + "WVHT": "m", + "DPD": "sec", + "APD": "sec", + "MWD": "degT", + "PRES": "hPa", + "ATMP": "degC", + "WTMP": "degC", + "DEWP": "degC", + "VIS": "nmi", + "PTDY": "hPa", + "TIDE": "ft", + } + elif parameter == "supl": + units = { + "PRES": "hPa", + "PTIME": "hhmm", + "WSPD": "m/s", + "WDIR": "degT", + "WTIME": "hhmm", + } + elif parameter == "swden": + units = {"swden": "(m*m)/Hz"} + elif parameter == "swdir": + units = {"swdir": "deg"} + elif parameter == "swdir2": + units = {"swdir2": "deg"} + elif parameter == "swr1": + units = {"swr1": ""} + elif parameter 
== "swr2": + units = {"swr2": ""} else: - units = {'swden': '(m*m)/Hz', - 'PRES': 'hPa', - 'PTIME': 'hhmm', - 'WDIR': 'degT', - 'WTIME': 'hhmm', - 'GST': 'm/s', - 'WVHT': 'm', - 'DPD': 'sec', - 'APD': 'sec', - 'MWD': 'degT', - 'ATMP': 'degC', - 'WTMP': 'degC', - 'DEWP': 'degC', - 'VIS': 'nmi', - 'PTDY': 'hPa', - 'TIDE': 'ft', - 'SRAD1': 'w/m2', - 'SRAD2': 'w/m2', - 'SRAD3': 'w/m2', - 'WVHT': 'm', - 'SwH': 'm', - 'SwP': 'sec', - 'WWH': 'm', - 'WWP': 'sec', - 'SwD': '-', - 'WWD': 'degT', - 'STEEPNESS': '-', - 'APD': 'sec', - 'RATE': 'mm/h', - 'PCT': '%', - 'SDEV': '-', - 'ACCUM': 'mm', - 'DEPTH': 'm', - 'OTMP': 'degC', - 'COND': 'mS/cm', - 'SAL': 'psu', - 'O2%': '%', - 'O2PPM': 'ppm', - 'CLCON': 'ug/l', - 'TURB': 'FTU', - 'PH': '-', - 'EH': 'mv', - 'CHILL': 'degC', - 'HEAT': 'degC', - 'ICE': 'cm/hr', - 'WSPD': 'm/s', - 'WSPD10': 'm/s', - 'WSPD20': 'm/s', - 'T': '-', - 'HEIGHT': 'm', - 'GDR': 'degT', - 'GST': 'm/s', - 'GTIME': 'hhmm', - 'DEP01': 'm', - 'DIR01': 'deg', - 'SPD01': 'cm/s', - } + units = { + "swden": "(m*m)/Hz", + "PRES": "hPa", + "PTIME": "hhmm", + "WDIR": "degT", + "WTIME": "hhmm", + "DPD": "sec", + "MWD": "degT", + "ATMP": "degC", + "WTMP": "degC", + "DEWP": "degC", + "VIS": "nmi", + "PTDY": "hPa", + "TIDE": "ft", + "SRAD1": "w/m2", + "SRAD2": "w/m2", + "SRAD3": "w/m2", + "WVHT": "m", + "SwH": "m", + "SwP": "sec", + "WWH": "m", + "WWP": "sec", + "SwD": "-", + "WWD": "degT", + "STEEPNESS": "-", + "APD": "sec", + "RATE": "mm/h", + "PCT": "%", + "SDEV": "-", + "ACCUM": "mm", + "DEPTH": "m", + "OTMP": "degC", + "COND": "mS/cm", + "SAL": "psu", + "O2%": "%", + "O2PPM": "ppm", + "CLCON": "ug/l", + "TURB": "FTU", + "PH": "-", + "EH": "mv", + "CHILL": "degC", + "HEAT": "degC", + "ICE": "cm/hr", + "WSPD": "m/s", + "WSPD10": "m/s", + "WSPD20": "m/s", + "T": "-", + "HEIGHT": "m", + "GDR": "degT", + "GST": "m/s", + "GTIME": "hhmm", + "DEP01": "m", + "DIR01": "deg", + "SPD01": "cm/s", + } units = _OrderedDict(sorted(units.items())) @@ -694,7 +838,7 @@ def 
parameter_units(parameter=''): def _supported_params(parameter): - ''' + """ There is a significant number of datasets provided by NDBC. There is specific data processing required for each type. Therefore this function throws an error for any data type not currently covered. @@ -712,33 +856,28 @@ def _supported_params(parameter): ------- msg: bool Whether the parameter is supported. - ''' - assert isinstance(parameter, str), 'parameter must be a string' + """ + if not isinstance(parameter, str): + raise TypeError(f"parameter must be a string. Got: {type(parameter)}") supported = True - supported_params = [ - 'swden', - 'swdir', - 'swdir2', - 'swr1', - 'swr2', - 'stdmet', - 'cwind' - ] + supported_params = ["swden", "swdir", "swdir2", "swr1", "swr2", "stdmet", "cwind"] param = [param for param in supported_params if param == parameter] if not param: supported = False - msg = ["Currently parameters ['swden', 'swdir', 'swdir2', " + - "'swr1', 'swr2', 'stdmet', 'cwind'] are supported. \n" + - "If you would like to see more data types please \n" + - " open an issue or submit a Pull Request on GitHub"] + msg = [ + "Currently parameters ['swden', 'swdir', 'swdir2', " + + "'swr1', 'swr2', 'stdmet', 'cwind'] are supported. \n" + + "If you would like to see more data types please \n" + + " open an issue or submit a Pull Request on GitHub" + ] raise Exception(msg[0]) return supported def _historical_parameters(): - ''' + """ Names and description of all NDBC Historical Data. Available Data: https://www.ndbc.noaa.gov/data/ @@ -754,26 +893,26 @@ def _historical_parameters(): ------- msg: dict Names and decriptions of historical parameters. 
- ''' + """ parameters = { - 'adcp': 'Acoustic Doppler Current Profiler Current Year Historical Data', - 'adcp2': 'Acoustic Doppler Current Profiler Current Year Historical Data', - 'cwind': 'Continuous Winds Current Year Historical Data', - 'dart': 'Water Column Height (DART) Current Year Historical Data', - 'mmbcur': 'Marsh-McBirney Current Measurements', - 'ocean': 'Oceanographic Current Year Historical Data', - 'rain': 'Hourly Rain Current Year Historical Data', - 'rain10': '10-Minute Rain Current Year Historical Data', - 'rain24': '24-Hour Rain Current Year Historical Data', - 'srad': 'Solar Radiation Current Year Historical Data', - 'stdmet': 'Standard Meteorological Current Year Historical Data', - 'supl': 'Supplemental Measurements Current Year Historical Data', - 'swden': 'Raw Spectral Wave Current Year Historical Data', - 'swdir': 'Spectral Wave Current Year Historical Data (alpha1)', - 'swdir2': 'Spectral Wave Current Year Historical Data (alpha2)', - 'swr1': 'Spectral Wave Current Year Historical Data (r1)', - 'swr2': 'Spectral Wave Current Year Historical Data (r2)', - 'wlevel': 'Tide Current Year Historical Data', + "adcp": "Acoustic Doppler Current Profiler Current Year Historical Data", + "adcp2": "Acoustic Doppler Current Profiler Current Year Historical Data", + "cwind": "Continuous Winds Current Year Historical Data", + "dart": "Water Column Height (DART) Current Year Historical Data", + "mmbcur": "Marsh-McBirney Current Measurements", + "ocean": "Oceanographic Current Year Historical Data", + "rain": "Hourly Rain Current Year Historical Data", + "rain10": "10-Minute Rain Current Year Historical Data", + "rain24": "24-Hour Rain Current Year Historical Data", + "srad": "Solar Radiation Current Year Historical Data", + "stdmet": "Standard Meteorological Current Year Historical Data", + "supl": "Supplemental Measurements Current Year Historical Data", + "swden": "Raw Spectral Wave Current Year Historical Data", + "swdir": "Spectral Wave Current Year 
Historical Data (alpha1)", + "swdir2": "Spectral Wave Current Year Historical Data (alpha2)", + "swr1": "Spectral Wave Current Year Historical Data (r1)", + "swr2": "Spectral Wave Current Year Historical Data (r2)", + "wlevel": "Tide Current Year Historical Data", } return parameters @@ -801,74 +940,88 @@ def request_directional_data(buoy, year): Dataset containing the five parameter data indexed by frequency and date. """ - assert isinstance(buoy, str), 'buoy must be a string' - assert isinstance(year, int), 'year must be an int' - - directional_parameters = ['swden', 'swdir', 'swdir2', 'swr1', 'swr2'] - - seps = {'swden': 'w', - 'swdir': 'd', - 'swdir2': 'i', - 'swr1': 'j', - 'swr2': 'k', - } + if not isinstance(buoy, str): + raise TypeError(f"buoy must be a string. Got: {type(buoy)}") + if not isinstance(year, int): + raise TypeError(f"year must be an int. Got: {type(year)}") + + directional_parameters = ["swden", "swdir", "swdir2", "swr1", "swr2"] + + seps = { + "swden": "w", + "swdir": "d", + "swdir2": "i", + "swr1": "j", + "swr2": "k", + } data_dict = {} for param in directional_parameters: - file = f'{buoy}{seps[param]}{year}.txt.gz' - raw_data = request_data(param, pd.Series([file,]))[str(year)] + file = f"{buoy}{seps[param]}{year}.txt.gz" + raw_data = request_data( + param, + pd.Series( + [ + file, + ] + ), + )[str(year)] pd_data = to_datetime_index(param, raw_data) xr_data = xr.DataArray(pd_data) - xr_data = xr_data.astype(float).rename({'dim_1': 'frequency', }) - if param in ['swr1', 'swr2']: - xr_data = xr_data/100.0 + xr_data = xr_data.astype(float).rename( + { + "dim_1": "frequency", + } + ) + if param in ["swr1", "swr2"]: + xr_data = xr_data / 100.0 xr_data.frequency.attrs = { - 'units': 'Hz', - 'long_name': 'frequency', - 'standard_name': 'f', + "units": "Hz", + "long_name": "frequency", + "standard_name": "f", } xr_data.date.attrs = { - 'units': '', - 'long_name': 'datetime', - 'standard_name': 't', + "units": "", + "long_name": "datetime", + 
"standard_name": "t", } data_dict[param] = xr_data - data_dict['swden'].attrs = { - 'units': 'm^2/Hz', - 'long_name': 'omnidirecational spectrum', - 'standard_name': 'S', - 'description': 'Omnidirectional *sea surface elevation variance (m^2)* spectrum (/Hz).' + data_dict["swden"].attrs = { + "units": "m^2/Hz", + "long_name": "omnidirecational spectrum", + "standard_name": "S", + "description": "Omnidirectional *sea surface elevation variance (m^2)* spectrum (/Hz).", } - data_dict['swdir'].attrs = { - 'units': 'deg', - 'long_name': 'mean wave direction', - 'standard_name': 'α1', - 'description': 'Mean wave direction.' + data_dict["swdir"].attrs = { + "units": "deg", + "long_name": "mean wave direction", + "standard_name": "α1", + "description": "Mean wave direction.", } - data_dict['swdir2'].attrs = { - 'units': 'deg', - 'long_name': 'principal wave direction', - 'standard_name': 'α2', - 'description': 'Principal wave direction.' + data_dict["swdir2"].attrs = { + "units": "deg", + "long_name": "principal wave direction", + "standard_name": "α2", + "description": "Principal wave direction.", } - data_dict['swr1'].attrs = { - 'units': '', - 'long_name': 'coordinate r1', - 'standard_name': 'r1', - 'description': 'First normalized polar coordinate of the Fourier coefficients (nondimensional).' + data_dict["swr1"].attrs = { + "units": "", + "long_name": "coordinate r1", + "standard_name": "r1", + "description": "First normalized polar coordinate of the Fourier coefficients (nondimensional).", } - data_dict['swr2'].attrs = { - 'units': '', - 'long_name': 'coordinate r2', - 'standard_name': 'r2', - 'description': 'Second normalized polar coordinate of the Fourier coefficients (nondimensional).' 
+ data_dict["swr2"].attrs = { + "units": "", + "long_name": "coordinate r2", + "standard_name": "r2", + "description": "Second normalized polar coordinate of the Fourier coefficients (nondimensional).", } return xr.Dataset(data_dict) @@ -899,40 +1052,52 @@ def _create_spectrum(data, frequencies, directions, name, units): DataArray containing the spectrum values indexed by frequency and wave direction. """ - assert isinstance(data, np.ndarray), 'data must be an array' - assert isinstance(frequencies, np.ndarray), 'frequencies must be an array' - assert isinstance(directions, np.ndarray), 'directions must be an array' - assert isinstance(name, str), 'name must be a string' - assert isinstance(units, str), 'units must be a string' - - msg = (f'data has wrong shape {data.shape}, ' + - f'expected {(len(frequencies), len(directions))}') - assert data.shape == (len(frequencies), len(directions)), msg + if not isinstance(data, np.ndarray): + raise TypeError(f"data must be of type np.ndarray. Got: {type(data)}") + if not isinstance(frequencies, np.ndarray): + raise TypeError( + f"frequencies must be of type np.ndarray. Got: {type(frequencies)}" + ) + if not isinstance(directions, np.ndarray): + raise TypeError( + f"directions must be of type np.ndarray. Got: {type(directions)}" + ) + if not isinstance(name, str): + raise TypeError(f"name must be of type string. Got: {type(name)}") + if not isinstance(units, str): + raise TypeError(f"units must be of type string. 
Got: {type(units)}") + + msg = ( + f"data has wrong shape {data.shape}, " + + f"expected {(len(frequencies), len(directions))}" + ) + if not data.shape == (len(frequencies), len(directions)): + raise ValueError(msg) direction_attrs = { - 'units': 'deg', - 'long_name': 'wave direction', - 'standard_name': 'direction', + "units": "deg", + "long_name": "wave direction", + "standard_name": "direction", } frequency_attrs = { - 'units': 'Hz', - 'long_name': 'frequency', - 'standard_name': 'f', + "units": "Hz", + "long_name": "frequency", + "standard_name": "f", } spectrum = xr.DataArray( data, coords={ - 'frequency': ('frequency', frequencies, frequency_attrs), - 'direction': ('direction', directions, direction_attrs) + "frequency": ("frequency", frequencies, frequency_attrs), + "direction": ("direction", directions, direction_attrs), }, attrs={ - 'units': f'{units}/Hz/deg', - 'long_name': f'{name} spectrum', - 'standard_name': 'spectrum', - 'description': f'*{name} ({units})* spectrum (/Hz/deg).', - } + "units": f"{units}/Hz/deg", + "long_name": f"{name} spectrum", + "standard_name": "spectrum", + "description": f"*{name} ({units})* spectrum (/Hz/deg).", + }, ) return spectrum @@ -957,27 +1122,26 @@ def create_spread_function(data, directions): DataArray containing the spread function values indexed by frequency and wave direction. """ - assert isinstance(data, xr.Dataset), 'data must be a Dataset' - assert isinstance(directions, np.ndarray), 'directions must be an array' + if not isinstance(data, xr.Dataset): + raise TypeError(f"data must be of type xr.Dataset. Got: {type(data)}") + if not isinstance(directions, np.ndarray): + raise TypeError( + f"directions must be of type np.ndarray. 
Got: {type(directions)}" + ) - r1 = data['swr1'].data.reshape(-1, 1) - r2 = data['swr2'].data.reshape(-1, 1) - a1 = data['swdir'].data.reshape(-1, 1) - a2 = data['swdir2'].data.reshape(-1, 1) + r1 = data["swr1"].data.reshape(-1, 1) + r2 = data["swr2"].data.reshape(-1, 1) + a1 = data["swdir"].data.reshape(-1, 1) + a2 = data["swdir2"].data.reshape(-1, 1) a = directions.reshape(1, -1) spread = ( - 1/np.pi * ( - 0.5 + - r1*np.cos(np.deg2rad(a-a1)) + - r2*np.cos(2*np.deg2rad(a-a2)) - ) + 1 + / np.pi + * (0.5 + r1 * np.cos(np.deg2rad(a - a1)) + r2 * np.cos(2 * np.deg2rad(a - a2))) ) spread = _create_spectrum( - spread, - data.frequency.values, - directions, - name="Spread", - units="1") + spread, data.frequency.values, directions, name="Spread", units="1" + ) return spread @@ -1000,27 +1164,32 @@ def create_directional_spectrum(data, directions): DataArray containing the spectrum values indexed by frequency and wave direction. """ - assert isinstance(data, xr.Dataset), 'data must be a Dataset' - assert isinstance(directions, np.ndarray), 'directions must be an array' + if not isinstance(data, xr.Dataset): + raise TypeError(f"data must be of type xr.Dataset. Got: {type(data)}") + if not isinstance(directions, np.ndarray): + raise TypeError( + f"directions must be of type np.ndarray. Got: {type(directions)}" + ) spread = create_spread_function(data, directions).values - omnidirectional_spectrum = data['swden'].data.reshape(-1, 1) + omnidirectional_spectrum = data["swden"].data.reshape(-1, 1) spectrum = omnidirectional_spectrum * spread spectrum = _create_spectrum( spectrum, data.frequency.values, directions, name="Elevation variance", - units="m^2") + units="m^2", + ) return spectrum def get_buoy_metadata(station_number: str): """ - Fetches and parses the metadata of a National Data Buoy Center (NDBC) station + Fetches and parses the metadata of a National Data Buoy Center (NDBC) station from https://www.ndbc.noaa.gov. 
- Extracts information such as provider, buoy type, latitude, longitude, and + Extracts information such as provider, buoy type, latitude, longitude, and other metadata from the station's webpage. Parameters @@ -1046,29 +1215,28 @@ def get_buoy_metadata(station_number: str): soup = BeautifulSoup(content, "html.parser") # Find the title element - title_element = soup.find('h1') + title_element = soup.find("h1") # Extract the title (remove the trailing image and whitespace) - title = title_element.get_text(strip=True).split('\n')[0] + title = title_element.get_text(strip=True).split("\n")[0] # Check if the title element exists - if title == 'Station not found': - raise ValueError( - f"Invalid or nonexistent station number: {station_number}") + if title == "Station not found": + raise ValueError(f"Invalid or nonexistent station number: {station_number}") # Save buoy name to a dictionary data = {} - data['buoy'] = title + data["buoy"] = title # Find the specific div containing the buoy metadata - metadata_div = soup.find('div', id='stn_metadata') + metadata_div = soup.find("div", id="stn_metadata") # Extract the metadata - lines = metadata_div.p.text.split('\n') + lines = metadata_div.p.text.split("\n") line_count = 1 for line in lines: line = line.strip() - if line.startswith(''): + if line.startswith(""): line = line[3:] # Line should be the data provider if line_count == 1: @@ -1077,13 +1245,13 @@ def get_buoy_metadata(station_number: str): elif line_count == 2: data["type"] = line # Special case look for lat/long - elif re.match(r'\d+\.\d+\s+[NS]\s+\d+\.\d+\s+[EW]', line): - lat, lon = line.split(' ', 3)[0:3:2] + elif re.match(r"\d+\.\d+\s+[NS]\s+\d+\.\d+\s+[EW]", line): + lat, lon = line.split(" ", 3)[0:3:2] data["lat"] = lat.strip() data["lon"] = lon.strip() # Split key value pairs on colon - elif ':' in line: - key, value = line.split(':', 1) + elif ":" in line: + key, value = line.split(":", 1) data[key.strip()] = value.strip() # Catch all other lines as keys 
with empty values elif line: diff --git a/mhkit/wave/io/swan.py b/mhkit/wave/io/swan.py index c71a1a514..c344561d0 100644 --- a/mhkit/wave/io/swan.py +++ b/mhkit/wave/io/swan.py @@ -1,295 +1,355 @@ from scipy.io import loadmat from os.path import isfile import pandas as pd +import xarray as xr import numpy as np -import re - +import re +from mhkit.utils import convert_to_dataset, convert_nested_dict_and_pandas -def read_table(swan_file): - ''' + +def read_table(swan_file, to_pandas=True): + """ Reads in SWAN table format output - + Parameters ---------- swan_file: str filename to import - + to_pandas: bool (optional) + Flag to output pandas instead of xarray. Default = True. + Returns ------- - swan_data: DataFrame + swan_data: pandas DataFrame or xarray Dataset Dataframe of swan output metaDict: Dictionary Dictionary of metaData - ''' - assert isinstance(swan_file, str), 'swan_file must be of type str' - assert isfile(swan_file)==True, f'File not found: {swan_file}' - - f = open(swan_file,'r') + """ + if not isinstance(swan_file, str): + raise TypeError(f"swan_file must be of type str. Got: {type(swan_file)}") + if not isfile(swan_file): + raise ValueError(f"File not found: {swan_file}") + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. 
Got: {type(to_pandas)}") + + f = open(swan_file, "r") header_line_number = 4 - for i in range(header_line_number+2): + for i in range(header_line_number + 2): line = f.readline() - if line.startswith('% Run'): + if line.startswith("% Run"): metaDict = _parse_line_metadata(line) - if metaDict['Table'].endswith('SWAN'): - metaDict['Table'] = metaDict['Table'].split(' SWAN')[:-1] - if i == header_line_number: - header = re.split("\s+",line.rstrip().strip('%').lstrip()) - metaDict['header'] = header - if i == header_line_number+1: - units = re.split('\s+',line.strip(' %\n').replace('[','').replace(']','')) - metaDict['units'] = units - f.close() - - swan_data = pd.read_csv(swan_file, sep='\s+', comment='%', - names=metaDict['header']) - return swan_data, metaDict - - -def read_block(swan_file): - ''' - Reads in SWAN block output with headers and creates a dictionary - of DataFrames for each SWAN output variable in the output file. - + if metaDict["Table"].endswith("SWAN"): + metaDict["Table"] = metaDict["Table"].split(" SWAN")[:-1] + if i == header_line_number: + header = re.split("\s+", line.rstrip().strip("%").lstrip()) + metaDict["header"] = header + if i == header_line_number + 1: + units = re.split( + "\s+", line.strip(" %\n").replace("[", "").replace("]", "") + ) + metaDict["units"] = units + f.close() + + swan_data = pd.read_csv(swan_file, sep="\s+", comment="%", names=metaDict["header"]) + + if not to_pandas: + swan_data = convert_to_dataset(swan_data) + + return swan_data, metaDict + + +def read_block(swan_file, to_pandas=True): + """ + Reads in SWAN block output with headers and creates a dictionary + of DataFrames or Datasets for each SWAN output variable in the output file. + Parameters ---------- swan_file: str swan block file to import - + to_pandas: bool (optional) + Flag to output a dictionary of pandas objects instead of a dictionary + of xarray objects. Default = True. 
+ Returns ------- data: Dictionary - Dictionary of DataFrame of swan output variables + Dictionary of DataFrames or Datasets of swan output variables metaDict: Dictionary - Dictionary of metaData dependent on file type - ''' - assert isinstance(swan_file, str), 'swan_file must be of type str' - assert isfile(swan_file)==True, f'File not found: {swan_file}' - - extension = swan_file.split('.')[1].lower() - if extension == 'mat': + Dictionary of metaData dependent on file type + """ + if not isinstance(swan_file, str): + raise TypeError(f"swan_file must be of type str. Got: {type(swan_file)}") + if not isfile(swan_file): + raise ValueError(f"File not found: {swan_file}") + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. Got: {type(to_pandas)}") + + extension = swan_file.split(".")[1].lower() + if extension == "mat": dataDict = _read_block_mat(swan_file) - metaData = {'filetype': 'mat', - 'variables': [var for var in dataDict.keys()]} + metaData = {"filetype": "mat", "variables": [var for var in dataDict.keys()]} else: dataDict, metaData = _read_block_txt(swan_file) + + if not to_pandas: + dataDict = convert_nested_dict_and_pandas(dataDict) + return dataDict, metaData - + def _read_block_txt(swan_file): - ''' - Reads in SWAN block output with headers and creates a dictionary + """ + Reads in SWAN block output with headers and creates a dictionary of DataFrames for each SWAN output variable in the output file. 
- + Parameters ---------- swan_file: str swan block file to import (must be written with headers) - + Returns ------- dataDict: Dictionary Dictionary of DataFrame of swan output variables metaDict: Dictionary - Dictionary of metaData dependent on file type - ''' - assert isinstance(swan_file, str), 'swan_file must be of type str' - assert isfile(swan_file)==True, f'File not found: {swan_file}' - - f = open(swan_file) - runLines=[] + Dictionary of metaData dependent on file type + """ + if not isinstance(swan_file, str): + raise TypeError(f"swan_file must be of type str. Got: {type(swan_file)}") + if not isfile(swan_file): + raise ValueError(f"File not found: {swan_file}") + + f = open(swan_file) + runLines = [] metaDict = {} column_position = None - dataDict={} + dataDict = {} for position, line in enumerate(f): - - if line.startswith('% Run'): + if line.startswith("% Run"): varPosition = position runLines.extend([position]) - column_position = position + 5 - varDict = _parse_line_metadata(line) - varDict['unitMultiplier'] = float(varDict['Unit'].split(' ')[0]) - - metaDict[varPosition] = varDict - variable = varDict['vars'] + column_position = position + 5 + varDict = _parse_line_metadata(line) + varDict["unitMultiplier"] = float(varDict["Unit"].split(" ")[0]) + + metaDict[varPosition] = varDict + variable = varDict["vars"] dataDict[variable] = {} - - if position==column_position and column_position!=None: - columns = line.strip('% \n').split() - metaDict[varPosition]['cols'] = columns - N_columns = len(columns) - columns_position = None - - - if not line.startswith('%'): - raw_data = ' '.join(re.split(' |\.', line.strip(' \n'))).split() + + if position == column_position and column_position != None: + columns = line.strip("% \n").split() + metaDict[varPosition]["cols"] = columns + N_columns = len(columns) + columns_position = None + + if not line.startswith("%"): + raw_data = " ".join(re.split(" |\.", line.strip(" \n"))).split() index_number = int(raw_data[0]) 
columns_data = raw_data[1:] - data=[] - possibleNaNs = ['****'] + data = [] + possibleNaNs = ["****"] NNaNsTotal = sum([line.count(nanVal) for nanVal in possibleNaNs]) - - if NNaNsTotal>0: + + if NNaNsTotal > 0: for vals in columns_data: - NNaNs = 0 + NNaNs = 0 for nanVal in possibleNaNs: NNaNs += vals.count(nanVal) if NNaNs > 0: for i in range(NNaNs): - data.extend([np.nan]) + data.extend([np.nan]) else: data.extend([float(vals)]) - else: - data.extend([float(val) for val in columns_data]) - + else: + data.extend([float(val) for val in columns_data]) + dataDict[variable][index_number] = data - - metaData = pd.DataFrame(metaDict).T + + metaData = pd.DataFrame(metaDict).T f.close() - - for var in metaData.vars.values: - df = pd.DataFrame(dataDict[var]).T - varCols = metaData[metaData.vars == var].cols.values.tolist()[0] + + for var in metaData.vars.values: + df = pd.DataFrame(dataDict[var]).T + varCols = metaData[metaData.vars == var].cols.values.tolist()[0] colsDict = dict(zip(df.columns.values.tolist(), varCols)) df.rename(columns=colsDict) unitMultiplier = metaData[metaData.vars == var].unitMultiplier.values[0] - dataDict[var] = df * unitMultiplier - - metaData.pop('cols') - metaData = metaData.set_index('vars').T.to_dict() - return dataDict, metaData - + dataDict[var] = df * unitMultiplier + + metaData.pop("cols") + metaData = metaData.set_index("vars").T.to_dict() + return dataDict, metaData + def _read_block_mat(swan_file): - ''' + """ Reads in SWAN matlab output and creates a dictionary of DataFrames for each swan output variable. - + Parameters ---------- swan_file: str filename to import - + Returns ------- dataDict: Dictionary Dictionary of DataFrame of swan output variables - ''' - assert isinstance(swan_file, str), 'swan_file must be of type str' - assert isfile(swan_file)==True, f'File not found: {swan_file}' - + """ + if not isinstance(swan_file, str): + raise TypeError(f"swan_file must be of type str. 
Got: {type(swan_file)}") + if not isfile(swan_file): + raise ValueError(f"File not found: {swan_file}") + dataDict = loadmat(swan_file, struct_as_record=False, squeeze_me=True) - removeKeys = ['__header__', '__version__', '__globals__'] + removeKeys = ["__header__", "__version__", "__globals__"] for key in removeKeys: dataDict.pop(key, None) for key in dataDict.keys(): dataDict[key] = pd.DataFrame(dataDict[key]) return dataDict - - + + def _parse_line_metadata(line): - ''' + """ Parses the variable metadata into a dictionary - + Parameters ---------- line: str line from block swan data to parse - + Returns ------- metaDict: Dictionary Dictionary of variable metadata - ''' - assert isinstance(line, str), 'line must be of type str' - - metaDict={} - meta=re.sub('\s+', " ", line.replace(',', ' ').strip('% \n').replace('**', 'vars:')) - mList = meta.split(':') - elms = [elm.split(' ') for elm in mList] + """ + if not isinstance(line, str): + raise TypeError(f"line must be of type str. Got: {type(line)}") + + metaDict = {} + meta = re.sub( + "\s+", " ", line.replace(",", " ").strip("% \n").replace("**", "vars:") + ) + mList = meta.split(":") + elms = [elm.split(" ") for elm in mList] for elm in elms: try: - elm.remove('') + elm.remove("") except: - pass - for i in range(len(elms)-1): + pass + for i in range(len(elms) - 1): elm = elms[i] key = elm[-1] - val = ' '.join(elms[i+1][:-1]) + val = " ".join(elms[i + 1][:-1]) metaDict[key] = val - metaDict[key] = ' '.join(elms[-1]) - - return metaDict + metaDict[key] = " ".join(elms[-1]) + return metaDict + + +def dictionary_of_block_to_table(dictionary_of_DataFrames, names=None, to_pandas=True): + """ + Converts a dictionary of structured 2D grid SWAN block format + x (columns),y (index) to SWAN table format x (column),y (column), + values (column) DataFrame or Dataset. 
-def dictionary_of_block_to_table(dictionary_of_DataFrames, names=None): - ''' - Converts a dictionary of structured 2D grid SWAN block format - x (columns),y (index) to SWAN table format x (column),y (column), - values (column) DataFrame. - Parameters ---------- - dictionary_of_DataFrames: Dictionary + dictionary_of_DataFrames: Dictionary Dictionary of DataFrames in with columns as X indicie and Y as index. names: List (Optional) Name of data column in returned table. Default=Dictionary.keys() + to_pandas: bool (optional) + Flag to output pandas instead of xarray. Default = True. + Returns ------- - swanTables: DataFrame - DataFrame with columns x,y,values where values = Dictionary.keys() - or names - ''' - assert isinstance(dictionary_of_DataFrames, dict), ( - 'dictionary_of_DataFrames must be of type Dict') - assert bool(dictionary_of_DataFrames), 'dictionary_of_DataFrames is empty' - for key in dictionary_of_DataFrames: - assert isinstance(dictionary_of_DataFrames[key],pd.DataFrame), ( - f'Dictionary key:{key} must be of type pd.DataFrame') + swanTables: pandas DataFrame or xarray Dataset + DataFrame/Dataset with columns x,y,values where values = Dictionary.keys() + or names + """ + if not isinstance(dictionary_of_DataFrames, dict): + raise TypeError( + f"dictionary_of_DataFrames must be of type dict. Got: {type(dictionary_of_DataFrames)}" + ) + if not bool(dictionary_of_DataFrames): + raise ValueError( + f"dictionary_of_DataFrames is empty. Got: {dictionary_of_DataFrames}" + ) + for key in dictionary_of_DataFrames: + if not isinstance(dictionary_of_DataFrames[key], pd.DataFrame): + raise TypeError( + f"Dictionary key:{key} must be of type pd.DataFrame. 
Got: {type(dictionary_of_DataFrames[key])}" + ) if not isinstance(names, type(None)): - assert isinstance(names, list), ( - 'If specified names must be of type list') - assert all([isinstance(elm, str) for elm in names]), ( - 'If specified all elements in names must be of type string') - assert len(names) == len(dictionary_of_DataFrames), ( - 'If specified names must the same length as dictionary_of_DataFrames') - + if not isinstance(names, list): + raise TypeError( + f"If specified, names must be of type list. Got: {type(names)}" + ) + if not all([isinstance(elm, str) for elm in names]): + raise ValueError( + f"If specified, all elements in names must be of type string. Got: {names}" + ) + if not len(names) == len(dictionary_of_DataFrames): + raise ValueError( + "If specified, names must the same length as dictionary_of_DataFrames" + ) + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. Got: {type(to_pandas)}") + if names == None: - variables = [var for var in dictionary_of_DataFrames.keys() ] + variables = [var for var in dictionary_of_DataFrames.keys()] else: variables = names - + var0 = variables[0] swanTables = block_to_table(dictionary_of_DataFrames[var0], name=var0) - for var in variables[1:]: + for var in variables[1:]: tmp_dat = block_to_table(dictionary_of_DataFrames[var], name=var) swanTables[var] = tmp_dat[var] - + + if not to_pandas: + swanTables = convert_to_dataset(swanTables) + return swanTables - -def block_to_table(data, name='values'): - ''' - Converts structured 2D grid SWAN block format x (columns), y (index) - to SWAN table format x (column),y (column), values (column) + +def block_to_table(data, name="values", to_pandas=True): + """ + Converts structured 2D grid SWAN block format x (columns), y (index) + to SWAN table format x (column),y (column), values (column) DataFrame. 
- + Parameters ---------- - data: DataFrame + data: pandas DataFrame or xarray Dataset DataFrame in with columns as X indicie and Y as index. name: string (Optional) Name of data column in returned table. Default='values' + to_pandas: bool (optional) + Flag to output pandas instead of xarray. Default = True. + Returns ------- - table: DataFrame - DataFrame with columns x,y,values - ''' - assert isinstance(data,pd.DataFrame), 'data must be of type pd.DataFrame' - assert isinstance(name, str), 'Name must be of type str' - + table: pandas DataFrame or xarray Dataset + DataFrame with columns x,y,values + """ + if isinstance(data, xr.Dataset): + data = data.to_pandas() + if not isinstance(data, pd.DataFrame): + raise TypeError(f"data must be of type pd.DataFrame. Got: {type(data)}") + if not isinstance(name, str): + raise TypeError(f"If specified, name must be of type str. Got: {type(name)}") + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. Got: {type(to_pandas)}") + table = data.unstack().reset_index(name=name) - table = table.rename(columns={'level_0':'x', 'level_1': 'y'}) - table.sort_values(['x', 'y'], ascending=[True, True], inplace=True) + table = table.rename(columns={"level_0": "x", "level_1": "y"}) + table.sort_values(["x", "y"], ascending=[True, True], inplace=True) - return table + if not to_pandas: + table = convert_to_dataset(table) + return table diff --git a/mhkit/wave/io/wecsim.py b/mhkit/wave/io/wecsim.py index 65ce071cf..78298a475 100644 --- a/mhkit/wave/io/wecsim.py +++ b/mhkit/wave/io/wecsim.py @@ -1,31 +1,41 @@ import pandas as pd import numpy as np import scipy.io as sio +from os.path import isfile +from mhkit.utils import convert_nested_dict_and_pandas -def read_output(file_name): +def read_output(file_name, to_pandas=True): """ - Loads the wecSim response class once 'output' has been saved to a `.mat` - structure. - - NOTE: Python is unable to import MATLAB objects. 
- MATLAB must be used to save the wecSim object as a structure. - + Loads the wecSim response class once 'output' has been saved to a `.mat` + structure. + + NOTE: Python is unable to import MATLAB objects. + MATLAB must be used to save the wecSim object as a structure. + Parameters ------------ file_name: string Name of wecSim output file saved as a `.mat` structure - - + to_pandas: bool (optional) + Flag to output a dictionary of pandas objects instead of a dictionary + of xarray objects. Default = True. + Returns --------- - ws_output: dict - Dictionary of pandas DataFrames, indexed by time (s) - + ws_output: dict + Dictionary of pandas DataFrames or xarray Datasets, indexed by time (s) + """ - + if not isinstance(file_name, str): + raise TypeError(f"file_name must be of type str. Got: {type(file_name)}") + if not isfile(file_name): + raise ValueError(f"File not found: {file_name}") + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. Got: {type(to_pandas)}") + ws_data = sio.loadmat(file_name) - output = ws_data['output'] + output = ws_data["output"] ###################################### ## import wecSim wave class @@ -33,25 +43,24 @@ def read_output(file_name): # time: [iterations x 1 double] # elevation: [iterations x 1 double] ###################################### - try: - wave = output['wave'] - wave_type = wave[0][0][0][0][0][0] - time = wave[0][0]['time'][0][0].squeeze() - elevation = wave[0][0]['elevation'][0][0].squeeze() - + try: + wave = output["wave"] + wave_type = wave[0][0][0][0][0][0] + time = wave[0][0]["time"][0][0].squeeze() + elevation = wave[0][0]["elevation"][0][0].squeeze() + ###################################### ## create wave_output DataFrame ###################################### - wave_output = pd.DataFrame(data = time,columns=['time']) - wave_output = wave_output.set_index('time') - wave_output['elevation'] = elevation + wave_output = pd.DataFrame(data=time, columns=["time"]) + wave_output = 
wave_output.set_index("time") + wave_output["elevation"] = elevation wave_output.name = wave_type - + except: - print("wave class not used") - wave_output = [] - - + print("wave class not used") + wave_output = [] + ###################################### ## import wecSim body class # name: '' @@ -66,11 +75,11 @@ def read_output(file_name): # forceRestoring: [iterations x 6 double] # forceMorisonAndViscous: [iterations x 6 double] # forceLinearDamping: [iterations x 6 double] - ###################################### + ###################################### try: - bodies = output['bodies'] - num_bodies = len(bodies[0][0]['name'][0]) - name = [] + bodies = output["bodies"] + num_bodies = len(bodies[0][0]["name"][0]) + name = [] time = [] position = [] velocity = [] @@ -83,57 +92,66 @@ def read_output(file_name): forceMorisonAndViscous = [] forceLinearDamping = [] for body in range(num_bodies): - name.append(bodies[0][0]['name'][0][body][0]) - time.append(bodies[0][0]['time'][0][body]) - position.append(bodies[0][0]['position'][0][body]) - velocity.append(bodies[0][0]['velocity'][0][body]) - acceleration.append(bodies[0][0]['acceleration'][0][body]) - forceTotal.append(bodies[0][0]['forceTotal'][0][body]) - forceExcitation.append(bodies[0][0]['forceExcitation'][0][body]) - forceRadiationDamping.append(bodies[0][0]['forceRadiationDamping'][0][body]) - forceAddedMass.append(bodies[0][0]['forceAddedMass'][0][body]) - forceRestoring.append(bodies[0][0]['forceRestoring'][0][body]) + name.append(bodies[0][0]["name"][0][body][0]) + time.append(bodies[0][0]["time"][0][body]) + position.append(bodies[0][0]["position"][0][body]) + velocity.append(bodies[0][0]["velocity"][0][body]) + acceleration.append(bodies[0][0]["acceleration"][0][body]) + forceTotal.append(bodies[0][0]["forceTotal"][0][body]) + forceExcitation.append(bodies[0][0]["forceExcitation"][0][body]) + forceRadiationDamping.append(bodies[0][0]["forceRadiationDamping"][0][body]) + 
forceAddedMass.append(bodies[0][0]["forceAddedMass"][0][body]) + forceRestoring.append(bodies[0][0]["forceRestoring"][0][body]) try: - # Format in WEC-Sim responseClass >= v4.2 - forceMorisonAndViscous.append(bodies[0][0]['forceMorisonAndViscous'][0][body]) + # Format in WEC-Sim responseClass >= v4.2 + forceMorisonAndViscous.append( + bodies[0][0]["forceMorisonAndViscous"][0][body] + ) except: # Format in WEC-Sim responseClass <= v4.1 - forceMorisonAndViscous.append(bodies[0][0]['forceMorrisonAndViscous'][0][body]) - forceLinearDamping.append(bodies[0][0]['forceLinearDamping'][0][body]) + forceMorisonAndViscous.append( + bodies[0][0]["forceMorrisonAndViscous"][0][body] + ) + forceLinearDamping.append(bodies[0][0]["forceLinearDamping"][0][body]) except: - num_bodies = 0 - + num_bodies = 0 + ###################################### ## create body_output DataFrame - ###################################### + ###################################### def _write_body_output(body): - for dof in range(6): - tmp_body[f'position_dof{dof+1}'] = position[body][:,dof] - tmp_body[f'velocity_dof{dof+1}'] = velocity[body][:,dof] - tmp_body[f'acceleration_dof{dof+1}'] = acceleration[body][:,dof] - tmp_body[f'forceTotal_dof{dof+1}'] = forceTotal[body][:,dof] - tmp_body[f'forceExcitation_dof{dof+1}'] = forceExcitation[body][:,dof] - tmp_body[f'forceRadiationDamping_dof{dof+1}'] = forceRadiationDamping[body][:,dof] - tmp_body[f'forceAddedMass_dof{dof+1}'] = forceAddedMass[body][:,dof] - tmp_body[f'forceRestoring_dof{dof+1}'] = forceRestoring[body][:,dof] - tmp_body[f'forceMorisonAndViscous_dof{dof+1}'] = forceMorisonAndViscous[body][:,dof] - tmp_body[f'forceLinearDamping_dof{dof+1}'] = forceLinearDamping[body][:,dof] + for dof in range(6): + tmp_body[f"position_dof{dof+1}"] = position[body][:, dof] + tmp_body[f"velocity_dof{dof+1}"] = velocity[body][:, dof] + tmp_body[f"acceleration_dof{dof+1}"] = acceleration[body][:, dof] + tmp_body[f"forceTotal_dof{dof+1}"] = forceTotal[body][:, dof] + 
tmp_body[f"forceExcitation_dof{dof+1}"] = forceExcitation[body][:, dof] + tmp_body[f"forceRadiationDamping_dof{dof+1}"] = forceRadiationDamping[body][ + :, dof + ] + tmp_body[f"forceAddedMass_dof{dof+1}"] = forceAddedMass[body][:, dof] + tmp_body[f"forceRestoring_dof{dof+1}"] = forceRestoring[body][:, dof] + tmp_body[f"forceMorisonAndViscous_dof{dof+1}"] = forceMorisonAndViscous[ + body + ][:, dof] + tmp_body[f"forceLinearDamping_dof{dof+1}"] = forceLinearDamping[body][ + :, dof + ] return tmp_body if num_bodies >= 1: body_output = {} for body in range(num_bodies): - tmp_body = pd.DataFrame(data = time[0],columns=['time']) - tmp_body = tmp_body.set_index('time') + tmp_body = pd.DataFrame(data=time[0], columns=["time"]) + tmp_body = tmp_body.set_index("time") tmp_body.name = name[body] if num_bodies == 1: body_output = _write_body_output(body) elif num_bodies > 1: - body_output[f'body{body+1}'] = _write_body_output(body) + body_output[f"body{body+1}"] = _write_body_output(body) else: - print("body class not used") - body_output = [] - + print("body class not used") + body_output = [] ###################################### ## import wecSim pto class @@ -149,9 +167,9 @@ def _write_body_output(body): # powerInternalMechanics: [iterations x 6 double] ###################################### try: - ptos = output['ptos'] - num_ptos = len(ptos[0][0]['name'][0]) - name = [] + ptos = output["ptos"] + num_ptos = len(ptos[0][0]["name"][0]) + name = [] time = [] position = [] velocity = [] @@ -160,110 +178,118 @@ def _write_body_output(body): forceActuation = [] forceConstraint = [] forceInternalMechanics = [] - powerInternalMechanics= [] + powerInternalMechanics = [] for pto in range(num_ptos): - name.append(ptos[0][0]['name'][0][pto][0]) - time.append(ptos[0][0]['time'][0][pto]) - position.append(ptos[0][0]['position'][0][pto]) - velocity.append(ptos[0][0]['velocity'][0][pto]) - acceleration.append(ptos[0][0]['acceleration'][0][pto]) - 
forceTotal.append(ptos[0][0]['forceTotal'][0][pto]) - forceActuation.append(ptos[0][0]['forceActuation'][0][pto]) - forceConstraint.append(ptos[0][0]['forceConstraint'][0][pto]) - forceInternalMechanics.append(ptos[0][0]['forceInternalMechanics'][0][pto]) - powerInternalMechanics.append(ptos[0][0]['powerInternalMechanics'][0][pto]) + name.append(ptos[0][0]["name"][0][pto][0]) + time.append(ptos[0][0]["time"][0][pto]) + position.append(ptos[0][0]["position"][0][pto]) + velocity.append(ptos[0][0]["velocity"][0][pto]) + acceleration.append(ptos[0][0]["acceleration"][0][pto]) + forceTotal.append(ptos[0][0]["forceTotal"][0][pto]) + forceActuation.append(ptos[0][0]["forceActuation"][0][pto]) + forceConstraint.append(ptos[0][0]["forceConstraint"][0][pto]) + forceInternalMechanics.append(ptos[0][0]["forceInternalMechanics"][0][pto]) + powerInternalMechanics.append(ptos[0][0]["powerInternalMechanics"][0][pto]) except: - num_ptos = 0 - + num_ptos = 0 + ###################################### ## create pto_output DataFrame - ###################################### + ###################################### def _write_pto_output(pto): - for dof in range(6): - tmp_pto[f'position_dof{dof+1}'] = position[pto][:,dof] - tmp_pto[f'velocity_dof{dof+1}'] = velocity[pto][:,dof] - tmp_pto[f'acceleration_dof{dof+1}'] = acceleration[pto][:,dof] - tmp_pto[f'forceTotal_dof{dof+1}'] = forceTotal[pto][:,dof] - tmp_pto[f'forceTotal_dof{dof+1}'] = forceTotal[pto][:,dof] - tmp_pto[f'forceActuation_dof{dof+1}'] = forceActuation[pto][:,dof] - tmp_pto[f'forceConstraint_dof{dof+1}'] = forceConstraint[pto][:,dof] - tmp_pto[f'forceInternalMechanics_dof{dof+1}'] = forceInternalMechanics[pto][:,dof] - tmp_pto[f'powerInternalMechanics_dof{dof+1}'] = powerInternalMechanics[pto][:,dof] + for dof in range(6): + tmp_pto[f"position_dof{dof+1}"] = position[pto][:, dof] + tmp_pto[f"velocity_dof{dof+1}"] = velocity[pto][:, dof] + tmp_pto[f"acceleration_dof{dof+1}"] = acceleration[pto][:, dof] + 
tmp_pto[f"forceTotal_dof{dof+1}"] = forceTotal[pto][:, dof] + tmp_pto[f"forceTotal_dof{dof+1}"] = forceTotal[pto][:, dof] + tmp_pto[f"forceActuation_dof{dof+1}"] = forceActuation[pto][:, dof] + tmp_pto[f"forceConstraint_dof{dof+1}"] = forceConstraint[pto][:, dof] + tmp_pto[f"forceInternalMechanics_dof{dof+1}"] = forceInternalMechanics[pto][ + :, dof + ] + tmp_pto[f"powerInternalMechanics_dof{dof+1}"] = powerInternalMechanics[pto][ + :, dof + ] return tmp_pto if num_ptos >= 1: - pto_output = {} + pto_output = {} for pto in range(num_ptos): - tmp_pto = pd.DataFrame(data = time[0],columns=['time']) - tmp_pto = tmp_pto.set_index('time') + tmp_pto = pd.DataFrame(data=time[0], columns=["time"]) + tmp_pto = tmp_pto.set_index("time") tmp_pto.name = name[pto] - if num_ptos == 1: + if num_ptos == 1: pto_output = _write_pto_output(pto) elif num_ptos > 1: - pto_output[f'pto{pto+1}'] = _write_pto_output(pto) + pto_output[f"pto{pto+1}"] = _write_pto_output(pto) else: - print("pto class not used") + print("pto class not used") pto_output = [] - ###################################### ## import wecSim constraint class - # + # # name: '' # time: [iterations x 1 double] # position: [iterations x 6 double] # velocity: [iterations x 6 double] # acceleration: [iterations x 6 double] # forceConstraint: [iterations x 6 double] - ###################################### + ###################################### try: - constraints = output['constraints'] - num_constraints = len(constraints[0][0]['name'][0]) - name = [] + constraints = output["constraints"] + num_constraints = len(constraints[0][0]["name"][0]) + name = [] time = [] position = [] velocity = [] acceleration = [] forceConstraint = [] for constraint in range(num_constraints): - name.append(constraints[0][0]['name'][0][constraint][0]) - time.append(constraints[0][0]['time'][0][constraint]) - position.append(constraints[0][0]['position'][0][constraint]) - velocity.append(constraints[0][0]['velocity'][0][constraint]) - 
acceleration.append(constraints[0][0]['acceleration'][0][constraint]) - forceConstraint.append(constraints[0][0]['forceConstraint'][0][constraint]) + name.append(constraints[0][0]["name"][0][constraint][0]) + time.append(constraints[0][0]["time"][0][constraint]) + position.append(constraints[0][0]["position"][0][constraint]) + velocity.append(constraints[0][0]["velocity"][0][constraint]) + acceleration.append(constraints[0][0]["acceleration"][0][constraint]) + forceConstraint.append(constraints[0][0]["forceConstraint"][0][constraint]) except: - num_constraints = 0 - + num_constraints = 0 + ###################################### ## create constraint_output DataFrame - ###################################### + ###################################### def _write_constraint_output(constraint): - for dof in range(6): - tmp_constraint[f'position_dof{dof+1}'] = position[constraint][:,dof] - tmp_constraint[f'velocity_dof{dof+1}'] = velocity[constraint][:,dof] - tmp_constraint[f'acceleration_dof{dof+1}'] = acceleration[constraint][:,dof] - tmp_constraint[f'forceConstraint_dof{dof+1}'] = forceConstraint[constraint][:,dof] + for dof in range(6): + tmp_constraint[f"position_dof{dof+1}"] = position[constraint][:, dof] + tmp_constraint[f"velocity_dof{dof+1}"] = velocity[constraint][:, dof] + tmp_constraint[f"acceleration_dof{dof+1}"] = acceleration[constraint][ + :, dof + ] + tmp_constraint[f"forceConstraint_dof{dof+1}"] = forceConstraint[constraint][ + :, dof + ] return tmp_constraint if num_constraints >= 1: constraint_output = {} for constraint in range(num_constraints): - tmp_constraint = pd.DataFrame(data = time[0],columns=['time']) - tmp_constraint = tmp_constraint.set_index('time') + tmp_constraint = pd.DataFrame(data=time[0], columns=["time"]) + tmp_constraint = tmp_constraint.set_index("time") tmp_constraint.name = name[constraint] if num_constraints == 1: constraint_output = _write_constraint_output(constraint) elif num_constraints > 1: - 
constraint_output[f'constraint{constraint+1}'] = _write_constraint_output(constraint) + constraint_output[f"constraint{constraint+1}"] = ( + _write_constraint_output(constraint) + ) else: - print("constraint class not used") + print("constraint class not used") constraint_output = [] - ###################################### ## import wecSim mooring class - # + # # name: '' # time: [iterations x 1 double] # position: [iterations x 6 double] @@ -271,47 +297,46 @@ def _write_constraint_output(constraint): # forceMooring: [iterations x 6 double] ###################################### try: - moorings = output['mooring'] - num_moorings = len(moorings[0][0]['name'][0]) - name = [] + moorings = output["mooring"] + num_moorings = len(moorings[0][0]["name"][0]) + name = [] time = [] position = [] velocity = [] forceMooring = [] for mooring in range(num_moorings): - name.append(moorings[0][0]['name'][0][mooring][0]) - time.append(moorings[0][0]['time'][0][mooring]) - position.append(moorings[0][0]['position'][0][mooring]) - velocity.append(moorings[0][0]['velocity'][0][mooring]) - forceMooring.append(moorings[0][0]['forceMooring'][0][mooring]) + name.append(moorings[0][0]["name"][0][mooring][0]) + time.append(moorings[0][0]["time"][0][mooring]) + position.append(moorings[0][0]["position"][0][mooring]) + velocity.append(moorings[0][0]["velocity"][0][mooring]) + forceMooring.append(moorings[0][0]["forceMooring"][0][mooring]) except: - num_moorings = 0 + num_moorings = 0 ###################################### ## create mooring_output DataFrame - ###################################### + ###################################### def _write_mooring_output(mooring): - for dof in range(6): - tmp_mooring[f'position_dof{dof+1}'] = position[mooring][:,dof] - tmp_mooring[f'velocity_dof{dof+1}'] = velocity[mooring][:,dof] - tmp_mooring[f'forceMooring_dof{dof+1}'] = forceMooring[mooring][:,dof] + for dof in range(6): + tmp_mooring[f"position_dof{dof+1}"] = position[mooring][:, dof] + 
tmp_mooring[f"velocity_dof{dof+1}"] = velocity[mooring][:, dof] + tmp_mooring[f"forceMooring_dof{dof+1}"] = forceMooring[mooring][:, dof] return tmp_mooring - if num_moorings >= 1: + if num_moorings >= 1: mooring_output = {} for mooring in range(num_moorings): - tmp_mooring = pd.DataFrame(data = time[0],columns=['time']) - tmp_mooring = tmp_mooring.set_index('time') + tmp_mooring = pd.DataFrame(data=time[0], columns=["time"]) + tmp_mooring = tmp_mooring.set_index("time") tmp_mooring.name = name[mooring] - if num_moorings == 1: + if num_moorings == 1: mooring_output = _write_mooring_output(mooring) - elif num_moorings > 1: - mooring_output[f'mooring{mooring+1}'] = _write_mooring_output(mooring) + elif num_moorings > 1: + mooring_output[f"mooring{mooring+1}"] = _write_mooring_output(mooring) else: - print("mooring class not used") + print("mooring class not used") mooring_output = [] - - + ###################################### ## import wecSim moorDyn class # @@ -321,46 +346,45 @@ def _write_mooring_output(mooring): # Line3: [1×1 struct] # Line4: [1×1 struct] # Line5: [1×1 struct] - # Line6: [1×1 struct] + # Line6: [1×1 struct] ###################################### try: - moorDyn = output['moorDyn'] - num_lines = len(moorDyn[0][0][0].dtype) - 1 # number of moorDyn lines - - Lines = moorDyn[0][0]['Lines'][0][0][0] + moorDyn = output["moorDyn"] + num_lines = len(moorDyn[0][0][0].dtype) - 1 # number of moorDyn lines + + Lines = moorDyn[0][0]["Lines"][0][0][0] signals = Lines.dtype.names num_signals = len(Lines.dtype.names) - data = Lines[0] + data = Lines[0] time = data[0] - Lines = pd.DataFrame(data = time,columns=['time']) - Lines = Lines.set_index('time') - for signal in range(1,num_signals): - Lines[signals[signal]] = data[signal] - moorDyn_output= {'Lines': Lines} - - Line_num_output = {} - for line_num in range(1,num_lines+1): - tmp_moordyn = moorDyn[0][0][f'Line{line_num}'][0][0][0] - signals = tmp_moordyn.dtype.names - num_signals = 
len(tmp_moordyn.dtype.names) - data = tmp_moordyn[0] - time = data[0] - tmp_moordyn = pd.DataFrame(data = time,columns=['time']) - tmp_moordyn = tmp_moordyn.set_index('time') - for signal in range(1,num_signals): - tmp_moordyn[signals[signal]] = data[signal] - Line_num_output[f'Line{line_num}'] = tmp_moordyn - + Lines = pd.DataFrame(data=time, columns=["time"]) + Lines = Lines.set_index("time") + for signal in range(1, num_signals): + Lines[signals[signal]] = data[signal] + moorDyn_output = {"Lines": Lines} + + Line_num_output = {} + for line_num in range(1, num_lines + 1): + tmp_moordyn = moorDyn[0][0][f"Line{line_num}"][0][0][0] + signals = tmp_moordyn.dtype.names + num_signals = len(tmp_moordyn.dtype.names) + data = tmp_moordyn[0] + time = data[0] + tmp_moordyn = pd.DataFrame(data=time, columns=["time"]) + tmp_moordyn = tmp_moordyn.set_index("time") + for signal in range(1, num_signals): + tmp_moordyn[signals[signal]] = data[signal] + Line_num_output[f"Line{line_num}"] = tmp_moordyn + moorDyn_output.update(Line_num_output) - + except: - print("moorDyn class not used") + print("moorDyn class not used") moorDyn_output = [] - ###################################### ## import wecSim ptosim class - # + # # name: '' # pistonCF: [1×1 struct] # pistonNCF: [1×1 struct] @@ -372,19 +396,18 @@ def _write_mooring_output(mooring): # pmLinearGenerator: [1×1 struct] # pmRotaryGenerator: [1×1 struct] # motionMechanism: [1×1 struct] - ###################################### + ###################################### try: - ptosim = output['ptosim'] - num_ptosim = len(ptosim[0][0]['name'][0]) # number of ptosim - print("ptosim class output not supported at this time") + ptosim = output["ptosim"] + num_ptosim = len(ptosim[0][0]["name"][0]) # number of ptosim + print("ptosim class output not supported at this time") except: - print("ptosim class not used") + print("ptosim class not used") ptosim_output = [] - - + ###################################### ## import wecSim cable class - # + 
# # name: '' # time: [iterations x 1 double] # position: [iterations x 6 double] @@ -392,9 +415,9 @@ def _write_mooring_output(mooring): # forcecable: [iterations x 6 double] ###################################### try: - cables = output['cables'] - num_cables = len(cables[0][0]['name'][0]) - name = [] + cables = output["cables"] + num_cables = len(cables[0][0]["name"][0]) + name = [] time = [] position = [] velocity = [] @@ -403,56 +426,59 @@ def _write_mooring_output(mooring): forceactuation = [] forceconstraint = [] for cable in range(num_cables): - name.append(cables[0][0]['name'][0][cable][0]) - time.append(cables[0][0]['time'][0][cable]) - position.append(cables[0][0]['position'][0][cable]) - velocity.append(cables[0][0]['velocity'][0][cable]) - acceleration.append(cables[0][0]['acceleration'][0][cable]) - forcetotal.append(cables[0][0]['forceTotal'][0][cable]) - forceactuation.append(cables[0][0]['forceActuation'][0][cable]) - forceconstraint.append(cables[0][0]['forceConstraint'][0][cable]) + name.append(cables[0][0]["name"][0][cable][0]) + time.append(cables[0][0]["time"][0][cable]) + position.append(cables[0][0]["position"][0][cable]) + velocity.append(cables[0][0]["velocity"][0][cable]) + acceleration.append(cables[0][0]["acceleration"][0][cable]) + forcetotal.append(cables[0][0]["forceTotal"][0][cable]) + forceactuation.append(cables[0][0]["forceActuation"][0][cable]) + forceconstraint.append(cables[0][0]["forceConstraint"][0][cable]) except: - num_cables = 0 + num_cables = 0 ###################################### ## create cable_output DataFrame - ###################################### + ###################################### def _write_cable_output(cable): - for dof in range(6): - tmp_cable[f'position_dof{dof+1}'] = position[cable][:,dof] - tmp_cable[f'velocity_dof{dof+1}'] = velocity[cable][:,dof] - tmp_cable[f'acceleration_dof{dof+1}'] = acceleration[cable][:,dof] - tmp_cable[f'forcetotal_dof{dof+1}'] = forcetotal[cable][:,dof] - 
tmp_cable[f'forceactuation_dof{dof+1}'] = forceactuation[cable][:,dof] - tmp_cable[f'forceconstraint_dof{dof+1}'] = forceconstraint[cable][:,dof] + for dof in range(6): + tmp_cable[f"position_dof{dof+1}"] = position[cable][:, dof] + tmp_cable[f"velocity_dof{dof+1}"] = velocity[cable][:, dof] + tmp_cable[f"acceleration_dof{dof+1}"] = acceleration[cable][:, dof] + tmp_cable[f"forcetotal_dof{dof+1}"] = forcetotal[cable][:, dof] + tmp_cable[f"forceactuation_dof{dof+1}"] = forceactuation[cable][:, dof] + tmp_cable[f"forceconstraint_dof{dof+1}"] = forceconstraint[cable][:, dof] return tmp_cable - if num_cables >= 1: + if num_cables >= 1: cable_output = {} for cable in range(num_cables): - tmp_cable = pd.DataFrame(data = time[0],columns=['time']) - tmp_cable = tmp_cable.set_index('time') + tmp_cable = pd.DataFrame(data=time[0], columns=["time"]) + tmp_cable = tmp_cable.set_index("time") tmp_cable.name = name[cable] - if num_cables == 1: + if num_cables == 1: cable_output = _write_cable_output(cable) - elif num_cables > 1: - cable_output[f'cable{cable+1}'] = _write_cable_output(cable) + elif num_cables > 1: + cable_output[f"cable{cable+1}"] = _write_cable_output(cable) else: - print("cable class not used") + print("cable class not used") cable_output = [] + ############################################ + ## create wecSim output - Dict of DataFrames + ############################################ + ws_output = { + "wave": wave_output, + "bodies": body_output, + "ptos": pto_output, + "constraints": constraint_output, + "mooring": mooring_output, + "moorDyn": moorDyn_output, + "ptosim": ptosim_output, + "cables": cable_output, + } + if not to_pandas: + ws_output = convert_nested_dict_and_pandas(ws_output) - ###################################### - ## create wecSim output DataFrame of Dict - ###################################### - ws_output = {'wave' : wave_output, - 'bodies' : body_output, - 'ptos' : pto_output, - 'constraints' : constraint_output, - 'mooring' : 
mooring_output, - 'moorDyn': moorDyn_output, - 'ptosim' : ptosim_output, - 'cables': cable_output - } - return ws_output + return ws_output diff --git a/mhkit/wave/performance.py b/mhkit/wave/performance.py index 2b96809a9..02cf1670a 100644 --- a/mhkit/wave/performance.py +++ b/mhkit/wave/performance.py @@ -1,37 +1,47 @@ import numpy as np import pandas as pd -import xarray +import xarray as xr import types from scipy.stats import binned_statistic_2d as _binned_statistic_2d from mhkit import wave import matplotlib.pylab as plt from os.path import join +from mhkit.utils import convert_to_dataarray, convert_to_dataset -def capture_length(P, J): + +def capture_length(P, J, to_pandas=True): """ Calculates the capture length (often called capture width). Parameters ------------ - P: numpy array or pandas Series + P: numpy array, pandas Series, pandas DataFrame, xarray DataArray, or xarray Dataset Power [W] - J: numpy array or pandas Series + J: numpy array, pandas Series, pandas DataFrame, xarray DataArray, or xarray Dataset Omnidirectional wave energy flux [W/m] + to_pandas: bool (optional) + Flag to output pandas instead of xarray. Default = True. Returns --------- - L: numpy array or pandas Series + L: pandas Series or xarray DataArray Capture length [m] """ - assert isinstance(P, (np.ndarray, pd.Series)), 'P must be of type np.ndarray or pd.Series' - assert isinstance(J, (np.ndarray, pd.Series)), 'J must be of type np.ndarray or pd.Series' + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. Got: {type(to_pandas)}") + + P = convert_to_dataarray(P) + J = convert_to_dataarray(J) - L = P/J + L = P / J + + if to_pandas: + L = L.to_pandas() return L -def statistics(X): +def statistics(X, to_pandas=True): """ Calculates statistics, including count, mean, standard deviation (std), min, percentiles (25%, 50%, 75%), and max. 
@@ -41,18 +51,35 @@ def statistics(X): Parameters ------------ - X: numpy array or pandas Series + X: numpy array, pandas Series, pandas DataFrame, xarray DataArray, or xarray Dataset Data + to_pandas: bool (optional) + Flag to output pandas instead of xarray. Default = True. Returns --------- - stats: pandas Series + stats: pandas Series or xarray DataArray Statistics """ - assert isinstance(X, (np.ndarray, pd.Series)), 'X must be of type np.ndarray or pd.Series' + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. Got: {type(to_pandas)}") + + X = convert_to_dataarray(X) - stats = pd.Series(X).describe() - stats['std'] = _std_ddof1(X) + count = X.count().item() + mean = X.mean().item() + std = _std_ddof1(X) + q = X.quantile([0.0, 0.25, 0.5, 0.75, 1.0]).values + variables = ["count", "mean", "std", "min", "25%", "50%", "75%", "max"] + + stats = xr.DataArray( + data=[count, mean, std, q[0], q[1], q[2], q[3], q[4]], + dims="index", + coords={"index": variables}, + ) + + if to_pandas: + stats = stats.to_pandas() return stats @@ -71,33 +98,39 @@ def _performance_matrix(X, Y, Z, statistic, x_centers, y_centers): # General performance matrix function # Convert bin centers to edges - xi = [np.mean([x_centers[i], x_centers[i+1]]) for i in range(len(x_centers)-1)] - xi.insert(0,-np.inf) + xi = [np.mean([x_centers[i], x_centers[i + 1]]) for i in range(len(x_centers) - 1)] + xi.insert(0, -np.inf) xi.append(np.inf) - yi = [np.mean([y_centers[i], y_centers[i+1]]) for i in range(len(y_centers)-1)] - yi.insert(0,-np.inf) + yi = [np.mean([y_centers[i], y_centers[i + 1]]) for i in range(len(y_centers) - 1)] + yi.insert(0, -np.inf) yi.append(np.inf) # Override standard deviation with degree of freedom equal to 1 - if statistic == 'std': + if statistic == "std": statistic = _std_ddof1 # Provide function to compute frequency def _frequency(a): - return len(a)/len(Z) - if statistic == 'frequency': + return len(a) / len(Z) + + if statistic == 
"frequency": statistic = _frequency - zi, x_edge, y_edge, binnumber = _binned_statistic_2d(X, Y, Z, statistic, - bins=[xi,yi], expand_binnumbers=False) + zi, x_edge, y_edge, binnumber = _binned_statistic_2d( + X, Y, Z, statistic, bins=[xi, yi], expand_binnumbers=False + ) - M = pd.DataFrame(zi, index=x_centers, columns=y_centers) + M = xr.DataArray( + data=zi, + dims=["x_centers", "y_centers"], + coords={"x_centers": x_centers, "y_centers": y_centers}, + ) return M -def capture_length_matrix(Hm0, Te, L, statistic, Hm0_bins, Te_bins): +def capture_length_matrix(Hm0, Te, L, statistic, Hm0_bins, Te_bins, to_pandas=True): """ Generates a capture length matrix for a given statistic @@ -106,11 +139,11 @@ def capture_length_matrix(Hm0, Te, L, statistic, Hm0_bins, Te_bins): Parameters ------------ - Hm0: numpy array or pandas Series + Hm0: numpy array, pandas Series, pandas DataFrame, xarray DataArray, or xarray Dataset Significant wave height from spectra [m] - Te: numpy array or pandas Series + Te: numpy array, pandas Series, pandas DataFrame, xarray DataArray, or xarray Dataset Energy period from spectra [s] - L : numpy array or pandas Series + L : numpy array, pandas Series, pandas DataFrame, xarray DataArray, or xarray Dataset Capture length [m] statistic: string Statistic for each bin, options include: 'mean', 'std', 'median', @@ -120,37 +153,50 @@ def capture_length_matrix(Hm0, Te, L, statistic, Hm0_bins, Te_bins): Bin centers for Hm0 [m] Te_bins: numpy array Bin centers for Te [s] + to_pandas: bool (optional) + Flag to output pandas instead of xarray. Default = True. 
Returns --------- - LM: pandas DataFrames + LM: pandas DataFrame or xarray DataArray Capture length matrix with index equal to Hm0_bins and columns equal to Te_bins """ - assert isinstance(Hm0, (np.ndarray, pd.Series)), 'Hm0 must be of type np.ndarray or pd.Series' - assert isinstance(Te, (np.ndarray, pd.Series)), 'Te must be of type np.ndarray or pd.Series' - assert isinstance(L, (np.ndarray, pd.Series)), 'L must be of type np.ndarray or pd.Series' - assert isinstance(statistic, (str, types.FunctionType)), 'statistic must be of type str or callable' - assert isinstance(Hm0_bins, np.ndarray), 'Hm0_bins must be of type np.ndarray' - assert isinstance(Te_bins, np.ndarray), 'Te_bins must be of type np.ndarray' + Hm0 = convert_to_dataarray(Hm0) + Te = convert_to_dataarray(Te) + L = convert_to_dataarray(L) + + if not isinstance(statistic, (str, types.FunctionType)): + raise TypeError( + f"statistic must be of type str or callable. Got: {type(statistic)}" + ) + if not isinstance(Hm0_bins, np.ndarray): + raise TypeError(f"Hm0_bins must be of type np.ndarray. Got: {type(Hm0_bins)}") + if not isinstance(Te_bins, np.ndarray): + raise TypeError(f"Te_bins must be of type np.ndarray. Got: {type(Te_bins)}") + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. 
Got: {type(to_pandas)}") LM = _performance_matrix(Hm0, Te, L, statistic, Hm0_bins, Te_bins) + if to_pandas: + LM = LM.to_pandas() + return LM -def wave_energy_flux_matrix(Hm0, Te, J, statistic, Hm0_bins, Te_bins): +def wave_energy_flux_matrix(Hm0, Te, J, statistic, Hm0_bins, Te_bins, to_pandas=True): """ Generates a wave energy flux matrix for a given statistic Parameters ------------ - Hm0: numpy array or pandas Series + Hm0: numpy array, pandas Series, pandas DataFrame, xarray DataArray, or xarray Dataset Significant wave height from spectra [m] - Te: numpy array or pandas Series + Te: numpy array, pandas Series, pandas DataFrame, xarray DataArray, or xarray Dataset Energy period from spectra [s] - J : numpy array or pandas Series + J : numpy array, pandas Series, pandas DataFrame, xarray DataArray, or xarray Dataset Wave energy flux from spectra [W/m] statistic: string Statistic for each bin, options include: 'mean', 'std', 'median', @@ -160,25 +206,38 @@ def wave_energy_flux_matrix(Hm0, Te, J, statistic, Hm0_bins, Te_bins): Bin centers for Hm0 [m] Te_bins: numpy array Bin centers for Te [s] + to_pandas: bool (optional) + Flag to output pandas instead of xarray. Default = True. 
Returns --------- - JM: pandas DataFrames + JM: pandas DataFrame or xarray DataArray Wave energy flux matrix with index equal to Hm0_bins and columns equal to Te_bins """ - assert isinstance(Hm0, (np.ndarray, pd.Series)), 'Hm0 must be of type np.ndarray or pd.Series' - assert isinstance(Te, (np.ndarray, pd.Series)), 'Te must be of type np.ndarray or pd.Series' - assert isinstance(J, (np.ndarray, pd.Series)), 'J must be of type np.ndarray or pd.Series' - assert isinstance(statistic, (str, callable)), 'statistic must be of type str or callable' - assert isinstance(Hm0_bins, np.ndarray), 'Hm0_bins must be of type np.ndarray' - assert isinstance(Te_bins, np.ndarray), 'Te_bins must be of type np.ndarray' + Hm0 = convert_to_dataarray(Hm0) + Te = convert_to_dataarray(Te) + J = convert_to_dataarray(J) + if not isinstance(statistic, (str, callable)): + raise TypeError( + f"statistic must be of type str or callable. Got: {type(statistic)}" + ) + if not isinstance(Hm0_bins, np.ndarray): + raise TypeError(f"Hm0_bins must be of type np.ndarray. Got: {type(Hm0_bins)}") + if not isinstance(Te_bins, np.ndarray): + raise TypeError(f"Te_bins must be of type np.ndarray. Got: {type(Te_bins)}") + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. 
Got: {type(to_pandas)}") JM = _performance_matrix(Hm0, Te, J, statistic, Hm0_bins, Te_bins) + if to_pandas: + JM = JM.to_pandas() + return JM + def power_matrix(LM, JM): """ Generates a power matrix from a capture length matrix and wave energy @@ -186,33 +245,40 @@ def power_matrix(LM, JM): Parameters ------------ - LM: pandas DataFrame + LM: pandas DataFrame or xarray Dataset Capture length matrix - JM: pandas DataFrame + JM: pandas DataFrame or xarray Dataset Wave energy flux matrix Returns --------- - PM: pandas DataFrames + PM: pandas DataFrame or xarray Dataset Power matrix """ - assert isinstance(LM, pd.DataFrame), 'LM must be of type pd.DataFrame' - assert isinstance(JM, pd.DataFrame), 'JM must be of type pd.DataFrame' + if not isinstance(LM, (pd.DataFrame, xr.Dataset)): + raise TypeError( + f"LM must be of type pd.DataFrame or xr.Dataset. Got: {type(LM)}" + ) + if not isinstance(JM, (pd.DataFrame, xr.Dataset)): + raise TypeError( + f"JM must be of type pd.DataFrame or xr.Dataset. 
Got: {type(JM)}" + ) - PM = LM*JM + PM = LM * JM return PM + def mean_annual_energy_production_timeseries(L, J): """ Calculates mean annual energy production (MAEP) from time-series Parameters ------------ - L: numpy array or pandas Series + L: numpy array, pandas Series, pandas DataFrame, xarray DataArray, or xarray Dataset Capture length - J: numpy array or pandas Series + J: numpy array, pandas Series, pandas DataFrame, xarray DataArray, or xarray Dataset Wave energy flux Returns @@ -221,16 +287,17 @@ def mean_annual_energy_production_timeseries(L, J): Mean annual energy production """ - assert isinstance(L, (np.ndarray, pd.Series)), 'L must be of type np.ndarray or pd.Series' - assert isinstance(J, (np.ndarray, pd.Series)), 'J must be of type np.ndarray or pd.Series' + L = convert_to_dataarray(L) + J = convert_to_dataarray(J) - T = 8766 # Average length of a year (h) + T = 8766 # Average length of a year (h) n = len(L) - maep = T/n * np.sum(L * J) + maep = T / n * (L * J).sum().item() return maep + def mean_annual_energy_production_matrix(LM, JM, frequency): """ Calculates mean annual energy production (MAEP) from matrix data @@ -238,11 +305,11 @@ def mean_annual_energy_production_matrix(LM, JM, frequency): Parameters ------------ - LM: pandas DataFrame + LM: pandas DataFrame or xarray Dataset Capture length - JM: pandas DataFrame + JM: pandas DataFrame or xarray Dataset Wave energy flux - frequency: pandas DataFrame + frequency: pandas DataFrame or xarray Dataset Data frequency for each bin Returns @@ -251,29 +318,45 @@ def mean_annual_energy_production_matrix(LM, JM, frequency): Mean annual energy production """ - assert isinstance(LM, pd.DataFrame), 'LM must be of type pd.DataFrame' - assert isinstance(JM, pd.DataFrame), 'JM must be of type pd.DataFrame' - assert isinstance(frequency, pd.DataFrame), 'frequency must be of type pd.DataFrame' - assert LM.shape == JM.shape == frequency.shape, 'LM, JM, and frequency must be of the same size' - #assert 
frequency.sum().sum() == 1 + LM = convert_to_dataarray(LM) + JM = convert_to_dataarray(JM) + frequency = convert_to_dataarray(frequency) + + if not LM.shape == JM.shape == frequency.shape: + raise ValueError("LM, JM, and frequency must be of the same size") + if not np.abs(frequency.sum() - 1) < 1e-6: + raise ValueError("Frequency components must sum to one.") - T = 8766 # Average length of a year (h) + T = 8766 # Average length of a year (h) maep = T * np.nansum(LM * JM * frequency) return maep -def power_performance_workflow(S, h, P, statistic, frequency_bins=None, deep=False, rho=1205, g=9.80665, ratio=2, show_values=False, savepath=""): + +def power_performance_workflow( + S, + h, + P, + statistic, + frequency_bins=None, + deep=False, + rho=1205, + g=9.80665, + ratio=2, + show_values=False, + savepath="", +): """ High-level function to compute power performance quantities of interest following IEC TS 62600-100 for given wave spectra. Parameters ------------ - S: pandas DataFrame or Series + S: pandas Series, pandas DataFrame, xarray DataArray, or xarray Dataset Spectral density [m^2/Hz] indexed by frequency [Hz] h: float Water depth [m] - P: numpy array or pandas Series + P: numpy ndarray, pandas DataFrame, pandas Series, xarray DataArray, or xarray Dataset Power [W] statistic: string or list of strings Statistics for plotting capture length matrices, @@ -309,59 +392,95 @@ def power_performance_workflow(S, h, P, statistic, frequency_bins=None, deep=Fal maep_matrix: float Mean annual energy production """ - assert isinstance(S, (pd.DataFrame,pd.Series)), 'S must be of type pd.DataFrame or pd.Series' - assert isinstance(h, (int,float)), 'h must be of type int or float' - assert isinstance(P, (np.ndarray, pd.Series)), 'P must be of type np.ndarray or pd.Series' - assert isinstance(deep, bool), 'deep must be of type bool' - assert isinstance(rho, (int,float)), 'rho must be of type int or float' - assert isinstance(g, (int,float)), 'g must be of type int or float' - 
assert isinstance(ratio, (int,float)), 'ratio must be of type int or float' + S = convert_to_dataset(S) + if not isinstance(h, (int, float)): + raise TypeError(f"h must be of type int or float. Got: {type(h)}") + P = convert_to_dataarray(P) + if not isinstance(deep, bool): + raise TypeError(f"deep must be of type bool. Got: {type(deep)}") + if not isinstance(rho, (int, float)): + raise TypeError(f"rho must be of type int or float. Got: {type(rho)}") + if not isinstance(g, (int, float)): + raise TypeError(f"g must be of type int or float. Got: {type(g)}") + if not isinstance(ratio, (int, float)): + raise TypeError(f"ratio must be of type int or float. Got: {type(ratio)}") # Compute the enegy periods from the spectra data - Te = wave.resource.energy_period(S, frequency_bins=frequency_bins) - Te = Te['Te'] + Te = wave.resource.energy_period(S, frequency_bins=frequency_bins, to_pandas=False) + Te = Te["Te"] # Compute the significant wave height from the NDBC spectra data - Hm0 = wave.resource.significant_wave_height(S, frequency_bins=frequency_bins) - Hm0 = Hm0['Hm0'] + Hm0 = wave.resource.significant_wave_height( + S, frequency_bins=frequency_bins, to_pandas=False + ) + Hm0 = Hm0["Hm0"] # Compute the energy flux from spectra data and water depth - J = wave.resource.energy_flux(S, h, deep=deep, rho=rho, g=g, ratio=ratio) - J = J['J'] + J = wave.resource.energy_flux( + S, h, deep=deep, rho=rho, g=g, ratio=ratio, to_pandas=False + ) + J = J["J"] # Calculate capture length from power and energy flux - L = wave.performance.capture_length(P,J) + L = wave.performance.capture_length(P, J, to_pandas=False) # Generate bins for Hm0 and Te, input format (start, stop, step_size) - Hm0_bins = np.arange(0, Hm0.values.max() + .5, .5) + Hm0_bins = np.arange(0, Hm0.values.max() + 0.5, 0.5) Te_bins = np.arange(0, Te.values.max() + 1, 1) # Create capture length matrices for each statistic based on IEC/TS 62600-100 # Median, sum, frequency additionally provided - LM = xarray.Dataset() - 
LM['mean'] = wave.performance.capture_length_matrix(Hm0, Te, L, 'mean', Hm0_bins, Te_bins) - LM['std'] = wave.performance.capture_length_matrix(Hm0, Te, L, 'std', Hm0_bins, Te_bins) - LM['median'] = wave.performance.capture_length_matrix(Hm0, Te, L, 'median', Hm0_bins, Te_bins) - LM['count'] = wave.performance.capture_length_matrix(Hm0, Te, L, 'count', Hm0_bins, Te_bins) - LM['sum'] = wave.performance.capture_length_matrix(Hm0, Te, L, 'sum', Hm0_bins, Te_bins) - LM['min'] = wave.performance.capture_length_matrix(Hm0, Te, L, 'min', Hm0_bins, Te_bins) - LM['max'] = wave.performance.capture_length_matrix(Hm0, Te, L, 'max', Hm0_bins, Te_bins) - LM['freq'] = wave.performance.capture_length_matrix(Hm0, Te, L,'frequency', Hm0_bins, Te_bins) + LM = xr.Dataset() + LM["mean"] = wave.performance.capture_length_matrix( + Hm0, Te, L, "mean", Hm0_bins, Te_bins, to_pandas=False + ) + LM["std"] = wave.performance.capture_length_matrix( + Hm0, Te, L, "std", Hm0_bins, Te_bins, to_pandas=False + ) + LM["median"] = wave.performance.capture_length_matrix( + Hm0, Te, L, "median", Hm0_bins, Te_bins, to_pandas=False + ) + LM["count"] = wave.performance.capture_length_matrix( + Hm0, Te, L, "count", Hm0_bins, Te_bins, to_pandas=False + ) + LM["sum"] = wave.performance.capture_length_matrix( + Hm0, Te, L, "sum", Hm0_bins, Te_bins, to_pandas=False + ) + LM["min"] = wave.performance.capture_length_matrix( + Hm0, Te, L, "min", Hm0_bins, Te_bins, to_pandas=False + ) + LM["max"] = wave.performance.capture_length_matrix( + Hm0, Te, L, "max", Hm0_bins, Te_bins, to_pandas=False + ) + LM["freq"] = wave.performance.capture_length_matrix( + Hm0, Te, L, "frequency", Hm0_bins, Te_bins, to_pandas=False + ) # Create wave energy flux matrix using mean - JM = wave.performance.wave_energy_flux_matrix(Hm0, Te, J, 'mean', Hm0_bins, Te_bins) + JM = wave.performance.wave_energy_flux_matrix( + Hm0, Te, J, "mean", Hm0_bins, Te_bins, to_pandas=False + ) # Calculate maep from matrix - maep_matrix = 
wave.performance.mean_annual_energy_production_matrix(LM['mean'].to_pandas(), JM, LM['freq'].to_pandas()) + maep_matrix = wave.performance.mean_annual_energy_production_matrix( + LM["mean"], JM, LM["freq"] + ) # Plot capture length matrices using statistic for str in statistic: if str not in list(LM.data_vars): - print('ERROR: Invalid Statistics passed') + print("ERROR: Invalid Statistics passed") continue - plt.figure(figsize=(12,12), num='Capture Length Matrix ' + str) + plt.figure(figsize=(12, 12), num="Capture Length Matrix " + str) ax = plt.gca() - wave.graphics.plot_matrix(LM[str].to_pandas(), xlabel='Te (s)', ylabel='Hm0 (m)', zlabel= str + ' of Capture Length', show_values=show_values, ax=ax) - plt.savefig(join(savepath,'Capture Length Matrix ' + str + '.png')) + wave.graphics.plot_matrix( + LM[str], + xlabel="Te (s)", + ylabel="Hm0 (m)", + zlabel=str + " of Capture Length", + show_values=show_values, + ax=ax, + ) + plt.savefig(join(savepath, "Capture Length Matrix " + str + ".png")) return LM, maep_matrix diff --git a/mhkit/wave/resource.py b/mhkit/wave/resource.py index 5e6f54790..e38214eeb 100644 --- a/mhkit/wave/resource.py +++ b/mhkit/wave/resource.py @@ -1,18 +1,28 @@ from scipy.optimize import fsolve as _fsolve from scipy import signal as _signal import pandas as pd +import xarray as xr import numpy as np -from scipy import stats +from mhkit.utils import to_numeric_array, convert_to_dataarray, convert_to_dataset + ### Spectrum -def elevation_spectrum(eta, sample_rate, nnft, window='hann', - detrend=True, noverlap=None): +def elevation_spectrum( + eta, + sample_rate, + nnft, + window="hann", + detrend=True, + noverlap=None, + time_dimension="", + to_pandas=True, +): """ Calculates the wave energy spectrum from wave elevation time-series Parameters ------------ - eta: pandas DataFrame + eta: pandas DataFrame, pandas Series, xarray DataArray, or xarray Dataset Wave surface elevation [m] indexed by time [datetime or s] sample_rate: float Data frequency 
[Hz] @@ -27,69 +37,110 @@ def elevation_spectrum(eta, sample_rate, nnft, window='hann', noverlap: int, optional Number of points to overlap between segments. If None, ``noverlap = nperseg / 2``. Defaults to None. + time_dimension: string (optional) + Name of the xarray dimension corresponding to time. If not supplied, + defaults to the first dimension. Does not affect pandas input. + to_pandas: bool (optional) + Flag to output pandas instead of xarray. Default = True. Returns --------- - S: pandas DataFrame + S: pandas DataFrame or xr.Dataset Spectral density [m^2/Hz] indexed by frequency [Hz] """ # TODO: Add confidence intervals, equal energy frequency spacing, and NDBC # frequency spacing - # TODO: may need an assert for the length of nnft- signal.welch breaks when nfft is too short - # TODO: check for uniform sampling - assert isinstance(eta, pd.DataFrame), 'eta must be of type pd.DataFrame' - assert isinstance(sample_rate, (float,int)), 'sample_rate must be of type int or float' - assert isinstance(nnft, int), 'nnft must be of type int' - assert isinstance(window, str), 'window must be of type str' - assert isinstance(detrend, bool), 'detrend must be of type bool' - assert nnft > 0, 'nnft must be > 0' - assert sample_rate > 0, 'sample_rate must be > 0' - - S = pd.DataFrame() - for col in eta.columns: - data = eta[col] + # TODO: may need to raise an error for the length of nnft- signal.welch breaks when nfft is too short + eta = convert_to_dataset(eta) + if not isinstance(sample_rate, (float, int)): + raise TypeError( + f"sample_rate must be of type int or float. Got: {type(sample_rate)}" + ) + if not isinstance(nnft, int): + raise TypeError(f"nnft must be of type int. Got: {type(nnft)}") + if not isinstance(window, str): + raise TypeError(f"window must be of type str. Got: {type(window)}") + if not isinstance(detrend, bool): + raise TypeError(f"detrend must be of type bool. Got: {type(detrend)}") + if not nnft > 0: + raise ValueError(f"nnft must be > 0. 
Got: {nnft}") + if not sample_rate > 0: + raise ValueError(f"sample_rate must be > 0. Got: {sample_rate}") + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. Got: {type(to_pandas)}") + + if time_dimension == "": + time_dimension = list(eta.dims)[0] + else: + if time_dimension not in list(eta.dims): + raise ValueError( + f"time_dimension is not a dimension of eta ({list(eta.dims)}). Got: {time_dimension}." + ) + time = eta[time_dimension] + delta_t = time.values[1] - time.values[0] + if not np.allclose(time.diff(dim=time_dimension)[1:], delta_t): + raise ValueError( + "Time bins are not evenly spaced. Create a constant " + + "temporal spacing for eta." + ) + + S = xr.Dataset() + for var in eta.data_vars: + data = eta[var] if detrend: - data = _signal.detrend(data.dropna(), axis=-1, type='linear', bp=0) - [f, wave_spec_measured] = _signal.welch(data, fs=sample_rate, window=window, - nperseg=nnft, nfft=nnft, noverlap=noverlap) - S[col] = wave_spec_measured - S.index=f - S.columns = eta.columns + data = _signal.detrend( + data.dropna(dim=time_dimension), axis=-1, type="linear", bp=0 + ) + [f, wave_spec_measured] = _signal.welch( + data, + fs=sample_rate, + window=window, + nperseg=nnft, + nfft=nnft, + noverlap=noverlap, + ) + S[var] = (["Frequency"], wave_spec_measured) + S = S.assign_coords({"Frequency": f}) + + if to_pandas: + S = S.to_dataframe() return S -def pierson_moskowitz_spectrum(f, Tp, Hs): +def pierson_moskowitz_spectrum(f, Tp, Hs, to_pandas=True): """ Calculates Pierson-Moskowitz Spectrum from IEC TS 62600-2 ED2 Annex C.2 (2019) Parameters ------------ - f: numpy array + f: list, np.ndarray, pd.Series, xr.DataArray Frequency [Hz] Tp: float/int Peak period [s] Hs: float/int Significant wave height [m] + to_pandas: bool (optional) + Flag to output pandas instead of xarray. Default = True. 
Returns --------- - S: pandas DataFrame + S: xarray Dataset Spectral density [m^2/Hz] indexed frequency [Hz] """ - try: - f = np.array(f) - except: - pass - assert isinstance(f, np.ndarray), 'f must be of type np.ndarray' - assert isinstance(Tp, (int,float)), 'Tp must be of type int or float' - assert isinstance(Hs, (int,float)), 'Hs must be of type int or float' + f = to_numeric_array(f, "f") + if not isinstance(Tp, (int, float)): + raise TypeError(f"Tp must be of type int or float. Got: {type(Tp)}") + if not isinstance(Hs, (int, float)): + raise TypeError(f"Hs must be of type int or float. Got: {type(Hs)}") + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. Got: {type(to_pandas)}") f.sort() - B_PM = (5/4)*(1/Tp)**4 - A_PM = B_PM*(Hs/2)**2 + B_PM = (5 / 4) * (1 / Tp) ** 4 + A_PM = B_PM * (Hs / 2) ** 2 # Avoid a divide by zero if the 0 frequency is provided # The zero frequency should always have 0 amplitude, otherwise @@ -99,22 +150,25 @@ def pierson_moskowitz_spectrum(f, Tp, Hs): inds = range(1, f.size) else: inds = range(0, f.size) - - Sf[inds] = A_PM*f[inds]**(-5)*np.exp(-B_PM*f[inds]**(-4)) - col_name = 'Pierson-Moskowitz ('+str(Tp)+'s)' - S = pd.DataFrame(Sf, index=f, columns=[col_name]) + Sf[inds] = A_PM * f[inds] ** (-5) * np.exp(-B_PM * f[inds] ** (-4)) + + name = "Pierson-Moskowitz (" + str(Tp) + "s)" + S = xr.Dataset(data_vars={name: (["Frequency"], Sf)}, coords={"Frequency": f}) + + if to_pandas: + S = S.to_pandas() return S -def jonswap_spectrum(f, Tp, Hs, gamma=None): +def jonswap_spectrum(f, Tp, Hs, gamma=None, to_pandas=True): """ Calculates JONSWAP Spectrum from IEC TS 62600-2 ED2 Annex C.2 (2019) Parameters ------------ - f: numpy array + f: list, np.ndarray, pd.Series, xr.DataArray Frequency [Hz] Tp: float/int Peak period [s] @@ -122,26 +176,29 @@ def jonswap_spectrum(f, Tp, Hs, gamma=None): Significant wave height [m] gamma: float (optional) Gamma + to_pandas: bool (optional) + Flag to output pandas instead 
of xarray. Default = True. Returns --------- - S: pandas DataFrame + S: pandas Series or xarray DataArray Spectral density [m^2/Hz] indexed frequency [Hz] """ - - try: - f = np.array(f) - except: - pass - assert isinstance(f, np.ndarray), 'f must be of type np.ndarray' - assert isinstance(Tp, (int,float)), 'Tp must be of type int or float' - assert isinstance(Hs, (int,float)), 'Hs must be of type int or float' - assert isinstance(gamma, (int,float, type(None))), \ - 'gamma must be of type int or float' + f = to_numeric_array(f, "f") + if not isinstance(Tp, (int, float)): + raise TypeError(f"Tp must be of type int or float. Got: {type(Tp)}") + if not isinstance(Hs, (int, float)): + raise TypeError(f"Hs must be of type int or float. Got: {type(Hs)}") + if not isinstance(gamma, (int, float, type(None))): + raise TypeError( + f"If specified, gamma must be of type int or float. Got: {type(gamma)}" + ) + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. Got: {type(to_pandas)}") f.sort() - B_PM = (5/4)*(1/Tp)**4 - A_PM = B_PM*(Hs/2)**2 + B_PM = (5 / 4) * (1 / Tp) ** 4 + A_PM = B_PM * (Hs / 2) ** 2 # Avoid a divide by zero if the 0 frequency is provided # The zero frequency should always have 0 amplitude, otherwise @@ -152,52 +209,65 @@ def jonswap_spectrum(f, Tp, Hs, gamma=None): else: inds = range(0, f.size) - S_f[inds] = A_PM*f[inds]**(-5)*np.exp(-B_PM*f[inds]**(-4)) + S_f[inds] = A_PM * f[inds] ** (-5) * np.exp(-B_PM * f[inds] ** (-4)) if not gamma: - TpsqrtHs = Tp/np.sqrt(Hs); + TpsqrtHs = Tp / np.sqrt(Hs) if TpsqrtHs <= 3.6: - gamma = 5; + gamma = 5 elif TpsqrtHs > 5: - gamma = 1; + gamma = 1 else: - gamma = np.exp(5.75 - 1.15*TpsqrtHs); + gamma = np.exp(5.75 - 1.15 * TpsqrtHs) # Cutoff frequencies for gamma function siga = 0.07 sigb = 0.09 - fp = 1/Tp # peak frequency - lind = np.where(f<=fp) - hind = np.where(f>fp) + fp = 1 / Tp # peak frequency + lind = np.where(f <= fp) + hind = np.where(f > fp) Gf = np.zeros(f.shape) - 
Gf[lind] = gamma**np.exp(-(f[lind]-fp)**2/(2*siga**2*fp**2)) - Gf[hind] = gamma**np.exp(-(f[hind]-fp)**2/(2*sigb**2*fp**2)) - C = 1- 0.287*np.log(gamma) - Sf = C*S_f*Gf + Gf[lind] = gamma ** np.exp(-((f[lind] - fp) ** 2) / (2 * siga**2 * fp**2)) + Gf[hind] = gamma ** np.exp(-((f[hind] - fp) ** 2) / (2 * sigb**2 * fp**2)) + C = 1 - 0.287 * np.log(gamma) + Sf = C * S_f * Gf + + name = "JONSWAP (" + str(Hs) + "m," + str(Tp) + "s)" + S = xr.Dataset(data_vars={name: (["Frequency"], Sf)}, coords={"Frequency": f}) - col_name = 'JONSWAP ('+str(Hs)+'m,'+str(Tp)+'s)' - S = pd.DataFrame(Sf, index=f, columns=[col_name]) + if to_pandas: + S = S.to_pandas() return S + ### Metrics -def surface_elevation(S, time_index, seed=None, frequency_bins=None, phases=None, method='ifft'): +def surface_elevation( + S, + time_index, + seed=None, + frequency_bins=None, + phases=None, + method="ifft", + frequency_dimension="", + to_pandas=True, +): """ Calculates wave elevation time-series from spectrum Parameters ------------ - S: pandas DataFrame + S: pandas DataFrame, pandas Series, xarray DataArray, or xarray Dataset Spectral density [m^2/Hz] indexed by frequency [Hz] time_index: numpy array Time used to create the wave elevation time-series [s], for example, time = np.arange(0,100,0.01) seed: int (optional) Random seed - frequency_bins: numpy array or pandas DataFrame (optional) + frequency_bins: numpy array, pandas Series, or xarray DataArray (optional) Bin widths for frequency of S. 
Required for unevenly sized bins - phases: numpy array or pandas DataFrame (optional) + phases: pandas DataFrame, pandas Series, xarray DataArray, or xarray Dataset Explicit phases for frequency components (overrides seed) for example, phases = np.random.rand(len(S)) * 2 * np.pi method: str (optional) @@ -207,372 +277,524 @@ def surface_elevation(S, time_index, seed=None, frequency_bins=None, phases=None 'sum_of_sines' explicitly sums each frequency component and used by default if frequency_bins are provided. The 'ifft' method is significantly faster. + frequency_dimension: string (optional) + Name of the xarray dimension corresponding to frequency. If not supplied, + defaults to the first dimension. Does not affect pandas input. + to_pandas: bool (optional) + Flag to output pandas instead of xarray. Default = True. Returns --------- - eta: pandas DataFrame + eta: pandas DataFrame or xarray Dataset Wave surface elevation [m] indexed by time [s] """ - time_index = np.array(time_index) - assert isinstance(S, pd.DataFrame), 'S must be of type pd.DataFrame' - assert isinstance(time_index, np.ndarray), ('time_index must be of type' - 'np.ndarray') - assert isinstance(seed, (type(None),int)), 'seed must be of type int' - assert isinstance(frequency_bins, (type(None), np.ndarray, pd.DataFrame)),( - "frequency_bins must be of type None, np.ndarray, or pd,DataFrame") - assert isinstance(phases, (type(None), np.ndarray, pd.DataFrame)), ( - 'phases must be of type None, np.ndarray, or pd,DataFrame') - assert isinstance(method, str) - + time_index = to_numeric_array(time_index, "time_index") + S = convert_to_dataset(S) + if not isinstance(seed, (type(None), int)): + raise TypeError(f"If specified, seed must be of type int. Got: {type(seed)}") + if not isinstance(phases, type(None)): + phases = convert_to_dataset(phases) + if not isinstance(method, str): + raise TypeError(f"method must be of type str. 
Got: {type(method)}") + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. Got: {type(to_pandas)}") + + if frequency_dimension == "": + frequency_dimension = list(S.coords)[0] + elif frequency_dimension not in list(S.dims): + raise ValueError( + f"frequency_dimension is not a dimension of S ({list(S.dims)}). Got: {frequency_dimension}." + ) + f = S[frequency_dimension] + + if not isinstance(frequency_bins, (type(None), np.ndarray)): + frequency_bins = convert_to_dataarray(frequency_bins) + elif isinstance(frequency_bins, np.ndarray): + frequency_bins = xr.DataArray( + data=frequency_bins, + dims=frequency_dimension, + coords={frequency_dimension: f}, + ) if frequency_bins is not None: - assert frequency_bins.squeeze().shape == (S.squeeze().shape[0],),( - 'shape of frequency_bins must match shape of S') + if not frequency_bins.squeeze().shape == f.shape: + raise ValueError( + "shape of frequency_bins must match shape of the frequency dimension of S" + ) if phases is not None: - assert phases.squeeze().shape == S.squeeze().shape,( - 'shape of phases must match shape of S') - + if not list(phases.data_vars) == list(S.data_vars): + raise ValueError("phases must have the same variable names as S") + for var in phases.data_vars: + if not phases[var].shape == S[var].shape: + raise ValueError( + "shape of variables in phases must match shape of variables in S" + ) if method is not None: - assert method == 'ifft' or method == 'sum_of_sines',( - f"unknown method {method}, options are 'ifft' or 'sum_of_sines'") - - if method == 'ifft': - assert S.index.values[0] == 0, ('ifft method must have zero frequency defined') - - f = pd.Series(S.index) - f.index = f + if not (method == "ifft" or method == "sum_of_sines"): + raise ValueError(f"Method must be 'ifft' or 'sum_of_sines'. Got: {method}") + + if method == "ifft": + if not f[0] == 0: + raise ValueError( + f"ifft method must have zero frequency defined. 
Lowest frequency is: {S.index.values[0]}" + ) + if frequency_bins is None: - delta_f = f.values[1]-f.values[0] - assert np.allclose(f.diff()[1:], delta_f) - elif isinstance(frequency_bins, np.ndarray): - delta_f = pd.Series(frequency_bins, index=S.index) - method = 'sum_of_sines' - elif isinstance(frequency_bins, pd.DataFrame): - assert len(frequency_bins.columns) == 1, ('frequency_bins must only' - 'contain 1 column') - delta_f = frequency_bins.squeeze() - method = 'sum_of_sines' - - if phases is None: - np.random.seed(seed) - phase = pd.DataFrame(2*np.pi*np.random.rand(S.shape[0], S.shape[1]), - index=S.index, columns=S.columns) - elif isinstance(phases, np.ndarray): - phase = pd.DataFrame(phases, index=S.index, columns=S.columns) - elif isinstance(phases, pd.DataFrame): - phase = phases - - omega = pd.Series(2*np.pi*f) - omega.index = f - - # Wave amplitude times delta f - A = 2*S - A = A.multiply(delta_f, axis=0) - A = np.sqrt(A) - - if method == 'ifft': - A_cmplx = A * (np.cos(phase) + 1j*np.sin(phase)) - - def func(v): - eta = np.fft.irfft(0.5 * v.values.squeeze() * time_index.size, time_index.size) - return pd.Series(data=eta, index=time_index) - - eta = A_cmplx.apply(func) - - elif method == 'sum_of_sines': - # Product of omega and time - B = np.outer(time_index, omega) - B = B.reshape((len(time_index), len(omega))) - B = pd.DataFrame(B, index=time_index, columns=omega.index) - - # wave elevation - eta = pd.DataFrame(columns=S.columns, index=time_index) - for mcol in eta.columns: - C = np.cos(B+phase[mcol]) - C = pd.DataFrame(C, index=time_index, columns=omega.index) - eta[mcol] = (C*A[mcol]).sum(axis=1) - + delta_f = f.values[1] - f.values[0] + if not np.allclose(f.diff(dim=frequency_dimension)[1:], delta_f): + raise ValueError( + "Frequency bins are not evenly spaced. " + + "Define 'frequency_bins' or create a constant " + + "frequency spacing for S." 
+ ) + else: + if not len(frequency_bins.squeeze().shape) == 1: + raise ValueError("frequency_bins must only contain 1 column") + delta_f = frequency_bins + method = "sum_of_sines" + + omega = xr.DataArray( + data=2 * np.pi * f, dims=frequency_dimension, coords={frequency_dimension: f} + ) + + eta = xr.Dataset() + for var in S.data_vars: + if phases is None: + np.random.seed(seed) + phase = xr.DataArray( + data=2 * np.pi * np.random.rand(S[var].size), + dims="Frequency", + coords={"Frequency": f}, + ) + else: + phase = phases[var] + + # Wave amplitude times delta f + A = 2 * S[var] + A = A * delta_f + A = np.sqrt(A) + + if method == "ifft": + A_cmplx = A * (np.cos(phase) + 1j * np.sin(phase)) + eta_tmp = np.fft.irfft( + 0.5 * A_cmplx.values * time_index.size, time_index.size + ) + eta[var] = xr.DataArray( + data=eta_tmp, dims="Time", coords={"Time": time_index} + ) + + elif method == "sum_of_sines": + # Product of omega and time + B = np.outer(time_index, omega) + B = B.reshape((len(time_index), len(omega))) + B = xr.DataArray( + data=B, + dims=["Time", "Frequency"], + coords={"Time": time_index, "Frequency": f}, + ) + + # wave elevation + # eta = xr.DataArray(columns=S.columns, index=time_index) + # for mcol in eta.columns: + C = np.cos(B + phase) + # C = xr.DataArray(data=C, index=time_index, columns=omega.index) + eta[var] = (C * A).sum(axis=1) + + if to_pandas: + eta = eta.to_dataframe() + return eta -def frequency_moment(S, N, frequency_bins=None): +def frequency_moment(S, N, frequency_bins=None, frequency_dimension="", to_pandas=True): """ Calculates the Nth frequency moment of the spectrum Parameters ----------- - S: pandas DataFrame + S: pandas DataFrame, pandas Series, xarray DataArray, or xarray Dataset Spectral density [m^2/Hz] indexed by frequency [Hz] N: int Moment (0 for 0th, 1 for 1st ....) frequency_bins: numpy array or pandas Series (optional) Bin widths for frequency of S. 
Required for unevenly sized bins + frequency_dimension: string (optional) + Name of the xarray dimension corresponding to frequency. If not supplied, + defaults to the first dimension. Does not affect pandas input. + to_pandas: bool (optional) + Flag to output pandas instead of xarray. Default = True. Returns ------- - m: pandas DataFrame + m: pandas DataFrame or xarray Dataset Nth Frequency Moment indexed by S.columns """ - assert isinstance(S, (pd.Series,pd.DataFrame)), 'S must be of type pd.DataFrame or pd.Series' - assert isinstance(N, int), 'N must be of type int' + S = convert_to_dataset(S) + if not isinstance(N, int): + raise TypeError(f"N must be of type int. Got: {type(N)}") + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. Got: {type(to_pandas)}") + + if frequency_dimension == "": + frequency_dimension = list(S.coords)[0] + elif frequency_dimension not in list(S.dims): + raise ValueError( + f"frequency_dimension is not a dimension of S ({list(S.dims)}). Got: {frequency_dimension}." 
+ ) + f = S[frequency_dimension] # Eq 8 in IEC 62600-101 - spec = S[S.index > 0] # omit frequency of 0 + S = S.sel({frequency_dimension: slice(1e-12, f.max())}) # omit frequency of 0 + f = S[frequency_dimension] # reset frequency_dimension without the 0 frequency - f = spec.index fn = np.power(f, N) if frequency_bins is None: - delta_f = pd.Series(f).diff() - delta_f[0] = f[1]-f[0] + delta_f = f.diff(dim=frequency_dimension) + delta_f0 = f[1] - f[0] + delta_f0 = delta_f0.assign_coords({frequency_dimension: f[0]}) + delta_f = xr.concat([delta_f0, delta_f], dim=frequency_dimension) else: + delta_f = xr.DataArray( + data=convert_to_dataarray(frequency_bins), + dims=frequency_dimension, + coords={frequency_dimension: f}, + ) - assert isinstance(frequency_bins, (np.ndarray,pd.Series,pd.DataFrame)),( - 'frequency_bins must be of type np.ndarray or pd.Series') - delta_f = pd.Series(frequency_bins) + m = S * fn * delta_f + m = m.sum(dim=frequency_dimension) - delta_f.index = f + m = _transform_dataset(m, "m" + str(N)) - m = spec.multiply(fn,axis=0).multiply(delta_f,axis=0) - m = m.sum(axis=0) - if isinstance(S,pd.Series): - m = pd.DataFrame(m, index=[0], columns = ['m'+str(N)]) - else: - m = pd.DataFrame(m, index=S.columns, columns = ['m'+str(N)]) + if to_pandas: + m = m.to_dataframe() return m -def significant_wave_height(S, frequency_bins=None): +def significant_wave_height(S, frequency_bins=None, to_pandas=True): """ Calculates wave height from spectra Parameters ------------ - S: pandas DataFrame + S: pandas DataFrame, pandas Series, xarray DataArray, or xarray Dataset Spectral density [m^2/Hz] indexed by frequency [Hz] frequency_bins: numpy array or pandas Series (optional) Bin widths for frequency of S. Required for unevenly sized bins + to_pandas: bool (optional) + Flag to output pandas instead of xarray. Default = True. 
Returns --------- - Hm0: pandas DataFrame + Hm0: pandas DataFrame or xarray Dataset Significant wave height [m] index by S.columns """ - assert isinstance(S, (pd.Series,pd.DataFrame)), 'S must be of type pd.DataFrame or pd.Series' + S = convert_to_dataset(S) + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. Got: {type(to_pandas)}") # Eq 12 in IEC 62600-101 + m0 = frequency_moment(S, 0, frequency_bins=frequency_bins, to_pandas=False).rename( + {"m0": "Hm0"} + ) + Hm0 = 4 * np.sqrt(m0) - Hm0 = 4*np.sqrt(frequency_moment(S,0,frequency_bins=frequency_bins)) - Hm0.columns = ['Hm0'] + if to_pandas: + Hm0 = Hm0.to_dataframe() return Hm0 -def average_zero_crossing_period(S,frequency_bins=None): +def average_zero_crossing_period(S, frequency_bins=None, to_pandas=True): """ Calculates wave average zero crossing period from spectra Parameters ------------ - S: pandas DataFrame + S: pandas DataFrame, pandas Series, xarray DataArray, or xarray Dataset Spectral density [m^2/Hz] indexed by frequency [Hz] frequency_bins: numpy array or pandas Series (optional) Bin widths for frequency of S. Required for unevenly sized bins + to_pandas: bool (optional) + Flag to output pandas instead of xarray. Default = True. Returns --------- - Tz: pandas DataFrame + Tz: pandas DataFrame or xarray Dataset Average zero crossing period [s] indexed by S.columns """ - assert isinstance(S, pd.DataFrame), 'S must be of type pd.DataFrame' + S = convert_to_dataset(S) + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. 
Got: {type(to_pandas)}") # Eq 15 in IEC 62600-101 - m0 = frequency_moment(S,0,frequency_bins=frequency_bins).squeeze() # convert to Series for calculation - m2 = frequency_moment(S,2,frequency_bins=frequency_bins).squeeze() + m0 = frequency_moment(S, 0, frequency_bins=frequency_bins, to_pandas=False).rename( + {"m0": "Tz"} + ) + m2 = frequency_moment(S, 2, frequency_bins=frequency_bins, to_pandas=False).rename( + {"m2": "Tz"} + ) + + Tz = np.sqrt(m0 / m2) - Tz = np.sqrt(m0/m2) - Tz = pd.DataFrame(Tz, index=S.columns, columns = ['Tz']) + if to_pandas: + Tz = Tz.to_dataframe() return Tz -def average_crest_period(S,frequency_bins=None): +def average_crest_period(S, frequency_bins=None, to_pandas=True): """ Calculates wave average crest period from spectra Parameters ------------ - S: pandas DataFrame + S: pandas DataFrame, pandas Series, xarray DataArray, or xarray Dataset Spectral density [m^2/Hz] indexed by frequency [Hz] frequency_bins: numpy array or pandas Series (optional) Bin widths for frequency of S. Required for unevenly sized bins + to_pandas: bool (optional) + Flag to output pandas instead of xarray. Default = True. Returns --------- - Tavg: pandas DataFrame + Tavg: pandas DataFrame or xarray Dataset Average wave period [s] indexed by S.columns """ - assert isinstance(S, pd.DataFrame), 'S must be of type pd.DataFrame' + S = convert_to_dataset(S) + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. 
Got: {type(to_pandas)}") + + m2 = frequency_moment(S, 2, frequency_bins=frequency_bins, to_pandas=False).rename( + {"m2": "Tavg"} + ) + m4 = frequency_moment(S, 4, frequency_bins=frequency_bins, to_pandas=False).rename( + {"m4": "Tavg"} + ) - m2 = frequency_moment(S,2,frequency_bins=frequency_bins).squeeze() # convert to Series for calculation - m4 = frequency_moment(S,4,frequency_bins=frequency_bins).squeeze() + Tavg = np.sqrt(m2 / m4) - Tavg = np.sqrt(m2/m4) - Tavg = pd.DataFrame(Tavg, index=S.columns, columns=['Tavg']) + if to_pandas: + Tavg = Tavg.to_dataframe() return Tavg -def average_wave_period(S,frequency_bins=None): +def average_wave_period(S, frequency_bins=None, to_pandas=True): """ Calculates mean wave period from spectra Parameters ------------ - S: pandas DataFrame + S: pandas DataFrame, pandas Series, xarray DataArray, or xarray Dataset Spectral density [m^2/Hz] indexed by frequency [Hz] frequency_bins: numpy array or pandas Series (optional) Bin widths for frequency of S. Required for unevenly sized bins + to_pandas: bool (optional) + Flag to output pandas instead of xarray. Default = True. Returns --------- - Tm: pandas DataFrame + Tm: pandas DataFrame or xarray Dataset Mean wave period [s] indexed by S.columns """ - assert isinstance(S, pd.DataFrame), 'S must be of type pd.DataFrame' + S = convert_to_dataset(S) + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. 
Got: {type(to_pandas)}") - m0 = frequency_moment(S,0,frequency_bins=frequency_bins).squeeze() # convert to Series for calculation - m1 = frequency_moment(S,1,frequency_bins=frequency_bins).squeeze() + m0 = frequency_moment(S, 0, frequency_bins=frequency_bins, to_pandas=False).rename( + {"m0": "Tm"} + ) + m1 = frequency_moment(S, 1, frequency_bins=frequency_bins, to_pandas=False).rename( + {"m1": "Tm"} + ) - Tm = np.sqrt(m0/m1) - Tm = pd.DataFrame(Tm, index=S.columns, columns=['Tm']) + Tm = np.sqrt(m0 / m1) + + if to_pandas: + Tm = Tm.to_dataframe() return Tm -def peak_period(S): +def peak_period(S, frequency_dimension="", to_pandas=True): """ Calculates wave peak period from spectra Parameters ------------ - S: pandas DataFrame + S: pandas DataFrame, pandas Series, xarray DataArray, or xarray Dataset Spectral density [m^2/Hz] indexed by frequency [Hz] + frequency_dimension: string (optional) + Name of the xarray dimension corresponding to frequency. If not supplied, + defaults to the first dimension. Does not affect pandas input. + to_pandas: bool (optional) + Flag to output pandas instead of xarray. Default = True. Returns --------- - Tp: pandas DataFrame + Tp: pandas DataFrame or xarray Dataset Wave peak period [s] indexed by S.columns """ - assert isinstance(S, pd.DataFrame), 'S must be of type pd.DataFrame' + S = convert_to_dataset(S) + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. Got: {type(to_pandas)}") + + if frequency_dimension == "": + frequency_dimension = list(S.coords)[0] + elif frequency_dimension not in list(S.dims): + raise ValueError( + f"frequency_dimension is not a dimension of S ({list(S.dims)}). Got: {frequency_dimension}." 
+ ) # Eq 14 in IEC 62600-101 - fp = S.idxmax(axis=0) # Hz + fp = S.idxmax(dim=frequency_dimension) # Hz + Tp = 1 / fp + + Tp = _transform_dataset(Tp, "Tp") - Tp = 1/fp - Tp = pd.DataFrame(Tp, index=S.columns, columns=["Tp"]) + if to_pandas: + Tp = Tp.to_dataframe() return Tp -def energy_period(S,frequency_bins=None): +def energy_period(S, frequency_bins=None, to_pandas=True): """ Calculates wave energy period from spectra Parameters ------------ - S: pandas DataFrame + S: pandas DataFrame, pandas Series, xarray DataArray, or xarray Dataset Spectral density [m^2/Hz] indexed by frequency [Hz] frequency_bins: numpy array or pandas Series (optional) Bin widths for frequency of S. Required for unevenly sized bins + to_pandas: bool (optional) + Flag to output pandas instead of xarray. Default = True. Returns --------- - Te: pandas DataFrame + Te: pandas DataFrame or xarray Dataset Wave energy period [s] indexed by S.columns """ + S = convert_to_dataset(S) + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. 
Got: {type(to_pandas)}") - assert isinstance(S, (pd.Series,pd.DataFrame)), 'S must be of type pd.DataFrame or pd.Series' - - mn1 = frequency_moment(S,-1,frequency_bins=frequency_bins).squeeze() # convert to Series for calculation - m0 = frequency_moment(S,0,frequency_bins=frequency_bins).squeeze() + mn1 = frequency_moment( + S, -1, frequency_bins=frequency_bins, to_pandas=False + ).rename({"m-1": "Te"}) + m0 = frequency_moment(S, 0, frequency_bins=frequency_bins, to_pandas=False).rename( + {"m0": "Te"} + ) # Eq 13 in IEC 62600-101 - Te = mn1/m0 - if isinstance(S,pd.Series): - Te = pd.DataFrame(Te, index=[0], columns=['Te']) - else: - Te = pd.DataFrame(Te, S.columns, columns=['Te']) + Te = mn1 / m0 + if to_pandas: + Te = Te.to_dataframe() return Te -def spectral_bandwidth(S,frequency_bins=None): +def spectral_bandwidth(S, frequency_bins=None, to_pandas=True): """ Calculates bandwidth from spectra Parameters ------------ - S: pandas DataFrame + S: pandas DataFrame, pandas Series, xarray DataArray, or xarray Dataset Spectral density [m^2/Hz] indexed by frequency [Hz] frequency_bins: numpy array or pandas Series (optional) Bin widths for frequency of S. Required for unevenly sized bins + to_pandas: bool (optional) + Flag to output pandas instead of xarray. Default = True. Returns --------- - e: pandas DataFrame + e: pandas DataFrame or xarray Dataset Spectral bandwidth [s] indexed by S.columns """ - assert isinstance(S, pd.DataFrame), 'S must be of type pd.DataFrame' + S = convert_to_dataset(S) + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. 
Got: {type(to_pandas)}") - m2 = frequency_moment(S,2,frequency_bins=frequency_bins).squeeze() # convert to Series for calculation - m0 = frequency_moment(S,0,frequency_bins=frequency_bins).squeeze() - m4 = frequency_moment(S,4,frequency_bins=frequency_bins).squeeze() + m2 = frequency_moment(S, 2, frequency_bins=frequency_bins, to_pandas=False).rename( + {"m2": "e"} + ) + m0 = frequency_moment(S, 0, frequency_bins=frequency_bins, to_pandas=False).rename( + {"m0": "e"} + ) + m4 = frequency_moment(S, 4, frequency_bins=frequency_bins, to_pandas=False).rename( + {"m4": "e"} + ) - e = np.sqrt(1- (m2**2)/(m0/m4)) - e = pd.DataFrame(e, index=S.columns, columns=['e']) + e = np.sqrt(1 - (m2**2) / (m0 / m4)) + + if to_pandas: + e = e.to_dataframe() return e -def spectral_width(S,frequency_bins=None): +def spectral_width(S, frequency_bins=None, to_pandas=True): """ Calculates wave spectral width from spectra Parameters ------------ - S: pandas DataFrame + S: pandas DataFrame, pandas Series, xarray DataArray, or xarray Dataset Spectral density [m^2/Hz] indexed by frequency [Hz] frequency_bins: numpy array or pandas Series (optional) Bin widths for frequency of S. Required for unevenly sized bins + to_pandas: bool (optional) + Flag to output pandas instead of xarray. Default = True. Returns --------- - v: pandas DataFrame + v: pandas DataFrame or xarray Dataset Spectral width [m] indexed by S.columns """ - assert isinstance(S, pd.DataFrame), 'S must be of type pd.DataFrame' - - mn2 = frequency_moment(S,-2,frequency_bins=frequency_bins).squeeze() # convert to Series for calculation - m0 = frequency_moment(S,0,frequency_bins=frequency_bins).squeeze() - mn1 = frequency_moment(S,-1,frequency_bins=frequency_bins).squeeze() + S = convert_to_dataset(S) + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. 
Got: {type(to_pandas)}") + + mn2 = frequency_moment( + S, -2, frequency_bins=frequency_bins, to_pandas=False + ).rename({"m-2": "v"}) + m0 = frequency_moment(S, 0, frequency_bins=frequency_bins, to_pandas=False).rename( + {"m0": "v"} + ) + mn1 = frequency_moment( + S, -1, frequency_bins=frequency_bins, to_pandas=False + ).rename({"m-1": "v"}) # Eq 16 in IEC 62600-101 - v = np.sqrt((m0*mn2/np.power(mn1,2))-1) - v = pd.DataFrame(v, index=S.columns, columns=['v']) + v = np.sqrt((m0 * mn2 / np.power(mn1, 2)) - 1) + + if to_pandas: + v = v.to_dataframe() return v -def energy_flux(S, h, deep=False, rho=1025, g=9.80665, ratio=2): +def energy_flux( + S, + h, + deep=False, + rho=1025, + g=9.80665, + ratio=2, + frequency_dimension="", + to_pandas=True, +): """ Calculates the omnidirectional wave energy flux of the spectra Parameters ----------- - S: pandas DataFrame or Series + S: pandas DataFrame, pandas Series, xarray DataArray, or xarray Dataset Spectral density [m^2/Hz] indexed by frequency [Hz] h: float Water depth [m] @@ -588,55 +810,70 @@ def energy_flux(S, h, deep=False, rho=1025, g=9.80665, ratio=2): ratio: float or int (optional) Only applied if depth=False. If h/l > ratio, water depth will be set to deep. Default ratio = 2. + frequency_dimension: string (optional) + Name of the xarray dimension corresponding to frequency. If not supplied, + defaults to the first dimension. Does not affect pandas input. + to_pandas: bool (optional) + Flag to output pandas instead of xarray. Default = True. 
Returns ------- - J: pandas DataFrame + J: pandas DataFrame or xarray Dataset Omni-directional wave energy flux [W/m] indexed by S.columns """ - assert isinstance(S, (pd.Series,pd.DataFrame)), 'S must be of type pd.DataFrame or pd.Series' - assert isinstance(h, (int,float)), 'h must be of type int or float' - assert isinstance(deep, bool), 'deep must be of type bool' - assert isinstance(rho, (int,float)), 'rho must be of type int or float' - assert isinstance(g, (int,float)), 'g must be of type int or float' - assert isinstance(ratio, (int,float)), 'ratio must be of type int or float' + S = convert_to_dataset(S) + if not isinstance(h, (int, float)): + raise TypeError(f"h must be of type int or float. Got: {type(h)}") + if not isinstance(deep, bool): + raise TypeError(f"deep must be of type bool. Got: {type(deep)}") + if not isinstance(rho, (int, float)): + raise TypeError(f"rho must be of type int or float. Got: {type(rho)}") + if not isinstance(g, (int, float)): + raise TypeError(f"g must be of type int or float. Got: {type(g)}") + if not isinstance(ratio, (int, float)): + raise TypeError(f"ratio must be of type int or float. Got: {type(ratio)}") + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. Got: {type(to_pandas)}") + + if frequency_dimension == "": + frequency_dimension = list(S.coords)[0] + elif frequency_dimension not in list(S.dims): + raise ValueError( + f"frequency_dimension is not a dimension of S ({list(S.dims)}). Got: {frequency_dimension}." 
+ ) + f = S[frequency_dimension] if deep: - # Eq 8 in IEC 62600-100, deep water simpilification - Te = energy_period(S) - Hm0 = significant_wave_height(S) + # Eq 8 in IEC 62600-100, deep water simplification + Te = energy_period(S, to_pandas=False).rename({"Te": "J"}) + Hm0 = significant_wave_height(S, to_pandas=False).rename({"Hm0": "J"}) - coeff = rho*(g**2)/(64*np.pi) - - J = coeff*(Hm0.squeeze()**2)*Te.squeeze() - if isinstance(S,pd.Series): - J = pd.DataFrame(J, index=[0], columns=["J"]) - else: - J = pd.DataFrame(J, S.columns, columns=["J"]) + coeff = rho * (g**2) / (64 * np.pi) + J = coeff * (Hm0**2) * Te else: # deep water flag is false - f = S.index - - k = wave_number(f, h, rho, g) + k = wave_number(f, h, rho, g, to_pandas=False) # wave celerity (group velocity) - Cg = wave_celerity(k, h, g, depth_check=True, ratio=ratio).squeeze() + Cg = wave_celerity(k, h, g, depth_check=True, ratio=ratio, to_pandas=False)[ + "Cg" + ] # Calculating the wave energy flux, Eq 9 in IEC 62600-101 - delta_f = pd.Series(f).diff() - delta_f.index = f - delta_f[f[0]] = delta_f[f[1]] # fill the initial NaN + delta_f = f.diff(dim=frequency_dimension) + delta_f0 = f[1] - f[0] + delta_f0 = delta_f0.assign_coords({frequency_dimension: f[0]}) + delta_f = xr.concat([delta_f0, delta_f], dim=frequency_dimension) - CgSdelF = S.multiply(delta_f, axis=0).multiply(Cg, axis=0) + CgSdelF = S * delta_f * Cg - J = rho * g * CgSdelF.sum(axis=0) + J = rho * g * CgSdelF.sum(dim=frequency_dimension) + J = _transform_dataset(J, "J") - if isinstance(S,pd.Series): - J = pd.DataFrame(J, index=[0], columns=["J"]) - else: - J = pd.DataFrame(J, S.columns, columns=["J"]) + if to_pandas: + J = J.to_dataframe() return J @@ -651,8 +888,7 @@ def energy_period_to_peak_period(Te, gamma): Parameters ---------- - Te: float or array - Spectral energy period [s] + Te: int, float, np.ndarray, pd.Series, pd.DataFrame, xr.DataArray, xr.Dataset gamma: float or int Peak enhancement factor for JONSWAP spectrum @@ -661,21 
+897,33 @@ def energy_period_to_peak_period(Te, gamma): Tp: float or array Spectral peak period [s] """ - assert isinstance(Te, (float, np.ndarray)), 'Te must be a float or a ndarray' - assert isinstance(gamma, (float, int)), 'gamma must be of type float or int' + if not isinstance( + Te, (int, float, np.ndarray, pd.Series, pd.DataFrame, xr.DataArray, xr.Dataset) + ): + raise TypeError( + f"Te must be an int, float, np.ndarray, pd.Series, pd.DataFrame, xr.DataArray or xr.Dataset. Got: {type(Te)}" + ) + if not isinstance(gamma, (float, int)): + raise TypeError(f"gamma must be of type float or int. Got: {type(gamma)}") + + factor = 0.8255 + 0.03852 * gamma - 0.005537 * gamma**2 + 0.0003154 * gamma**3 - factor = 0.8255 + 0.03852*gamma - 0.005537*gamma**2 + 0.0003154*gamma**3 + Tp = Te / factor + if isinstance(Tp, xr.Dataset): + Tp.rename({"Te": "Tp"}) - return Te / factor + return Tp -def wave_celerity(k, h, g=9.80665, depth_check=False, ratio=2): +def wave_celerity( + k, h, g=9.80665, depth_check=False, ratio=2, frequency_dimension="", to_pandas=True +): """ Calculates wave celerity (group velocity) Parameters ---------- - k: pandas DataFrame or Series + k: pandas DataFrame, pandas Series, xarray DataArray, or xarray Dataset Wave number [1/m] indexed by frequency [Hz] h: float Water depth [m] @@ -686,22 +934,36 @@ def wave_celerity(k, h, g=9.80665, depth_check=False, ratio=2): ratio: float or int (optional) Only applied if depth_check=True. If h/l > ratio, water depth will be set to deep. Default ratio = 2 + frequency_dimension: string (optional) + Name of the xarray dimension corresponding to frequency. If not supplied, + defaults to the first dimension. Does not affect pandas input. + to_pandas: bool (optional) + Flag to output pandas instead of xarray. Default = True. 
Returns ------- - Cg: pandas DataFrame + Cg: pandas DataFrame or xarray Dataset Water celerity [m/s] indexed by frequency [Hz] """ - if isinstance(k, pd.DataFrame): - k = k.squeeze() - - assert isinstance(k, pd.Series), 'S must be of type pd.Series' - assert isinstance(h, (int,float)), 'h must be of type int or float' - assert isinstance(g, (int,float)), 'g must be of type int or float' - assert isinstance(depth_check, bool), 'depth_check must be of type bool' - assert isinstance(ratio, (int,float)), 'ratio must be of type int or float' - - f = k.index + k = convert_to_dataarray(k) + if not isinstance(h, (int, float)): + raise TypeError(f"h must be of type int or float. Got: {type(h)}") + if not isinstance(g, (int, float)): + raise TypeError(f"g must be of type int or float. Got: {type(g)}") + if not isinstance(depth_check, bool): + raise TypeError(f"depth_check must be of type bool. Got: {type(depth_check)}") + if not isinstance(ratio, (int, float)): + raise TypeError(f"ratio must be of type int or float. Got: {type(ratio)}") + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. Got: {type(to_pandas)}") + + if frequency_dimension == "": + frequency_dimension = list(k.coords)[0] + elif frequency_dimension not in list(k.dims): + raise ValueError( + f"frequency_dimension is not a dimension of k ({list(k.dims)}). Got: {frequency_dimension}." 
+ ) + f = k[frequency_dimension] k = k.values if depth_check: @@ -715,21 +977,36 @@ def wave_celerity(k, h, g=9.80665, depth_check=False, ratio=2): dk = k[dr] # deep water approximation - dCg = (np.pi * df / dk) - dCg = pd.DataFrame(dCg, index=df, columns=["Cg"]) + dCg = np.pi * df / dk + dCg = xr.DataArray( + data=dCg, dims=frequency_dimension, coords={frequency_dimension: df} + ) + dCg.name = "Cg" # shallow frequencies sf = f[~dr] sk = k[~dr] sCg = (np.pi * sf / sk) * (1 + (2 * h * sk) / np.sinh(2 * h * sk)) - sCg = pd.DataFrame(sCg, index = sf, columns = ["Cg"]) + sCg = xr.DataArray( + data=sCg, dims=frequency_dimension, coords={frequency_dimension: sf} + ) + sCg.name = "Cg" - Cg = pd.concat([dCg, sCg]).sort_index() + Cg = xr.concat([dCg, sCg], dim=frequency_dimension).sortby(frequency_dimension) + Cg.name = "Cg" else: # Eq 10 in IEC 62600-101 Cg = (np.pi * f / k) * (1 + (2 * h * k) / np.sinh(2 * h * k)) - Cg = pd.DataFrame(Cg, index=f, columns=["Cg"]) + Cg = xr.DataArray( + data=Cg, dims=frequency_dimension, coords={frequency_dimension: f} + ) + Cg.name = "Cg" + + Cg = Cg.to_dataset() + + if to_pandas: + Cg = Cg.to_dataframe() return Cg @@ -741,29 +1018,27 @@ def wave_length(k): Parameters ------------- - k: pandas Dataframe + k: int, float, numpy ndarray, pandas Series, pandas DataFrame, xarray DataArray, or xarray Dataset Wave number [1/m] indexed by frequency Returns --------- - l: float or array - Wave length [m] indexed by frequency + l: int, float, numpy ndarray, pandas Series, pandas DataFrame, xarray DataArray, or xarray Dataset + Wave length [m] indexed by frequency. Output type is identical to the type of k. 
""" - if isinstance(k, (int, float, list)): - k = np.array(k) - elif isinstance(k, pd.DataFrame): - k = k.squeeze().values - elif isinstance(k, pd.Series): - k = k.values - - assert isinstance(k, np.ndarray), 'k must be array-like' + if not isinstance( + k, (int, float, np.ndarray, pd.Series, pd.DataFrame, xr.DataArray, xr.Dataset) + ): + raise TypeError( + f"k must be an int, float, np.ndarray, pd.Series, pd.DataFrame, xr.DataArray or xr.Dataset. Got: {type(k)}" + ) - l = 2*np.pi/k + l = 2 * np.pi / k return l -def wave_number(f, h, rho=1025, g=9.80665): +def wave_number(f, h, rho=1025, g=9.80665, to_pandas=True): """ Calculates wave number @@ -772,7 +1047,7 @@ def wave_number(f, h, rho=1025, g=9.80665): Parameters ----------- - f: numpy array + f: int, float, numpy ndarray, pandas DataFrame, pandas Series, xarray DataArray, or xarray Dataset Frequency [Hz] h: float Water depth [m] @@ -780,29 +1055,34 @@ def wave_number(f, h, rho=1025, g=9.80665): Water density [kg/m^3] g: float (optional) Gravitational acceleration [m/s^2] + to_pandas: bool (optional) + Flag to output pandas instead of xarray. Default = True. Returns ------- - k: pandas DataFrame + k: pandas DataFrame or xarray Dataset Wave number [1/m] indexed by frequency [Hz] """ - try: - f = np.atleast_1d(np.array(f)) - except: - pass - assert isinstance(f, np.ndarray), 'f must be of type np.ndarray' - assert isinstance(h, (int,float)), 'h must be of type int or float' - assert isinstance(rho, (int,float)), 'rho must be of type int or float' - assert isinstance(g, (int,float)), 'g must be of type int or float' - - w = 2*np.pi*f # angular frequency - xi = w/np.sqrt(g/h) # note: =h*wa/sqrt(h*g/h) - yi = xi*xi/np.power(1.0-np.exp(-np.power(xi,2.4908)),0.4015) - k0 = yi/h # Initial guess without current-wave interaction + if isinstance(f, (int, float)): + f = np.asarray([f]) + f = convert_to_dataarray(f) + if not isinstance(h, (int, float)): + raise TypeError(f"h must be of type int or float. 
Got: {type(h)}") + if not isinstance(rho, (int, float)): + raise TypeError(f"rho must be of type int or float. Got: {type(rho)}") + if not isinstance(g, (int, float)): + raise TypeError(f"g must be of type int or float. Got: {type(g)}") + if not isinstance(to_pandas, bool): + raise TypeError(f"to_pandas must be of type bool. Got: {type(to_pandas)}") + + w = 2 * np.pi * f # angular frequency + xi = w / np.sqrt(g / h) # note: =h*wa/sqrt(h*g/h) + yi = xi * xi / np.power(1.0 - np.exp(-np.power(xi, 2.4908)), 0.4015) + k0 = yi / h # Initial guess without current-wave interaction # Eq 11 in IEC 62600-101 using initial guess from Guo (2002) def func(kk): - val = np.power(w,2) - g*kk*np.tanh(kk*h) + val = np.power(w, 2) - g * kk * np.tanh(kk * h) return val mask = np.abs(func(k0)) > 1e-9 @@ -811,16 +1091,21 @@ def func(kk): w = w[mask] k, info, ier, mesg = _fsolve(func, k0_mask, full_output=True) - assert ier == 1, 'Wave number not found. ' + mesg + if not ier == 1: + raise ValueError("Wave number not found. 
" + mesg) k0[mask] = k - k = pd.DataFrame(k0, index=f, columns=['k']) + k0.name = "k" + k = k0.to_dataset() + + if to_pandas: + k = k.to_dataframe() return k def depth_regime(l, h, ratio=2): - ''' + """ Calculates the depth regime based on wavelength and height Deep water: h/l > ratio This function exists so sinh in wave celerity doesn't blow @@ -833,7 +1118,7 @@ def depth_regime(l, h, ratio=2): Parameters ---------- - l: array-like + l: int, float, np.ndarray, pd.Series, pd.DataFrame, xr.DataArray, xr.Dataset wavelength [m] h: float or int water column depth [m] @@ -842,20 +1127,29 @@ def depth_regime(l, h, ratio=2): Returns ------- - depth_reg: boolean or boolean array + depth_reg: boolean or boolean array-like Boolean True if deep water, False otherwise - ''' - - if isinstance(l, (int, float, list)): - l = np.array(l) - elif isinstance(l, pd.DataFrame): - l = l.squeeze().values - elif isinstance(l, pd.Series): - l = l.values - - assert isinstance(l, (np.ndarray)), "l must be array-like" - assert isinstance(h, (int, float)), "h must be of type int or float" - - depth_reg = h/l > ratio - - return depth_reg + """ + if not isinstance( + l, (int, float, np.ndarray, pd.Series, pd.DataFrame, xr.DataArray, xr.Dataset) + ): + raise TypeError( + f"l must be of type int, float, np.ndarray, pd.DataFrame, pd.Series, xr.DataArray, or xr.Dataset. Got: {type(l)}" + ) + if not isinstance(h, (int, float)): + raise TypeError(f"h must be of type int or float. Got: {type(h)}") + + depth_reg = h / l > ratio + + return depth_reg + + +def _transform_dataset(data, name): + # Converting data from a Dataset into a DataArray will turn the variables + # columns into a 'variable' dimension. 
+ # Converting it back to a dataset will keep this concise variable dimension + # but in the expected xr.Dataset/pd.DataFrame format + data = data.to_array() + data = convert_to_dataset(data, name=name) + data = data.rename({"variable": "index"}) + return data diff --git a/requirements-dev.txt b/requirements-dev.txt new file mode 100644 index 000000000..83e60c9dd --- /dev/null +++ b/requirements-dev.txt @@ -0,0 +1,4 @@ +# requirements-dev.txt +black +pylint +pytest diff --git a/requirements.txt b/requirements.txt index 01dcce300..b4f8bbe98 100644 --- a/requirements.txt +++ b/requirements.txt @@ -1,18 +1,18 @@ -pandas>=1.0.0, <=1.5.0 +pandas>=1.0.0 numpy>=1.21.0 scipy matplotlib requests -pecos>=0.1.9 +pecos>=0.3.0 fatpack lxml scikit-learn NREL-rex>=0.2.63 six>=1.13.0 h5py>=3.6.0 -h5pyd>=0.7.0, <=0.10.3 +h5pyd>=0.7.0 netCDF4>=1.5.8 -xarray<=2022.9.0 +xarray statsmodels bottleneck beautifulsoup4 diff --git a/setup.py b/setup.py index e68d1ef20..1c62eca5e 100644 --- a/setup.py +++ b/setup.py @@ -1,41 +1,43 @@ -from setuptools import setup, find_packages -from distutils.core import Extension import os import re +from setuptools import setup, find_packages -DISTNAME = 'mhkit' +DISTNAME = "mhkit" PACKAGES = find_packages() EXTENSIONS = [] -DESCRIPTION = 'Marine and Hydrokinetic Toolkit' -AUTHOR = 'MHKiT developers' -MAINTAINER_EMAIL = '' -LICENSE = 'Revised BSD' -URL = 'https://github.com/MHKiT-Software/mhkit-python' -CLASSIFIERS = ['Development Status :: 3 - Alpha', - 'Programming Language :: Python :: 3', - 'Topic :: Scientific/Engineering', - 'Intended Audience :: Science/Research', - 'Operating System :: OS Independent', - ] -DEPENDENCIES = ['pandas>=1.0.0, <=1.5.0', - 'numpy>=1.21.0', - 'scipy', - 'matplotlib', - 'requests', - 'pecos>=0.1.9', - 'fatpack', - 'lxml', - 'scikit-learn', - 'NREL-rex>=0.2.63', - 'six>=1.13.0', - 'h5py>=3.6.0', - 'h5pyd >=0.7.0, <=0.10.3', - 'netCDF4<=1.5.8', - 'xarray<=2022.9.0', - 'statsmodels', - 'pytz', - 'bottleneck', - 
'beautifulsoup4',] +DESCRIPTION = "Marine and Hydrokinetic Toolkit" +AUTHOR = "MHKiT developers" +MAINTAINER_EMAIL = "" +LICENSE = "Revised BSD" +URL = "https://github.com/MHKiT-Software/mhkit-python" +CLASSIFIERS = [ + "Development Status :: 3 - Alpha", + "Programming Language :: Python :: 3", + "Topic :: Scientific/Engineering", + "Intended Audience :: Science/Research", + "Operating System :: OS Independent", +] +DEPENDENCIES = [ + "pandas>=1.0.0", + "numpy>=1.21.0", + "scipy", + "matplotlib", + "requests", + "pecos>=0.3.0", + "fatpack", + "lxml", + "scikit-learn", + "NREL-rex>=0.2.63", + "six>=1.13.0", + "h5py>=3.6.0", + "h5pyd >=0.7.0", + "netCDF4", + "xarray", + "statsmodels", + "pytz", + "bottleneck", + "beautifulsoup4", +] LONG_DESCRIPTION = """ MHKiT-Python is a Python package designed for marine renewable energy applications to assist in @@ -70,29 +72,29 @@ # get version from __init__.py file_dir = os.path.abspath(os.path.dirname(__file__)) -with open(os.path.join(file_dir, 'mhkit', '__init__.py')) as f: +with open(os.path.join(file_dir, "mhkit", "__init__.py")) as f: version_file = f.read() - version_match = re.search(r"^__version__ = ['\"]([^'\"]*)['\"]", - version_file, re.M) + version_match = re.search(r"^__version__ = ['\"]([^'\"]*)['\"]", version_file, re.M) if version_match: VERSION = version_match.group(1) else: raise RuntimeError("Unable to find version string.") -setup(name=DISTNAME, - version=VERSION, - packages=PACKAGES, - ext_modules=EXTENSIONS, - description=DESCRIPTION, - long_description_content_type="text/markdown", - long_description=LONG_DESCRIPTION, - author=AUTHOR, - maintainer_email=MAINTAINER_EMAIL, - license=LICENSE, - url=URL, - classifiers=CLASSIFIERS, - zip_safe=False, - install_requires=DEPENDENCIES, - scripts=[], - include_package_data=True - ) +setup( + name=DISTNAME, + version=VERSION, + packages=PACKAGES, + ext_modules=EXTENSIONS, + description=DESCRIPTION, + long_description_content_type="text/markdown", + 
long_description=LONG_DESCRIPTION, + author=AUTHOR, + maintainer_email=MAINTAINER_EMAIL, + license=LICENSE, + url=URL, + classifiers=CLASSIFIERS, + zip_safe=False, + install_requires=DEPENDENCIES, + scripts=[], + include_package_data=True, +)