diff --git a/.environment.yml b/.environment.yml index 9897be9400..b8cf75c44e 100644 --- a/.environment.yml +++ b/.environment.yml @@ -4,69 +4,113 @@ channels: - conda-forge - defaults dependencies: - - ca-certificates=2021.10.8 - - certifi=2021.10.8 + - ca-certificates>=2021.10.8 + - certifi>=2021.10.8 - ipykernel - - libcxx=12.0.0 + - libcxx>=12.0.0 - libffi>=3.3 - - ncurses=6.3 + - ncurses>=6.4 - make=4.3 - - openssl=1.1.1q - - pip=21.2.4 - - python=3.9.13 - - python_abi=3.9 - - readline=8.1.2 - - libzlib=1.2.13 + - openssl>=1.1.1q + - pip>=21.2.4 + - python=3.10.12 + - python_abi=3.10 + - readline>=8.1.2 + - libzlib>=1.2.13 - rust=1.67.1 - setuptools=61.2.0 - sqlite>=3.38.3 - tk>=8.6.11 - - tzdata=2022a - - wheel=0.37.1 - - xz=5.2.5 + - tzdata>=2022a + - wheel>=0.37.1 + - xz>=5.2.5 - zlib>=1.2.12 - pip: - - alabaster==0.7.12 - - babel==2.10.1 - - charset-normalizer==2.0.12 - - docutils==0.17.1 - - idna==3.3 - - imagesize==1.3.0 - - importlib-metadata==4.11.3 - - jupyter==1.0.0 - - markdown-it-py==2.1.0 - - markupsafe==2.1.1 + - accessible-pygments==0.0.4 + - alabaster==0.7.13 + - appnope==0.1.3 + - asttokens==2.2.1 + - attrs==23.1.0 + - autodocsumm==0.2.11 + - Babel==2.12.1 + - backcall==0.2.0 + - beautifulsoup4==4.12.2 + - bleach==6.0.0 + - certifi==2023.5.7 + - charset-normalizer==3.1.0 + - contourpy==1.1.0 + - cycler==0.11.0 + - decorator==5.1.1 + - defusedxml==0.7.1 + - docutils==0.19 + - executing==1.2.0 + - fastjsonschema==2.17.1 + - fonttools==4.40.0 + - idna==3.4 + - imagesize==1.4.1 + - ipython==8.14.0 + - jedi==0.18.2 + - Jinja2==3.1.2 + - jsonpickle==3.0.1 + - jsonschema==4.17.3 + - jupyter_client==8.3.0 + - jupyter_core==5.3.1 + - jupyterlab-pygments==0.2.2 + - kiwisolver==1.4.4 + - MarkupSafe==2.1.3 - matplotlib==3.7.1 - - maturin==0.14.17 - - mdit-py-plugins==0.3.0 - - mdurl==0.1.1 - - myst-parser==0.17.2 + - matplotlib-inline==0.1.6 + - maturin==1.1.0 + - mistune==3.0.1 + - nbclient==0.8.0 + - nbconvert==7.6.0 + - nbformat==5.9.0 + - 
nbsphinx==0.9.2 + - networkx==3.1 + - numpy==1.25.0 - numpydoc==1.5.0 - - packaging==21.3 - - pandas==2.0.2 - - patchelf==0.17.2.1 - - poetry==1.2.0 - - pygments==2.12.0 - - pyparsing==3.0.8 - - pytz==2022.1 - - pyyaml==6.0 + - packaging==23.1 + - pandas==2.0.3 + - pandocfilters==1.5.0 + - parso==0.8.3 + - pexpect==4.8.0 + - pickleshare==0.7.5 + - Pillow==10.0.0 + - platformdirs==3.8.0 + - prompt-toolkit==3.0.39 + - ptyprocess==0.7.0 + - pure-eval==0.2.2 - pydata-sphinx-theme==0.13.3 + - Pygments==2.15.1 + - pyparsing==3.1.0 + - pyrsistent==0.19.3 + - python-dateutil==2.8.2 + - pytz==2023.3 - pyvis==0.3.2 - - requests==2.27.1 + - pyzmq==25.1.0 + - requests==2.31.0 + - six==1.16.0 - snowballstemmer==2.2.0 - - nbsphinx>=0.8.7 - - sphinx==4.5.0 - - sphinx-rtd-theme==1.0.0 - - sphinxcontrib-applehelp==1.0.2 - - sphinx_copybutton==0.5.2 + - soupsieve==2.4.1 + - Sphinx==6.2.1 + - sphinx-copybutton==0.5.2 + - sphinx-toggleprompt==0.4.0 - sphinx_design==0.4.1 + - sphinxcontrib-applehelp==1.0.4 - sphinxcontrib-devhelp==1.0.2 - - sphinxcontrib-htmlhelp==2.0.0 - - sphinx_toggleprompt==0.4.0 - - sphinx-tabs==3.4.0 + - sphinxcontrib-htmlhelp==2.0.1 - sphinxcontrib-jsmath==1.0.1 - sphinxcontrib-qthelp==1.0.3 - sphinxcontrib-serializinghtml==1.1.5 - - typing-extensions==4.2.0 - - urllib3==1.26.9 - - zipp==3.8.0 + - stack-data==0.6.2 + - tinycss2==1.2.1 + - tomli==2.0.1 + - tornado==6.3.2 + - traitlets==5.9.0 + - typing_extensions==4.7.1 + - tzdata==2023.3 + - urllib3==2.0.3 + - wcwidth==0.2.6 + - webencodings==0.5.1 + + diff --git a/.fleet/settings.json b/.fleet/settings.json new file mode 100644 index 0000000000..a7858d188f --- /dev/null +++ b/.fleet/settings.json @@ -0,0 +1,3 @@ +{ + "editor.guides": [] +} \ No newline at end of file diff --git a/.github/workflows/_release_python.yml b/.github/workflows/_release_python.yml index 0b2154a9a0..0fbc291f82 100644 --- a/.github/workflows/_release_python.yml +++ b/.github/workflows/_release_python.yml @@ -18,8 +18,7 @@ jobs: runs-on: 
ubuntu-latest strategy: matrix: - target: [x86_64, aarch64, armv7] - python: ['3.9', '3.10'] + target: [x86_64, aarch64] steps: - name: "Check if user has write access" uses: "lannonbr/repo-permission-check-action@2.0.0" @@ -43,16 +42,18 @@ jobs: ref: ${{ inputs.base }} - uses: actions/setup-python@v4 with: - python-version: ${{ matrix.python }} - - name: Setup QEMU - uses: docker/setup-qemu-action@v1 + python-version: | + 3.8 + 3.9 + 3.10 + 3.11 - name: Build wheels uses: PyO3/maturin-action@v1 with: working-directory: ./python command: build target: ${{ matrix.target }} - args: --release --out dist --find-interpreter + args: --release --out dist -i python3.7 -i python3.8 -i python3.9 -i python3.10 -i python3.11 manylinux: 2014 before-script-linux: | if [[ -f /etc/os-release ]]; then @@ -101,7 +102,6 @@ jobs: strategy: matrix: target: [x64] - python: ['3.9', '3.10'] steps: - name: "Check if user has write access" uses: "lannonbr/repo-permission-check-action@2.0.0" @@ -114,7 +114,11 @@ jobs: ref: ${{ inputs.base }} - uses: actions/setup-python@v4 with: - python-version: ${{ matrix.python }} + python-version: | + 3.8 + 3.9 + 3.10 + 3.11 architecture: ${{ matrix.target }} - name: Build wheels uses: PyO3/maturin-action@v1 @@ -122,7 +126,7 @@ jobs: working-directory: ./python command: build target: ${{ matrix.target }} - args: --release --out dist --find-interpreter + args: --release --out dist -i python3.7 -i python3.8 -i python3.9 -i python3.10 -i python3.11 - name: Upload wheels to gh artifact uses: actions/upload-artifact@v3 with: @@ -133,7 +137,6 @@ jobs: strategy: matrix: target: [x86_64, aarch64] - python: ['3.9', '3.10'] steps: - name: "Check if user has write access" uses: "lannonbr/repo-permission-check-action@2.0.0" @@ -157,7 +160,11 @@ jobs: ref: ${{ inputs.base }} - uses: actions/setup-python@v4 with: - python-version: ${{ matrix.python }} + python-version: | + 3.8 + 3.9 + 3.10 + 3.11 - name: Build wheels uses: PyO3/maturin-action@v1 with: diff --git 
a/.github/workflows/_release_rust.yml b/.github/workflows/_release_rust.yml index 925fb09d54..48d1fd59fa 100644 --- a/.github/workflows/_release_rust.yml +++ b/.github/workflows/_release_rust.yml @@ -61,27 +61,9 @@ jobs: with: command: publish args: --token ${{ secrets.CRATES_TOKEN }} --package raphtory --allow-dirty - - name: "Publish raphtory-io to crates.io" - if: ${{ !inputs.dry_run }} - uses: actions-rs/cargo@v1 - with: - command: publish - args: --token ${{ secrets.CRATES_TOKEN }} --package raphtory-io --allow-dirty - name: "Publish raphtory-graphql to crates.io" if: ${{ !inputs.dry_run }} uses: actions-rs/cargo@v1 with: command: publish args: --token ${{ secrets.CRATES_TOKEN }} --package raphtory-graphql --allow-dirty - - name: "Publish py-raphtory to crates.io" - if: ${{ !inputs.dry_run }} - uses: actions-rs/cargo@v1 - with: - command: publish - args: --token ${{ secrets.CRATES_TOKEN }} --package py-raphtory --allow-dirty - - name: "Publish raphtory-pymodule to crates.io" - if: ${{ !inputs.dry_run }} - uses: actions-rs/cargo@v1 - with: - command: publish - args: --token ${{ secrets.CRATES_TOKEN }} --package raphtory-pymodule --allow-dirty \ No newline at end of file diff --git a/.github/workflows/binder_auto_build.yml b/.github/workflows/binder_auto_build.yml index 1b5d2f8ddb..c91bffcdd3 100644 --- a/.github/workflows/binder_auto_build.yml +++ b/.github/workflows/binder_auto_build.yml @@ -11,6 +11,6 @@ jobs: steps: - uses: s-weigand/trigger-mybinder-build@v1 with: - target-repo: raphtory/raphtory + target-repo: pometry/raphtory service-name: gh use-default-build-servers: true diff --git a/.github/workflows/code_coverage.yml b/.github/workflows/code_coverage.yml index 59195e9bca..e41a7e8d65 100644 --- a/.github/workflows/code_coverage.yml +++ b/.github/workflows/code_coverage.yml @@ -51,7 +51,7 @@ jobs: with: command: clean - name: Run tests (rust) - run: cargo test -p raphtory + run: cargo test -p raphtory --features "io python" env: CARGO_INCREMENTAL: '0' 
RUSTFLAGS: '-Zprofile -Ccodegen-units=1 -Cinline-threshold=0 -Clink-dead-code -Coverflow-checks=off -Cpanic=abort -Zpanic_abort_tests' @@ -66,7 +66,7 @@ jobs: name: Run rust tests (rust-grcov) and collect coverage uses: actions-rs/grcov@v0.1.5 - name: Run python tests and collect coverage - run: pytest --cov=./ --cov-report=xml + run: cd python/tests && pytest --cov=./ --cov-report=xml - name: Codecov uses: codecov/codecov-action@v3.1.1 with: diff --git a/.github/workflows/rust_format_check.yml b/.github/workflows/rust_format_check.yml new file mode 100644 index 0000000000..6bf9353ffc --- /dev/null +++ b/.github/workflows/rust_format_check.yml @@ -0,0 +1,31 @@ +# this workflow checks out the code, and installs nightly build of cargo and runs a cargo +nightly fmt --all -- --check and fails workflow if any code is not formatted +# + +name: Rust format check +on: + workflow_call: + inputs: + fail_if_not_formatted: + type: boolean + default: true + required: false + description: "Fail the workflow if any code is not formatted" + +jobs: + rust-format-check: + runs-on: ubuntu-latest + steps: + - uses: actions/checkout@v2 + - name: Setup Rust + uses: actions-rs/toolchain@v1 + with: + toolchain: nightly + override: true + components: rustfmt + - name: Run rust format check + run: | + if [ ${{ inputs.fail_if_not_formatted }} == true ]; then + cargo +nightly fmt --all -- --check + else + cargo +nightly fmt --all -- --check || true + fi \ No newline at end of file diff --git a/.github/workflows/test.yml b/.github/workflows/test.yml index 9432888ca0..a7417ee399 100644 --- a/.github/workflows/test.yml +++ b/.github/workflows/test.yml @@ -3,9 +3,6 @@ on: push: branches: - master - pull_request: - branches: - - master concurrency: group: ${{ github.workflow }}-${{ github.event.pull_request.number || github.ref }} @@ -13,6 +10,9 @@ concurrency: jobs: + rust-format-check: + name: Rust format check + uses: ./.github/workflows/rust_format_check.yml 
call-test-rust-workflow-in-local-repo: name: Run Rust tests uses: ./.github/workflows/test_rust_workflow.yml @@ -20,6 +20,8 @@ jobs: call-test-python-workflow-in-local-repo: name: Run Python tests uses: ./.github/workflows/test_python_workflow.yml + with: + test_python_lower: true secrets: inherit call-benchmark-workflow-in-local-repo: name: Run benchmarks diff --git a/.github/workflows/test_during_pr.yml b/.github/workflows/test_during_pr.yml new file mode 100644 index 0000000000..2169067a6f --- /dev/null +++ b/.github/workflows/test_during_pr.yml @@ -0,0 +1,37 @@ +name: Run tests during PR +on: + pull_request: + branches: + - master + +concurrency: + group: ${{ github.workflow }}-${{ github.event.pull_request.number || github.ref }} + cancel-in-progress: true + + +jobs: + rust-format-check: + name: Rust format check + uses: ./.github/workflows/rust_format_check.yml + call-test-rust-workflow-in-local-repo: + name: Run Rust tests + uses: ./.github/workflows/test_rust_workflow.yml + secrets: inherit + needs: rust-format-check + call-test-python-workflow-in-local-repo: + name: Run Python tests + uses: ./.github/workflows/test_python_workflow.yml + with: + test_python_lower: false + secrets: inherit + needs: rust-format-check + call-benchmark-workflow-in-local-repo: + name: Run benchmarks + uses: ./.github/workflows/benchmark.yml + secrets: inherit + needs: rust-format-check + call-code-coverage: + name: Code Coverage + uses: ./.github/workflows/code_coverage.yml + needs: rust-format-check + diff --git a/.github/workflows/test_python_workflow.yml b/.github/workflows/test_python_workflow.yml index b4c95656ff..faa50cd0f4 100644 --- a/.github/workflows/test_python_workflow.yml +++ b/.github/workflows/test_python_workflow.yml @@ -6,14 +6,31 @@ on: type: boolean default: false required: false + test_python_lower: + type: boolean + default: false + required: false # DO NOT CHANGE NAME OF WORKFLOW, USED IN OTHER WORKFLOWS KEEP "Rust Tests" jobs: + select-strategy: + runs-on: 
ubuntu-latest + outputs: + python-versions: ${{ steps.set-matrix.outputs.python-versions }} + steps: + - id: set-matrix + run: | + if [ ${{ inputs.test_python_lower }} == true ]; then + echo "python-versions=[\"3.8\",\"3.11\"]" >> $GITHUB_OUTPUT + else + echo "python-versions=[\"3.8\"]" >> $GITHUB_OUTPUT + fi python-test: if: ${{ !inputs.skip_tests }} name: Python Tests + needs: select-strategy strategy: matrix: - python: ['3.9', '3.10'] + python: ${{ fromJson(needs.select-strategy.outputs.python-versions) }} os: [macos-latest, ubuntu-latest, windows-latest] runs-on: '${{ matrix.os }}' steps: @@ -55,6 +72,7 @@ jobs: run: | python -m pip install -q pytest networkx numpy seaborn pandas nbmake pytest-xdist matplotlib pyvis python -m pip install target/wheels/raphtory-*.whl + python -m pip install -e examples/custom_python_extension - name: Install Python dependencies (Windows) if: "contains(matrix.os, 'Windows')" run: | @@ -63,6 +81,10 @@ jobs: Get-ChildItem -Path $folder_path -Recurse -Include *.whl | ForEach-Object { python -m pip install "$($_.FullName)" } + python -m pip install -e examples/custom_python_extension - name: Run Python tests run: | cd python/tests && pytest --nbmake --nbmake-timeout=1200 . + - name: Run Python extension tests + run: | + cd examples/custom_python_extension/test && pytest . 
diff --git a/.github/workflows/test_rust_workflow.yml b/.github/workflows/test_rust_workflow.yml index 928b8ef762..e13ee211e5 100644 --- a/.github/workflows/test_rust_workflow.yml +++ b/.github/workflows/test_rust_workflow.yml @@ -30,8 +30,6 @@ jobs: ~/.cargo/registry/index/ ~/.cargo/registry/cache/ ~/.cargo/git/db/ - target/debug - target/release key: ${{ runner.os }}-cargo-${{ hashFiles('**/Cargo.lock') }} restore-keys: ${{ runner.os }}-cargo-${{ hashFiles('**/Cargo.lock') }} - uses: actions-rs/toolchain@v1 @@ -47,7 +45,7 @@ jobs: RUSTFLAGS: -Awarnings with: command: test - args: --all --no-default-features + args: --all --no-default-features --features "raphtory/io raphtory/python" doc-test: if: ${{ !inputs.skip_tests }} name: "Doc tests" @@ -68,8 +66,6 @@ jobs: ~/.cargo/registry/index/ ~/.cargo/registry/cache/ ~/.cargo/git/db/ - target/debug - target/release key: ${{ runner.os }}-cargo-${{ hashFiles('**/Cargo.lock') }} restore-keys: ${{ runner.os }}-cargo- - uses: actions-rs/toolchain@v1 diff --git a/.gitignore b/.gitignore index 3838651bdf..82b18e8c99 100644 --- a/.gitignore +++ b/.gitignore @@ -5,9 +5,11 @@ massif.* *.svg # this is for raphtory **/.env/ -**/data/* +comparison-benchmark/python/data/* .vscode docs/source/_rustdoc/* +docs/nx.html +docs/graph.html docs/build/* .DS_Store docs/logs/* @@ -22,3 +24,12 @@ examples/py/enron/emails.csv /docs/lib/ /docs/build/ docs/source/ +.env + +# Byte-compiled / optimized / DLL files +__pycache__/ +.pytest_cache/ +*.py[cod] + +# C extensions +*.so \ No newline at end of file diff --git a/.rustfmt.toml b/.rustfmt.toml new file mode 100644 index 0000000000..4c54ff0d8f --- /dev/null +++ b/.rustfmt.toml @@ -0,0 +1,2 @@ +#will enable when it is stable +imports_granularity = "Crate" \ No newline at end of file diff --git a/Cargo.lock b/Cargo.lock index 3d6745c3d9..ddd7631781 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -18,15 +18,44 @@ version = "1.0.2" source = "registry+https://github.com/rust-lang/crates.io-index" 
checksum = "f26201604c87b1e01bd3d98f8d5d9a8fcbb815e8cedb41ffccbeb4bf593a35fe" +[[package]] +name = "aes" +version = "0.8.3" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "ac1f845298e95f983ff1944b728ae08b8cebab80d684f0a832ed0fc74dfa27e2" +dependencies = [ + "cfg-if 1.0.0", + "cipher", + "cpufeatures", +] + +[[package]] +name = "ahash" +version = "0.8.3" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "2c99f64d1e06488f620f932677e24bc6e2897582980441ae90a671415bd7ec2f" +dependencies = [ + "cfg-if 1.0.0", + "getrandom 0.2.10", + "once_cell", + "version_check", +] + [[package]] name = "aho-corasick" -version = "1.0.1" +version = "1.0.2" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "67fc08ce920c31afb70f013dcce1bfc3a3195de6a228474e45e1f145b36f8d04" +checksum = "43f6cb1bf222025340178f382c426f13757b2960e89779dfcb319c32542a5a41" dependencies = [ "memchr", ] +[[package]] +name = "android-tzdata" +version = "0.1.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "e999941b234f3131b00bc13c22d06e8c5ff726d1b6318ac7eb276997bbb4fef0" + [[package]] name = "android_system_properties" version = "0.1.5" @@ -42,17 +71,101 @@ version = "0.1.6" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "4b46cbb362ab8752921c97e041f5e366ee6297bd428a31275b9fcf1e380f7299" +[[package]] +name = "anstream" +version = "0.3.2" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "0ca84f3628370c59db74ee214b3263d58f9aadd9b4fe7e711fd87dc452b7f163" +dependencies = [ + "anstyle", + "anstyle-parse", + "anstyle-query", + "anstyle-wincon", + "colorchoice", + "is-terminal", + "utf8parse", +] + +[[package]] +name = "anstyle" +version = "1.0.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "3a30da5c5f2d5e72842e00bcb57657162cdabef0931f40e2deb9b4140440cecd" + +[[package]] +name = "anstyle-parse" +version = "0.2.1" 
+source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "938874ff5980b03a87c5524b3ae5b59cf99b1d6bc836848df7bc5ada9643c333" +dependencies = [ + "utf8parse", +] + +[[package]] +name = "anstyle-query" +version = "1.0.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "5ca11d4be1bab0c8bc8734a9aa7bf4ee8316d462a08c6ac5052f888fef5b494b" +dependencies = [ + "windows-sys 0.48.0", +] + +[[package]] +name = "anstyle-wincon" +version = "1.0.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "180abfa45703aebe0093f79badacc01b8fd4ea2e35118747e5811127f926e188" +dependencies = [ + "anstyle", + "windows-sys 0.48.0", +] + +[[package]] +name = "arc-swap" +version = "1.6.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "bddcadddf5e9015d310179a59bb28c4d4b9920ad0f11e8e14dbadf654890c9a6" + +[[package]] +name = "arrow2" +version = "0.17.2" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "15ae0428d69ab31d7b2adad22a752d6f11fef2e901d2262d0cad4f5cb08b7093" +dependencies = [ + "ahash", + "bytemuck", + "chrono", + "dyn-clone", + "either", + "ethnum", + "foreign_vec", + "getrandom 0.2.10", + "hash_hasher", + "num-traits", + "rustc_version", + "simdutf8", +] + [[package]] name = "ascii_utils" version = "0.9.3" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "71938f30533e4d95a6d17aa530939da3842c2ab6f4f84b9dae68447e4129f74a" +[[package]] +name = "async-convert" +version = "1.0.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "6d416feee97712e43152cd42874de162b8f9b77295b1c85e5d92725cc8310bae" +dependencies = [ + "async-trait", +] + [[package]] name = "async-graphql" -version = "5.0.8" +version = "5.0.10" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "6ae09afb01514b3dbd6328547b2b11fcbcb0205d9c5e6f2e17e60cb166a82d7f" +checksum = 
"b35ef8f9be23ee30fe1eb1cf175c689bc33517c6c6d0fd0669dade611e5ced7f" dependencies = [ "async-graphql-derive", "async-graphql-parser", @@ -66,7 +179,7 @@ dependencies = [ "futures-util", "handlebars", "http", - "indexmap", + "indexmap 1.9.3", "mime", "multer", "num-traits", @@ -83,13 +196,13 @@ dependencies = [ [[package]] name = "async-graphql-derive" -version = "5.0.8" +version = "5.0.10" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "60ae62851dd3ff9a7550aee75e848e8834b75285b458753e98dd71d0733ad3f2" +checksum = "1a0f6ceed3640b4825424da70a5107e79d48d9b2bc6318dfc666b2fc4777f8c4" dependencies = [ "Inflector", "async-graphql-parser", - "darling", + "darling 0.14.4", "proc-macro-crate", "proc-macro2", "quote", @@ -99,9 +212,9 @@ dependencies = [ [[package]] name = "async-graphql-parser" -version = "5.0.8" +version = "5.0.10" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "9e6ee332acd99d2c50c3443beae46e9ed784c205eead9a668b7b5118b4a60a8b" +checksum = "ecc308cd3bc611ee86c9cf19182d2b5ee583da40761970e41207f088be3db18f" dependencies = [ "async-graphql-value", "pest", @@ -111,9 +224,9 @@ dependencies = [ [[package]] name = "async-graphql-poem" -version = "5.0.8" +version = "5.0.10" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "c714cf530b5b4d5dec0d177be059a76bcd6823824564f74254ce24a9fccee73b" +checksum = "68f818938d4e47dcc40bc383e9ddec373e9aab1db29e5ad9706b29621afe3b3f" dependencies = [ "async-graphql", "futures-util", @@ -124,14 +237,37 @@ dependencies = [ [[package]] name = "async-graphql-value" -version = "5.0.8" +version = "5.0.10" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "122da50452383410545b9428b579f4cda5616feb6aa0aff0003500c53fcff7b7" +checksum = "d461325bfb04058070712296601dfe5e5bd6cdff84780a0a8c569ffb15c87eb3" dependencies = [ "bytes", - "indexmap", + "indexmap 1.9.3", + "serde", + "serde_json", +] + +[[package]] +name = "async-openai" 
+version = "0.14.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "7614373e1d24d44f7b57df2125c5253c7afbf927574f2695371e5589a0dd4937" +dependencies = [ + "async-convert", + "backoff", + "base64 0.21.2", + "derive_builder", + "futures", + "rand 0.8.5", + "reqwest", + "reqwest-eventsource", "serde", "serde_json", + "thiserror", + "tokio", + "tokio-stream", + "tokio-util", + "tracing", ] [[package]] @@ -153,18 +289,18 @@ checksum = "16e62a023e7c117e27523144c5d2459f4397fcc3cab0085af8e2224f643a0193" dependencies = [ "proc-macro2", "quote", - "syn 2.0.15", + "syn 2.0.28", ] [[package]] name = "async-trait" -version = "0.1.68" +version = "0.1.73" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "b9ccdd8f2a161be9bd5c023df56f1b2a0bd1d83872ae53b71a84a12c9bf6e842" +checksum = "bc00ceb34980c03614e35a3a4e218276a0a824e911d07651cd0d858a51e8c0f0" dependencies = [ "proc-macro2", "quote", - "syn 2.0.15", + "syn 2.0.28", ] [[package]] @@ -184,6 +320,20 @@ version = "1.1.0" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "d468802bab17cbc0cc575e9b053f41e72aa36bfa6b7f55e3529ffa43161b97fa" +[[package]] +name = "backoff" +version = "0.4.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "b62ddb9cb1ec0a098ad4bbf9344d0713fa193ae1a80af55febcff2627b6a00c1" +dependencies = [ + "futures-core", + "getrandom 0.2.10", + "instant", + "pin-project-lite", + "rand 0.8.5", + "tokio", +] + [[package]] name = "base64" version = "0.13.1" @@ -192,9 +342,15 @@ checksum = "9e1b586273c5702936fe7b7d6896644d8be71e6314cfe09d3167c95f712589e8" [[package]] name = "base64" -version = "0.21.0" +version = "0.21.2" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "a4a4ddaa51a5bc52a6948f74c06d20aaaddb71924eab79b8c97a8c556e942d6a" +checksum = "604178f6c5c21f02dc555784810edfb88d34ac2c73b2eae109655649ee73ce3d" + +[[package]] +name = "base64ct" +version = "1.6.0" +source = 
"registry+https://github.com/rust-lang/crates.io-index" +checksum = "8c3c1a368f70d6cf7302d78f8f7093da241fb8e8807c05cc9e51a125895a6d5b" [[package]] name = "bincode" @@ -211,6 +367,21 @@ version = "1.3.2" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "bef38d45163c2f1dde094a7dfd33ccf595c92905c8f8f4fdc18d06fb1037718a" +[[package]] +name = "bitflags" +version = "2.3.3" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "630be753d4e58660abd17930c71b647fe46c27ea6b63cc59e1e3851406972e42" + +[[package]] +name = "bitpacking" +version = "0.8.4" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "a8c7d2ac73c167c06af4a5f37e6e59d84148d57ccbe4480b76f0273eefea82d7" +dependencies = [ + "crunchy", +] + [[package]] name = "block-buffer" version = "0.10.4" @@ -222,15 +393,29 @@ dependencies = [ [[package]] name = "bumpalo" -version = "3.12.1" +version = "3.13.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "9b1ce199063694f33ffb7dd4e0ee620741495c32833cde5aa08f02a0bf96f0c8" +checksum = "a3e2c3daef883ecc1b5d58c15adae93470a91d425f3532ba1695849656af3fc1" [[package]] name = "bytemuck" version = "1.13.1" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "17febce684fd15d89027105661fec94afb475cb995fbc59d2865198446ba2eea" +dependencies = [ + "bytemuck_derive", +] + +[[package]] +name = "bytemuck_derive" +version = "1.4.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "fdde5c9cd29ebd706ce1b35600920a33550e402fc998a2e53ad3b42c3c47a192" +dependencies = [ + "proc-macro2", + "quote", + "syn 2.0.28", +] [[package]] name = "byteorder" @@ -279,6 +464,15 @@ name = "cc" version = "1.0.79" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "50d30906286121d95be3d479533b458f87493b30a4b5f79a607db8f5d11aa91f" +dependencies = [ + "jobserver", +] + +[[package]] +name = "census" +version = "0.4.1" +source = 
"registry+https://github.com/rust-lang/crates.io-index" +checksum = "0fafee10a5dd1cffcb5cc560e0d0df8803d7355a2b12272e3557dee57314cb6e" [[package]] name = "cfg-if" @@ -294,25 +488,25 @@ checksum = "baf1de4339761588bc0619e3cbc0120ee582ebb74b53b4efbf79117bd2da40fd" [[package]] name = "chrono" -version = "0.4.24" +version = "0.4.26" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "4e3c5919066adf22df73762e50cffcde3a758f2a848b113b586d1f86728b673b" +checksum = "ec837a71355b28f6556dbd569b37b3f363091c0bd4b2e735674521b4c5fd9bc5" dependencies = [ + "android-tzdata", "iana-time-zone", "js-sys", - "num-integer", "num-traits", "serde", - "time", + "time 0.1.45", "wasm-bindgen", "winapi", ] [[package]] name = "ciborium" -version = "0.2.0" +version = "0.2.1" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "b0c137568cc60b904a7724001b35ce2630fd00d5d84805fbb608ab89509d788f" +checksum = "effd91f6c78e5a4ace8a5d3c0b6bfaec9e2baaef55f3efc00e45fb2e477ee926" dependencies = [ "ciborium-io", "ciborium-ll", @@ -321,32 +515,77 @@ dependencies = [ [[package]] name = "ciborium-io" -version = "0.2.0" +version = "0.2.1" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "346de753af073cc87b52b2083a506b38ac176a44cfb05497b622e27be899b369" +checksum = "cdf919175532b369853f5d5e20b26b43112613fd6fe7aee757e35f7a44642656" [[package]] name = "ciborium-ll" -version = "0.2.0" +version = "0.2.1" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "213030a2b5a4e0c0892b6652260cf6ccac84827b83a85a534e178e3906c4cf1b" +checksum = "defaa24ecc093c77630e6c15e17c51f5e187bf35ee514f4e2d67baaa96dae22b" dependencies = [ "ciborium-io", "half", ] +[[package]] +name = "cipher" +version = "0.4.4" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "773f3b9af64447d2ce9850330c473515014aa235e6a783b02db81ff39e4a3dad" +dependencies = [ + "crypto-common", + "inout", +] + [[package]] name = "clap" 
-version = "3.2.23" +version = "3.2.25" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "71655c45cb9845d3270c9d6df84ebe72b4dad3c2ba3f7023ad47c144e4e473a5" +checksum = "4ea181bf566f71cb9a5d17a59e1871af638180a18fb0035c92ae62b705207123" dependencies = [ - "bitflags", - "clap_lex", - "indexmap", + "bitflags 1.3.2", + "clap_lex 0.2.4", + "indexmap 1.9.3", "textwrap", ] +[[package]] +name = "clap" +version = "4.3.11" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "1640e5cc7fb47dbb8338fd471b105e7ed6c3cb2aeb00c2e067127ffd3764a05d" +dependencies = [ + "clap_builder", + "clap_derive", + "once_cell", +] + +[[package]] +name = "clap_builder" +version = "4.3.11" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "98c59138d527eeaf9b53f35a77fcc1fad9d883116070c63d5de1c7dc7b00c72b" +dependencies = [ + "anstream", + "anstyle", + "clap_lex 0.5.0", + "strsim", +] + +[[package]] +name = "clap_derive" +version = "4.3.2" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "b8cd2b2a819ad6eec39e8f1d6b53001af1e5469f8c177579cdaeb313115b825f" +dependencies = [ + "heck", + "proc-macro2", + "quote", + "syn 2.0.28", +] + [[package]] name = "clap_lex" version = "0.2.4" @@ -357,13 +596,24 @@ dependencies = [ ] [[package]] -name = "codespan-reporting" -version = "0.11.1" +name = "clap_lex" +version = "0.5.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "2da6da31387c7e4ef160ffab6d5e7f00c42626fe39aea70a7b0f1773f7dd6c1b" + +[[package]] +name = "colorchoice" +version = "1.0.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "3538270d33cc669650c4b093848450d380def10c331d38c768e34cac80576e6e" +checksum = "acbf1af155f9b9ef647e42cdc158db4b64a1b61f743629225fde6f3e0be2a7c7" + +[[package]] +name = "combine" +version = "4.6.6" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = 
"35ed6e9d84f0b51a7f52daf1c7d71dd136fd7a3f41a8462b8cdb8c78d920fad4" dependencies = [ - "termcolor", - "unicode-width", + "memchr", ] [[package]] @@ -376,6 +626,12 @@ dependencies = [ "wasm-bindgen", ] +[[package]] +name = "constant_time_eq" +version = "0.1.5" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "245097e9a4535ee1e3e3931fcfcd55a796a44c643e8596ff6566d68f09b87bbc" + [[package]] name = "core-foundation" version = "0.9.3" @@ -394,9 +650,9 @@ checksum = "e496a50fda8aacccc86d7529e2c1e0892dbd0f898a6b5645b5561b89c3210efa" [[package]] name = "cpufeatures" -version = "0.2.7" +version = "0.2.8" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "3e4c1eaa2012c47becbbad2ab175484c2a84d1185b566fb2cc5b8707343dfe58" +checksum = "03e69e28e9f7f77debdedbaafa2866e1de9ba56df55a8bd7cfc724c25a09987c" dependencies = [ "libc", ] @@ -420,7 +676,7 @@ dependencies = [ "atty", "cast", "ciborium", - "clap", + "clap 3.2.25", "criterion-plot", "itertools", "lazy_static", @@ -469,9 +725,9 @@ dependencies = [ [[package]] name = "crossbeam-epoch" -version = "0.9.14" +version = "0.9.15" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "46bd5f3f85273295a9d14aedfb86f6aadbff6d8f5295c4a9edb08e819dcf5695" +checksum = "ae211234986c545741a7dc064309f67ee1e5ad243d0e48335adc0484d960bcc7" dependencies = [ "autocfg", "cfg-if 1.0.0", @@ -482,13 +738,19 @@ dependencies = [ [[package]] name = "crossbeam-utils" -version = "0.8.15" +version = "0.8.16" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "3c063cd8cc95f5c377ed0d4b49a4b21f632396ff690e8470c29b3359b346984b" +checksum = "5a22b2d63d4d1dc0b7f1b6b2747dd0088008a9be28b6ddf0b1e7d335e3037294" dependencies = [ "cfg-if 1.0.0", ] +[[package]] +name = "crunchy" +version = "0.2.2" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "7a81dae078cea95a014a339291cec439d2f232ebe854a9d672b796c6afafa9b7" + [[package]] name = 
"crypto-common" version = "0.1.6" @@ -501,9 +763,9 @@ dependencies = [ [[package]] name = "csv" -version = "1.2.1" +version = "1.2.2" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "0b015497079b9a9d69c02ad25de6c0a6edef051ea6360a327d0bd05802ef64ad" +checksum = "626ae34994d3d8d668f4269922248239db4ae42d538b14c398b74a52208e8086" dependencies = [ "csv-core", "itoa", @@ -531,81 +793,60 @@ dependencies = [ ] [[package]] -name = "ctor" -version = "0.2.0" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "dd4056f63fce3b82d852c3da92b08ea59959890813a7f4ce9c0ff85b10cf301b" +name = "custom_python_extension" +version = "0.1.1" dependencies = [ - "quote", - "syn 2.0.15", + "pyo3", + "pyo3-build-config", + "raphtory", ] [[package]] -name = "cxx" -version = "1.0.94" +name = "darling" +version = "0.14.4" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "f61f1b6389c3fe1c316bf8a4dccc90a38208354b330925bce1f74a6c4756eb93" +checksum = "7b750cb3417fd1b327431a470f388520309479ab0bf5e323505daf0290cd3850" dependencies = [ - "cc", - "cxxbridge-flags", - "cxxbridge-macro", - "link-cplusplus", + "darling_core 0.14.4", + "darling_macro 0.14.4", ] [[package]] -name = "cxx-build" -version = "1.0.94" +name = "darling" +version = "0.20.3" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "12cee708e8962df2aeb38f594aae5d827c022b6460ac71a7a3e2c3c2aae5a07b" +checksum = "0209d94da627ab5605dcccf08bb18afa5009cfbef48d8a8b7d7bdbc79be25c5e" dependencies = [ - "cc", - "codespan-reporting", - "once_cell", - "proc-macro2", - "quote", - "scratch", - "syn 2.0.15", + "darling_core 0.20.3", + "darling_macro 0.20.3", ] [[package]] -name = "cxxbridge-flags" -version = "1.0.94" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "7944172ae7e4068c533afbb984114a56c46e9ccddda550499caa222902c7f7bb" - -[[package]] -name = "cxxbridge-macro" -version = "1.0.94" +name = "darling_core" 
+version = "0.14.4" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "2345488264226bf682893e25de0769f3360aac9957980ec49361b083ddaa5bc5" +checksum = "109c1ca6e6b7f82cc233a97004ea8ed7ca123a9af07a8230878fcfda9b158bf0" dependencies = [ + "fnv", + "ident_case", "proc-macro2", "quote", - "syn 2.0.15", -] - -[[package]] -name = "darling" -version = "0.14.4" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "7b750cb3417fd1b327431a470f388520309479ab0bf5e323505daf0290cd3850" -dependencies = [ - "darling_core", - "darling_macro", + "strsim", + "syn 1.0.109", ] [[package]] name = "darling_core" -version = "0.14.4" +version = "0.20.3" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "109c1ca6e6b7f82cc233a97004ea8ed7ca123a9af07a8230878fcfda9b158bf0" +checksum = "177e3443818124b357d8e76f53be906d60937f0d3a90773a664fa63fa253e621" dependencies = [ "fnv", "ident_case", "proc-macro2", "quote", "strsim", - "syn 1.0.109", + "syn 2.0.28", ] [[package]] @@ -614,11 +855,22 @@ version = "0.14.4" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "a4aab4dbc9f7611d8b55048a3a16d2d010c2c8334e46304b40ac1cc14bf3b48e" dependencies = [ - "darling_core", + "darling_core 0.14.4", "quote", "syn 1.0.109", ] +[[package]] +name = "darling_macro" +version = "0.20.3" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "836a9bbc7ad63342d6d6e7b815ccab164bc77a2d95d84bc3117a8c0d5c98e2d5" +dependencies = [ + "darling_core 0.20.3", + "quote", + "syn 2.0.28", +] + [[package]] name = "dashmap" version = "5.4.0" @@ -626,10 +878,11 @@ source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "907076dfda823b0b36d2a1bb5f90c96660a5bbcd7729e10727f07858f22c4edc" dependencies = [ "cfg-if 1.0.0", - "hashbrown", + "hashbrown 0.12.3", "lock_api", "once_cell", "parking_lot_core", + "serde", ] [[package]] @@ -651,6 +904,37 @@ version = "0.1.2" source = 
"registry+https://github.com/rust-lang/crates.io-index" checksum = "eaa37046cc0f6c3cc6090fbdbf73ef0b8ef4cfcc37f6befc0020f63e8cf121e1" +[[package]] +name = "derive_builder" +version = "0.12.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "8d67778784b508018359cbc8696edb3db78160bab2c2a28ba7f56ef6932997f8" +dependencies = [ + "derive_builder_macro", +] + +[[package]] +name = "derive_builder_core" +version = "0.12.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "c11bdc11a0c47bc7d37d582b5285da6849c96681023680b906673c5707af7b0f" +dependencies = [ + "darling 0.14.4", + "proc-macro2", + "quote", + "syn 1.0.109", +] + +[[package]] +name = "derive_builder_macro" +version = "0.12.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "ebcda35c7a396850a55ffeac740804b40ffec779b98fffbb1738f4033f0ee79e" +dependencies = [ + "derive_builder_core", + "syn 1.0.109", +] + [[package]] name = "diff" version = "0.1.13" @@ -659,19 +943,20 @@ checksum = "56254986775e3233ffa9c4d7d3faaf6d36a2c09d30b20687e9f88bc8bafc16c8" [[package]] name = "digest" -version = "0.10.6" +version = "0.10.7" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "8168378f4e5023e7218c89c891c0fd8ecdb5e5e4f18cb78f38cf245dd021e76f" +checksum = "9ed9a281f7bc9b7576e61468ba615a66a5c8cfdff42420a70aa82701a3b1e292" dependencies = [ "block-buffer", "crypto-common", + "subtle", ] [[package]] name = "display-error-chain" -version = "0.1.1" +version = "0.2.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "7e1a8646b2c125eeb9a84ef0faa6d2d102ea0d5da60b824ade2743263117b848" +checksum = "f77af9e75578c1ab34f5f04545a8b05be0c36fbd7a9bb3cf2d2a971e435fdbb9" [[package]] name = "dotenv" @@ -679,6 +964,18 @@ version = "0.15.0" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "77c90badedccf4105eca100756a0b1289e191f6fcbdadd3cee1d2f614f97da8f" +[[package]] +name = 
"downcast-rs" +version = "1.2.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "9ea835d29036a4087793836fa931b08837ad5e957da9e23886b29586fb9b6650" + +[[package]] +name = "dyn-clone" +version = "1.0.11" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "68b0cf012f1230e43cd00ebb729c6bb58707ecfa8ad08b52ef3a4ccd2697fc30" + [[package]] name = "dynamic-graphql" version = "0.7.3" @@ -697,7 +994,7 @@ source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "1c547074a568bfe79c9858a4be0ba42abb18b21f9ddfee44b3c83b96a24d7ef7" dependencies = [ "Inflector", - "darling", + "darling 0.14.4", "proc-macro-crate", "proc-macro2", "quote", @@ -720,6 +1017,18 @@ dependencies = [ "cfg-if 1.0.0", ] +[[package]] +name = "enum_dispatch" +version = "0.3.11" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "11f36e95862220b211a6e2aa5eca09b4fa391b13cd52ceb8035a24bf65a79de2" +dependencies = [ + "once_cell", + "proc-macro2", + "quote", + "syn 1.0.109", +] + [[package]] name = "env_logger" version = "0.7.1" @@ -740,6 +1049,12 @@ dependencies = [ "regex", ] +[[package]] +name = "equivalent" +version = "1.0.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "88bffebc5d80432c9b140ee17875ff173a8ab62faad5b257da912bd2f6c1c0a1" + [[package]] name = "errno" version = "0.3.1" @@ -761,20 +1076,47 @@ dependencies = [ "libc", ] +[[package]] +name = "ethnum" +version = "1.3.2" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "0198b9d0078e0f30dedc7acbb21c974e838fc8fae3ee170128658a98cb2c1c04" + +[[package]] +name = "eventsource-stream" +version = "0.2.3" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "74fef4569247a5f429d9156b9d0a2599914385dd189c539334c625d8099d90ab" +dependencies = [ + "futures-core", + "nom", + "pin-project-lite", +] + [[package]] name = "examples" -version = "0.4.0" +version = "0.5.7" dependencies = 
[ "chrono", "itertools", "rand 0.8.5", "raphtory", - "raphtory-io", "rayon", "regex", "serde", ] +[[package]] +name = "fail" +version = "0.5.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "fe5e43d0f78a42ad591453aedb1d7ae631ce7ee445c7643691055a9ed8d3b01c" +dependencies = [ + "log", + "once_cell", + "rand 0.8.5", +] + [[package]] name = "fast_chemail" version = "0.9.6" @@ -784,6 +1126,12 @@ dependencies = [ "ascii_utils", ] +[[package]] +name = "fastdivide" +version = "0.4.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "25c7df09945d65ea8d70b3321547ed414bbc540aad5bac6883d021b970f35b04" + [[package]] name = "fastrand" version = "1.9.0" @@ -793,11 +1141,23 @@ dependencies = [ "instant", ] +[[package]] +name = "filetime" +version = "0.2.21" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "5cbc844cecaee9d4443931972e1289c8ff485cb4cc2767cb03ca139ed6885153" +dependencies = [ + "cfg-if 1.0.0", + "libc", + "redox_syscall 0.2.16", + "windows-sys 0.48.0", +] + [[package]] name = "flate2" -version = "1.0.25" +version = "1.0.26" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "a8a2db397cb1c8772f31494cb8917e48cd1e64f0fa7efac59fbd741a0a8ce841" +checksum = "3b9429470923de8e8cbd4d2dc513535400b4b3fef0319fb5c4e1f520a7bef743" dependencies = [ "crc32fast", "miniz_oxide", @@ -813,7 +1173,7 @@ dependencies = [ "futures-sink", "nanorand", "pin-project", - "spin", + "spin 0.9.8", ] [[package]] @@ -837,15 +1197,31 @@ version = "0.1.1" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "00b0228411908ca8685dba7fc2cdd70ec9990a6e753e89b6ac91a84c40fbaf4b" +[[package]] +name = "foreign_vec" +version = "0.1.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "ee1b05cbd864bcaecbd3455d6d967862d446e4ebfc3c2e5e5b9841e53cba6673" + [[package]] name = "form_urlencoded" -version = "1.1.0" +version = "1.2.0" source = 
"registry+https://github.com/rust-lang/crates.io-index" -checksum = "a9c384f161156f5260c24a097c56119f9be8c798586aecc13afbcbe7b7e26bf8" +checksum = "a62bc1cf6f830c2ec14a513a9fb124d0a213a629668a4186f329db21fe045652" dependencies = [ "percent-encoding", ] +[[package]] +name = "fs4" +version = "0.6.6" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "2eeb4ed9e12f43b7fa0baae3f9cdda28352770132ef2e09a23760c29cae8bd47" +dependencies = [ + "rustix 0.38.2", + "windows-sys 0.48.0", +] + [[package]] name = "fuchsia-cprng" version = "0.1.1" @@ -909,7 +1285,7 @@ checksum = "89ca545a94061b6365f2c7355b4b32bd20df3ff95f02da9329b34ccc3bd6ee72" dependencies = [ "proc-macro2", "quote", - "syn 2.0.15", + "syn 2.0.28", ] [[package]] @@ -924,6 +1300,12 @@ version = "0.3.28" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "76d3d132be6c0e6aa1534069c705a74a5997a356c0dc2f86a47765e5617c5b65" +[[package]] +name = "futures-timer" +version = "3.0.2" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "e64b03909df88034c26dc1547e8970b91f98bdb65165d6a4e9110d94263dbb2c" + [[package]] name = "futures-util" version = "0.3.28" @@ -972,6 +1354,19 @@ dependencies = [ "syn 1.0.109", ] +[[package]] +name = "generator" +version = "0.7.5" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "5cc16584ff22b460a382b7feec54b23d2908d858152e5739a120b949293bd74e" +dependencies = [ + "cc", + "libc", + "log", + "rustversion", + "windows", +] + [[package]] name = "generic-array" version = "0.14.7" @@ -995,9 +1390,9 @@ dependencies = [ [[package]] name = "getrandom" -version = "0.2.9" +version = "0.2.10" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "c85e1d9ab2eadba7e5040d4e09cbd6d072b76a557ad64e797c2cb9d4da21d7e4" +checksum = "be4136b2a15dd319360be1c07d9933517ccf0be8f16bf62a3bee4f0d618df427" dependencies = [ "cfg-if 1.0.0", "js-sys", @@ -1014,14 +1409,14 @@ checksum = 
"e77ac7b51b8e6313251737fcef4b1c01a2ea102bde68415b62c0ee9268fec357" dependencies = [ "proc-macro2", "quote", - "syn 2.0.15", + "syn 2.0.28", ] [[package]] name = "h2" -version = "0.3.18" +version = "0.3.20" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "17f8a914c2987b688368b5138aa05321db91f4090cf26118185672ad588bce21" +checksum = "97ec8491ebaf99c8eaa73058b045fe58073cd6be7f596ac993ced0b0a0c01049" dependencies = [ "bytes", "fnv", @@ -1029,7 +1424,7 @@ dependencies = [ "futures-sink", "futures-util", "http", - "indexmap", + "indexmap 1.9.3", "slab", "tokio", "tokio-util", @@ -1056,12 +1451,33 @@ dependencies = [ "thiserror", ] +[[package]] +name = "hash_hasher" +version = "2.0.3" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "74721d007512d0cb3338cd20f0654ac913920061a4c4d0d8708edb3f2a698c0c" + [[package]] name = "hashbrown" version = "0.12.3" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "8a9ee70c43aaf417c914396645a0fa852624801b24ebb7ae78fe8272889ac888" +[[package]] +name = "hashbrown" +version = "0.13.2" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "43a3c133739dddd0d2990f9a4bdf8eb4b21ef50e4851ca85ab661199821d510e" +dependencies = [ + "ahash", +] + +[[package]] +name = "hashbrown" +version = "0.14.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "2c6201b9ff9fd90a5a3bac2e56a830d0caa509576f0e503818ee82c181b3437a" + [[package]] name = "headers" version = "0.3.8" @@ -1069,7 +1485,7 @@ source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "f3e372db8e5c0d213e0cd0b9be18be2aca3d44cf2fe30a9d46a65581cd454584" dependencies = [ "base64 0.13.1", - "bitflags", + "bitflags 1.3.2", "bytes", "headers-core", "http", @@ -1087,6 +1503,12 @@ dependencies = [ "http", ] +[[package]] +name = "heck" +version = "0.4.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = 
"95505c38b4572b2d910cecb0281560f54b440a19336cbbcb27bf6ce6adc6f5a8" + [[package]] name = "hermit-abi" version = "0.1.19" @@ -1111,6 +1533,27 @@ version = "0.3.1" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "fed44880c466736ef9a5c5b5facefb5ed0785676d0c02d612db14e54f0d84286" +[[package]] +name = "hex" +version = "0.4.3" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "7f24254aa9a54b5c858eaee2f5bccdb46aaf0e486a595ed5fd8f86ba55232a70" + +[[package]] +name = "hmac" +version = "0.12.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "6c49c37c09c17a53d937dfbb742eb3a961d65a994e6bcdcf37e7399d0cc8ab5e" +dependencies = [ + "digest", +] + +[[package]] +name = "htmlescape" +version = "0.3.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "e9025058dae765dee5070ec375f591e2ba14638c63feff74f13805a72e523163" + [[package]] name = "http" version = "0.2.9" @@ -1147,9 +1590,9 @@ checksum = "c4a1e36c821dbe04574f602848a19f742f4fb3c98d40449f11bcad18d6b17421" [[package]] name = "hyper" -version = "0.14.26" +version = "0.14.27" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "ab302d72a6f11a3b910431ff93aae7e773078c769f0a3ef15fb9ec692ed147d4" +checksum = "ffb1cfd654a8219eaef89881fdb3bb3b1cdc5fa75ded05d6933b2b382e395468" dependencies = [ "bytes", "futures-channel", @@ -1169,6 +1612,20 @@ dependencies = [ "want", ] +[[package]] +name = "hyper-rustls" +version = "0.24.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "8d78e1e73ec14cf7375674f74d7dde185c8206fd9dea6fb6295e8a98098aaa97" +dependencies = [ + "futures-util", + "http", + "hyper", + "rustls", + "tokio", + "tokio-rustls", +] + [[package]] name = "hyper-tls" version = "0.5.0" @@ -1184,9 +1641,9 @@ dependencies = [ [[package]] name = "iana-time-zone" -version = "0.1.56" +version = "0.1.57" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum 
= "0722cd7114b7de04316e7ea5456a0bbb20e4adb46fd27a3697adb812cff0f37c" +checksum = "2fad5b825842d2b38bd206f3e81d6957625fd7f0a361e345c30e01a0ae2dd613" dependencies = [ "android_system_properties", "core-foundation-sys", @@ -1198,12 +1655,11 @@ dependencies = [ [[package]] name = "iana-time-zone-haiku" -version = "0.1.1" +version = "0.1.2" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "0703ae284fc167426161c2e3f1da3ea71d94b21bedbcc9494e92b28e334e3dca" +checksum = "f31827a206f56af32e590ba56d5d2d085f558508192593743f16b2306495269f" dependencies = [ - "cxx", - "cxx-build", + "cc", ] [[package]] @@ -1214,9 +1670,9 @@ checksum = "b9e0384b61958566e926dc50660321d12159025e767c18e043daf26b70104c39" [[package]] name = "idna" -version = "0.3.0" +version = "0.4.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "e14ddfc70884202db2244c223200c204c2bda1bc6e0998d11b5e024d657209e6" +checksum = "7d20d6b07bfbc108882d88ed8e37d39636dcc260e15e30c45e6ba089610b917c" dependencies = [ "unicode-bidi", "unicode-normalization", @@ -1229,7 +1685,18 @@ source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "bd070e393353796e801d209ad339e89596eb4c8d430d18ede6a1cced8fafbd99" dependencies = [ "autocfg", - "hashbrown", + "hashbrown 0.12.3", + "serde", +] + +[[package]] +name = "indexmap" +version = "2.0.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "d5477fe2230a79769d8dc68e0eabf5437907c0457a5614a9e8dddb67f65eb65d" +dependencies = [ + "equivalent", + "hashbrown 0.14.0", "serde", ] @@ -1239,6 +1706,15 @@ version = "1.0.9" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "bfa799dd5ed20a7e349f3b4639aa80d74549c81716d9ec4f994c9b5815598306" +[[package]] +name = "inout" +version = "0.1.3" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "a0c10553d664a4d0bcff9f4215d0aac67a639cc68ef660840afe309b807bc9f5" +dependencies = [ + "generic-array", +] + 
[[package]] name = "instant" version = "0.1.12" @@ -1246,6 +1722,9 @@ source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "7a5bbe824c507c5da5956355e86a746d82e0e1464f65d862cc5e71da70e94b2c" dependencies = [ "cfg-if 1.0.0", + "js-sys", + "wasm-bindgen", + "web-sys", ] [[package]] @@ -1256,19 +1735,18 @@ checksum = "8bb03732005da905c88227371639bf1ad885cc712789c011c31c5fb3ab3ccf02" [[package]] name = "inventory" -version = "0.3.5" +version = "0.3.6" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "7741301a6d6a9b28ce77c0fb77a4eb116b6bc8f3bef09923f7743d059c4157d3" +checksum = "e0539b5de9241582ce6bd6b0ba7399313560151e58c9aaf8b74b711b1bdce644" dependencies = [ - "ctor 0.2.0", "ghost", ] [[package]] name = "io-lifetimes" -version = "1.0.10" +version = "1.0.11" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "9c66c74d2ae7e79a5a8f7ac924adbe38ee42a859c6539ad869eb51f0b52dc220" +checksum = "eae7b9aee968036d54dce06cebaefd919e4472e753296daccd6d344e3e2df0c2" dependencies = [ "hermit-abi 0.3.1", "libc", @@ -1277,9 +1755,20 @@ dependencies = [ [[package]] name = "ipnet" -version = "2.7.2" +version = "2.8.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "12b6ee2129af8d4fb011108c73d99a1b83a85977f23b82460c0ae2e25bb4b57f" +checksum = "28b29a3cd74f0f4598934efe3aeba42bae0eb4680554128851ebbecb02af14e6" + +[[package]] +name = "is-terminal" +version = "0.4.9" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "cb0889898416213fab133e1d33a0e5858a48177452750691bde3666d0fdbaf8b" +dependencies = [ + "hermit-abi 0.3.1", + "rustix 0.38.2", + "windows-sys 0.48.0", +] [[package]] name = "itertools" @@ -1296,14 +1785,25 @@ version = "1.0.6" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "453ad9f582a441959e5f0d088b02ce04cfe8d51a8eaf077f12ac6d3e94164ca6" +[[package]] +name = "jobserver" +version = "0.1.26" +source = 
"registry+https://github.com/rust-lang/crates.io-index" +checksum = "936cfd212a0155903bcbc060e316fb6cc7cbf2e1907329391ebadc1fe0ce77c2" +dependencies = [ + "libc", +] + [[package]] name = "js-raphtory" -version = "0.4.0" +version = "0.5.7" dependencies = [ "chrono", "console_error_panic_hook", "js-sys", "raphtory", + "serde", + "serde-wasm-bindgen", "wasm-bindgen", "wasm-bindgen-test", "wee_alloc", @@ -1311,51 +1811,64 @@ dependencies = [ [[package]] name = "js-sys" -version = "0.3.63" +version = "0.3.64" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "2f37a4a5928311ac501dee68b3c7613a1037d0edb30c8e5427bd832d55d1b790" +checksum = "c5f195fe497f702db0f318b07fdd68edb16955aed830df8363d837542f8f935a" dependencies = [ "wasm-bindgen", ] +[[package]] +name = "kdam" +version = "0.4.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "eec124c5ef865373afd03f7900161495339c59cef395a6dc45d025bcd6499b0b" +dependencies = [ + "terminal_size", + "windows-sys 0.48.0", +] + [[package]] name = "lazy_static" version = "1.4.0" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "e2abad23fbc42b3700f2f279844dc832adb2b2eb069b2df918f455c4e18cc646" +[[package]] +name = "levenshtein_automata" +version = "0.2.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "0c2cdeb66e45e9f36bfad5bbdb4d2384e70936afbee843c6f6543f0c551ebb25" + [[package]] name = "libc" -version = "0.2.142" +version = "0.2.147" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "6a987beff54b60ffa6d51982e1aa1146bc42f19bd26be28b0586f252fccf5317" +checksum = "b4668fb0ea861c1df094127ac5f1da3409a82116a4ba74fca2e58ef927159bb3" [[package]] name = "libm" -version = "0.2.6" +version = "0.2.7" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "348108ab3fba42ec82ff6e9564fc4ca0247bdccdc68dd8af9764bbc79c3c8ffb" +checksum = 
"f7012b1bbb0719e1097c47611d3898568c546d597c2e74d66f6087edd5233ff4" [[package]] -name = "link-cplusplus" -version = "1.0.8" +name = "linux-raw-sys" +version = "0.3.8" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "ecd207c9c713c34f95a097a5b029ac2ce6010530c7b49d7fea24d977dede04f5" -dependencies = [ - "cc", -] +checksum = "ef53942eb7bf7ff43a617b3e2c1c4a5ecf5944a7c1bc12d7ee39bbb15e5c1519" [[package]] name = "linux-raw-sys" -version = "0.3.7" +version = "0.4.3" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "ece97ea872ece730aed82664c424eb4c8291e1ff2480247ccf7409044bc6479f" +checksum = "09fc20d2ca12cb9f044c93e3bd6d32d523e6e2ec3db4f7b2939cd99026ecd3f0" [[package]] name = "lock_api" -version = "0.4.9" +version = "0.4.10" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "435011366fe56583b16cf956f9df0095b405b82d76425bc8981c0e22e60ec4df" +checksum = "c1cc9717a20b1bb222f333e6a92fd32f7d8a18ddc5a3191a11af45dcbf4dcd16" dependencies = [ "autocfg", "scopeguard", @@ -1364,13 +1877,39 @@ dependencies = [ [[package]] name = "log" -version = "0.4.17" +version = "0.4.19" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "b06a4cde4c0f271a446782e3eff8de789548ce57dbc8eca9292c27f4a42004b4" + +[[package]] +name = "loom" +version = "0.5.6" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "abb12e687cfb44aa40f41fc3978ef76448f9b6038cad6aef4259d3c095a2382e" +checksum = "ff50ecb28bb86013e935fb6683ab1f6d3a20016f123c76fd4c27470076ac30f5" dependencies = [ "cfg-if 1.0.0", + "generator", + "pin-utils", + "scoped-tls", + "tracing", + "tracing-subscriber", ] +[[package]] +name = "lru" +version = "0.10.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "718e8fae447df0c7e1ba7f5189829e63fd536945c8988d61444c19039f16b670" +dependencies = [ + "hashbrown 0.13.2", +] + +[[package]] +name = "lz4_flex" +version = "0.10.0" +source = 
"registry+https://github.com/rust-lang/crates.io-index" +checksum = "8b8c72594ac26bfd34f2d99dfced2edfaddfe8a476e3ff2ca0eb293d925c4f83" + [[package]] name = "matchers" version = "0.1.0" @@ -1380,17 +1919,36 @@ dependencies = [ "regex-automata", ] +[[package]] +name = "measure_time" +version = "0.8.2" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "56220900f1a0923789ecd6bf25fbae8af3b2f1ff3e9e297fc9b6b8674dd4d852" +dependencies = [ + "instant", + "log", +] + [[package]] name = "memchr" version = "2.5.0" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "2dffe52ecf27772e601905b7522cb4ef790d2cc203488bbd0e2fe85fcb74566d" +[[package]] +name = "memmap2" +version = "0.6.2" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "6d28bba84adfe6646737845bc5ebbfa2c08424eb1c37e94a1fd2a82adb56a872" +dependencies = [ + "libc", +] + [[package]] name = "memoffset" -version = "0.8.0" +version = "0.9.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "d61c719bcfbcf5d62b3a09efa6088de8c54bc0bfcd3ea7ae39fcc186108b8de1" +checksum = "5a634b1c61a95585bd15607c6ab0c4e5b226e695ff2800ba0cdccddf208c406c" dependencies = [ "autocfg", ] @@ -1407,25 +1965,40 @@ version = "0.3.17" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "6877bb514081ee2a7ff5ef9de3281f14a4dd4bceac4c09388074a6b5df8a139a" +[[package]] +name = "mime_guess" +version = "2.0.4" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "4192263c238a5f0d0c6bfd21f336a313a4ce1c450542449ca191bb657b4642ef" +dependencies = [ + "mime", + "unicase", +] + +[[package]] +name = "minimal-lexical" +version = "0.2.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "68354c5c6bd36d73ff3feceb05efa59b6acb7626617f4962be322a825e61f79a" + [[package]] name = "miniz_oxide" -version = "0.6.2" +version = "0.7.1" source = 
"registry+https://github.com/rust-lang/crates.io-index" -checksum = "b275950c28b37e794e8c55d88aeb5e139d0ce23fdbbeda68f8d7174abdf9e8fa" +checksum = "e7810e0be55b428ada41041c41f32c9f1a42817901b4ccf45fa3d4b6561e74c7" dependencies = [ "adler", ] [[package]] name = "mio" -version = "0.8.6" +version = "0.8.8" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "5b9d9a46eff5b4ff64b45a9e316a6d1e0bc719ef429cbec4dc630684212bfdf9" +checksum = "927a765cd3fc26206e66b296465fa9d3e5ab003e651c1b3c060e7956d96b19d2" dependencies = [ "libc", - "log", "wasi 0.11.0+wasi-snapshot-preview1", - "windows-sys 0.45.0", + "windows-sys 0.48.0", ] [[package]] @@ -1442,17 +2015,23 @@ dependencies = [ "log", "memchr", "mime", - "spin", + "spin 0.9.8", "version_check", ] +[[package]] +name = "murmurhash32" +version = "0.3.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "d9380db4c04d219ac5c51d14996bbf2c2e9a15229771b53f8671eb6c83cf44df" + [[package]] name = "nanorand" version = "0.7.0" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "6a51313c5820b0b02bd422f4b44776fbf47961755c74ce64afc73bfad10226c3" dependencies = [ - "getrandom 0.2.9", + "getrandom 0.2.10", ] [[package]] @@ -1475,9 +2054,9 @@ dependencies = [ [[package]] name = "neo4rs" -version = "0.6.0" +version = "0.6.1" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "243f7625e3622d7d51e419be402a64502c202bdc33a40b9fb792aa0868490c2c" +checksum = "b7d3e9f28d52b1cde4bbbdd52f1e3c257f9050e34207880f3f1724179648244a" dependencies = [ "async-trait", "bytes", @@ -1486,8 +2065,12 @@ dependencies = [ "futures", "log", "neo4rs-macros", + "pin-project-lite", "thiserror", "tokio", + "tokio-rustls", + "url", + "webpki-roots", ] [[package]] @@ -1500,6 +2083,16 @@ dependencies = [ "syn 1.0.109", ] +[[package]] +name = "nom" +version = "7.1.3" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = 
"d273983c5a657a70a3e8f2a01329822f3b8c8172b73826411a55751e404a0a4a" +dependencies = [ + "memchr", + "minimal-lexical", +] + [[package]] name = "nu-ansi-term" version = "0.46.0" @@ -1599,9 +2192,18 @@ dependencies = [ [[package]] name = "once_cell" -version = "1.17.2" +version = "1.18.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "dd8b5dd2ae5ed71462c540258bedcb51965123ad7e7ccf4b9a8cafaa4a63576d" + +[[package]] +name = "oneshot" +version = "0.1.5" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "9670a07f94779e00908f3e686eab508878ebb390ba6e604d3a284c00e8d0487b" +checksum = "fc22d22931513428ea6cc089e942d38600e3d00976eef8c86de6b8a3aadec6eb" +dependencies = [ + "loom", +] [[package]] name = "oorandom" @@ -1611,11 +2213,11 @@ checksum = "0ab1bc2a289d34bd04a330323ac98a1b4bc82c9d9fcb1e66b63caa84da26b575" [[package]] name = "openssl" -version = "0.10.52" +version = "0.10.55" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "01b8574602df80f7b85fdfc5392fa884a4e3b3f4f35402c070ab34c3d3f78d56" +checksum = "345df152bc43501c5eb9e4654ff05f794effb78d4efe3d53abc158baddc0703d" dependencies = [ - "bitflags", + "bitflags 1.3.2", "cfg-if 1.0.0", "foreign-types", "libc", @@ -1632,7 +2234,7 @@ checksum = "a948666b637a0f465e8564c73e89d4dde00d72d4d473cc972f390fc3dcee7d9c" dependencies = [ "proc-macro2", "quote", - "syn 2.0.15", + "syn 2.0.28", ] [[package]] @@ -1643,18 +2245,18 @@ checksum = "ff011a302c396a5197692431fc1948019154afc178baf7d8e37367442a4601cf" [[package]] name = "openssl-src" -version = "111.25.3+1.1.1t" +version = "111.26.0+1.1.1u" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "924757a6a226bf60da5f7dd0311a34d2b52283dd82ddeb103208ddc66362f80c" +checksum = "efc62c9f12b22b8f5208c23a7200a442b2e5999f8bdf80233852122b5a4f6f37" dependencies = [ "cc", ] [[package]] name = "openssl-sys" -version = "0.9.87" +version = "0.9.90" source = 
"registry+https://github.com/rust-lang/crates.io-index" -checksum = "8e17f59264b2809d77ae94f0e1ebabc434773f370d6ca667bd223ea10e06cc7e" +checksum = "374533b0e45f3a7ced10fcaeccca020e66656bc03dac384f852e4e5a7a8104a6" dependencies = [ "cc", "libc", @@ -1708,7 +2310,7 @@ dependencies = [ "fnv", "futures-channel", "futures-util", - "indexmap", + "indexmap 1.9.3", "js-sys", "once_cell", "pin-project-lite", @@ -1746,11 +2348,20 @@ dependencies = [ "num-traits", ] +[[package]] +name = "ordered-float" +version = "3.7.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "2fc2dbde8f8a79f2102cc474ceb0ad68e3b80b85289ea62389b60e66777e4213" +dependencies = [ + "num-traits", +] + [[package]] name = "os_str_bytes" -version = "6.5.0" +version = "6.5.1" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "ceedf44fb00f2d1984b0bc98102627ce622e083e49a5bacdb3e514fa4238e267" +checksum = "4d5d9eb14b174ee9aa2ef96dc2b94637a2d4b6e7cb873c7e171f0c20c6cf3eac" [[package]] name = "output_vt100" @@ -1767,6 +2378,15 @@ version = "0.1.1" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "b15813163c1d831bf4a13c3610c05c0d03b39feb07f7e09fa234dac9b15aaf39" +[[package]] +name = "ownedbytes" +version = "0.5.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "c718e498b20704d5fb5d51d07f414a22f61c19254c1708e117b93fd76860739c" +dependencies = [ + "stable_deref_trait", +] + [[package]] name = "parking_lot" version = "0.12.1" @@ -1779,28 +2399,51 @@ dependencies = [ [[package]] name = "parking_lot_core" -version = "0.9.7" +version = "0.9.8" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "9069cbb9f99e3a5083476ccb29ceb1de18b9118cafa53e90c9551235de2b9521" +checksum = "93f00c865fe7cabf650081affecd3871070f26767e7b2070a3ffae14c654b447" dependencies = [ "cfg-if 1.0.0", "libc", - "redox_syscall 0.2.16", + "redox_syscall 0.3.5", "smallvec", - "windows-sys 0.45.0", + "windows-targets", 
+] + +[[package]] +name = "password-hash" +version = "0.4.2" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "7676374caaee8a325c9e7a2ae557f216c5563a171d6997b0ef8a65af35147700" +dependencies = [ + "base64ct", + "rand_core 0.6.4", + "subtle", +] + +[[package]] +name = "pbkdf2" +version = "0.11.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "83a0692ec44e4cf1ef28ca317f14f8f07da2d95ec3fa01f86e4467b725e60917" +dependencies = [ + "digest", + "hmac", + "password-hash", + "sha2", ] [[package]] name = "percent-encoding" -version = "2.2.0" +version = "2.3.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "478c572c3d73181ff3c2539045f6eb99e5491218eae919370993b890cdbdd98e" +checksum = "9b2a4787296e9989611394c33f193f676704af1686e70b8f8033ab5ba9a35a94" [[package]] name = "pest" -version = "2.6.0" +version = "2.7.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "e68e84bfb01f0507134eac1e9b410a12ba379d064eab48c50ba4ce329a527b70" +checksum = "f73935e4d55e2abf7f130186537b19e7a4abc886a0252380b59248af473a3fc9" dependencies = [ "thiserror", "ucd-trie", @@ -1808,9 +2451,9 @@ dependencies = [ [[package]] name = "pest_derive" -version = "2.6.0" +version = "2.7.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "6b79d4c71c865a25a4322296122e3924d30bc8ee0834c8bfc8b95f7f054afbfb" +checksum = "aef623c9bbfa0eedf5a0efba11a5ee83209c326653ca31ff019bec3a95bfff2b" dependencies = [ "pest", "pest_generator", @@ -1818,22 +2461,22 @@ dependencies = [ [[package]] name = "pest_generator" -version = "2.6.0" +version = "2.7.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "6c435bf1076437b851ebc8edc3a18442796b30f1728ffea6262d59bbe28b077e" +checksum = "b3e8cba4ec22bada7fc55ffe51e2deb6a0e0db2d0b7ab0b103acc80d2510c190" dependencies = [ "pest", "pest_meta", "proc-macro2", "quote", - "syn 2.0.15", + "syn 2.0.28", ] [[package]] name = 
"pest_meta" -version = "2.6.0" +version = "2.7.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "745a452f8eb71e39ffd8ee32b3c5f51d03845f99786fa9b68db6ff509c505411" +checksum = "a01f71cb40bd8bb94232df14b946909e14660e33fc05db3e50ae2a82d7ea0ca0" dependencies = [ "once_cell", "pest", @@ -1842,22 +2485,22 @@ dependencies = [ [[package]] name = "pin-project" -version = "1.0.12" +version = "1.1.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "ad29a609b6bcd67fee905812e544992d216af9d755757c05ed2d0e15a74c6ecc" +checksum = "c95a7476719eab1e366eaf73d0260af3021184f18177925b07f54b30089ceead" dependencies = [ "pin-project-internal", ] [[package]] name = "pin-project-internal" -version = "1.0.12" +version = "1.1.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "069bdb1e05adc7a8990dce9cc75370895fbe4e3d58b9b73bf1aee56359344a55" +checksum = "39407670928234ebc5e6e580247dd567ad73a3578460c5990f9503df207e8f07" dependencies = [ "proc-macro2", "quote", - "syn 1.0.109", + "syn 2.0.28", ] [[package]] @@ -1874,15 +2517,15 @@ checksum = "8b870d8c151b6f2fb93e84a13146138f05d02ed11c7e7c54f8826aaaf7c9f184" [[package]] name = "pkg-config" -version = "0.3.26" +version = "0.3.27" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "6ac9a59f73473f1b8d852421e59e64809f025994837ef743615c6d0c5b305160" +checksum = "26072860ba924cbfa98ea39c8c19b4dd6a4a25423dbdf219c1eca91aa0cf6964" [[package]] name = "plotters" -version = "0.3.4" +version = "0.3.5" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "2538b639e642295546c50fcd545198c9d64ee2a38620a628724a3b266d5fbf97" +checksum = "d2c224ba00d7cadd4d5c660deaf2098e5e80e07846537c51f9cfa4be50c1fd45" dependencies = [ "num-traits", "plotters-backend", @@ -1893,27 +2536,27 @@ dependencies = [ [[package]] name = "plotters-backend" -version = "0.3.4" +version = "0.3.5" source = 
"registry+https://github.com/rust-lang/crates.io-index" -checksum = "193228616381fecdc1224c62e96946dfbc73ff4384fba576e052ff8c1bea8142" +checksum = "9e76628b4d3a7581389a35d5b6e2139607ad7c75b17aed325f210aa91f4a9609" [[package]] name = "plotters-svg" -version = "0.3.3" +version = "0.3.5" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "f9a81d2759aae1dae668f783c308bc5c8ebd191ff4184aaa1b37f65a6ae5a56f" +checksum = "38f6d39893cca0701371e3c27294f09797214b86f1fb951b89ade8ec04e2abab" dependencies = [ "plotters-backend", ] [[package]] name = "poem" -version = "1.3.55" +version = "1.3.56" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "c0608069d4999c3c02d49dff261663f2e73a8f7b00b7cd364fb5e93e419dafa1" +checksum = "0a56df40b79ebdccf7986b337f9b0e51ac55cd5e9d21fb20b6aa7c7d49741854" dependencies = [ "async-trait", - "base64 0.21.0", + "base64 0.21.2", "bytes", "futures-util", "headers", @@ -1939,9 +2582,9 @@ dependencies = [ [[package]] name = "poem-derive" -version = "1.3.55" +version = "1.3.56" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "3b839bad877aa933dd00901abd127a44496130e3def48e079d60e43f2c8a33cc" +checksum = "1701f977a2d650a03df42c053686ea0efdb83554f34c7b026b89383c0a1b7846" dependencies = [ "proc-macro-crate", "proc-macro2", @@ -1961,7 +2604,7 @@ version = "1.3.0" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "a25e9bcb20aa780fd0bb16b72403a9064d6b3f22f026946029acb941a50af755" dependencies = [ - "ctor 0.1.26", + "ctor", "diff", "output_vt100", "yansi", @@ -2011,43 +2654,18 @@ checksum = "dc375e1527247fe1a97d8b7156678dfe7c1af2fc075c9a4db3690ecd2a148068" [[package]] name = "proc-macro2" -version = "1.0.56" +version = "1.0.63" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "2b63bdb0cd06f1f4dedf69b254734f9b45af66e4a031e42a7480257d9898b435" +checksum = "7b368fba921b0dce7e60f5e04ec15e565b3303972b42bcfde1d0713b881959eb" 
dependencies = [ "unicode-ident", ] -[[package]] -name = "py-raphtory" -version = "0.4.0" -dependencies = [ - "bincode", - "chrono", - "csv", - "display-error-chain", - "flate2", - "flume", - "futures", - "itertools", - "num", - "parking_lot", - "pyo3", - "raphtory", - "raphtory-io", - "rayon", - "regex", - "replace_with", - "rustc-hash", - "serde", - "tokio", -] - [[package]] name = "pyo3" -version = "0.18.3" +version = "0.19.2" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "e3b1ac5b3731ba34fdaa9785f8d74d17448cd18f30cf19e0c7e7b1fdb5272109" +checksum = "e681a6cfdc4adcc93b4d3cf993749a4552018ee0a9b65fc0ccfad74352c72a38" dependencies = [ "cfg-if 1.0.0", "chrono", @@ -2062,11 +2680,24 @@ dependencies = [ "unindent", ] +[[package]] +name = "pyo3-asyncio" +version = "0.19.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "a2cc34c1f907ca090d7add03dc523acdd91f3a4dab12286604951e2f5152edad" +dependencies = [ + "futures", + "once_cell", + "pin-project-lite", + "pyo3", + "tokio", +] + [[package]] name = "pyo3-build-config" -version = "0.18.3" +version = "0.19.2" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "9cb946f5ac61bb61a5014924910d936ebd2b23b705f7a4a3c40b05c720b079a3" +checksum = "076c73d0bc438f7a4ef6fdd0c3bb4732149136abd952b110ac93e4edb13a6ba5" dependencies = [ "once_cell", "target-lexicon", @@ -2074,9 +2705,9 @@ dependencies = [ [[package]] name = "pyo3-ffi" -version = "0.18.3" +version = "0.19.2" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "fd4d7c5337821916ea2a1d21d1092e8443cf34879e53a0ac653fbb98f44ff65c" +checksum = "e53cee42e77ebe256066ba8aa77eff722b3bb91f3419177cf4cd0f304d3284d9" dependencies = [ "libc", "pyo3-build-config", @@ -2084,9 +2715,9 @@ dependencies = [ [[package]] name = "pyo3-macros" -version = "0.18.3" +version = "0.19.2" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = 
"a9d39c55dab3fc5a4b25bbd1ac10a2da452c4aca13bb450f22818a002e29648d" +checksum = "dfeb4c99597e136528c6dd7d5e3de5434d1ceaf487436a3f03b2d56b6fc9efd1" dependencies = [ "proc-macro2", "pyo3-macros-backend", @@ -2096,9 +2727,9 @@ dependencies = [ [[package]] name = "pyo3-macros-backend" -version = "0.18.3" +version = "0.19.2" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "97daff08a4c48320587b5224cc98d609e3c27b6d437315bd40b605c98eeb5918" +checksum = "947dc12175c254889edc0c02e399476c2f652b4b9ebd123aa655c224de259536" dependencies = [ "proc-macro2", "quote", @@ -2141,9 +2772,9 @@ dependencies = [ [[package]] name = "quote" -version = "1.0.26" +version = "1.0.30" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "4424af4bf778aae2051a77b60283332f386554255d722233d09fbfc7e30da2fc" +checksum = "5907a1b7c277254a8b15170f6e7c97cfa60ee7872a3217663bb81151e48184bb" dependencies = [ "proc-macro2", ] @@ -2235,7 +2866,7 @@ version = "0.6.4" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "ec0be4795e2f6a28069bec0b5ff3e2ac9bafc99e6a9a7dc3547996c5c816922c" dependencies = [ - "getrandom 0.2.9", + "getrandom 0.2.10", ] [[package]] @@ -2259,19 +2890,34 @@ dependencies = [ [[package]] name = "raphtory" -version = "0.4.0" +version = "0.5.7" dependencies = [ + "arrow2", + "async-trait", "bincode", + "bzip2", "chrono", "csv", + "dashmap", + "display-error-chain", + "enum_dispatch", + "flate2", "flume", "futures", + "futures-util", "genawaiter", "itertools", + "kdam", + "lock_api", + "neo4rs", + "num", "num-traits", "once_cell", + "ordered-float 3.7.0", "parking_lot", "pretty_assertions", + "pyo3", + "pyo3-asyncio", "quickcheck 1.0.3", "quickcheck_macros", "rand 0.8.5", @@ -2279,35 +2925,46 @@ dependencies = [ "rayon", "regex", "replace_with", + "reqwest", "roaring", "rustc-hash", "serde", + "serde_json", + "serde_with", "sorted_vector_map", + "tantivy", "tempdir", + "tempfile", "thiserror", + "tokio", "twox-hash", 
"uuid", + "zip", ] [[package]] name = "raphtory-benchmark" -version = "0.4.0" +version = "0.5.7" dependencies = [ "criterion", "rand 0.8.5", "raphtory", - "raphtory-io", "rayon", "sorted_vector_map", ] [[package]] name = "raphtory-graphql" -version = "0.4.0" +version = "0.5.7" dependencies = [ "async-graphql", "async-graphql-poem", + "async-openai", "async-stream", + "base64 0.21.2", + "bincode", + "chrono", + "clap 4.3.11", "dotenv", "dynamic-graphql", "futures-util", @@ -2315,44 +2972,46 @@ dependencies = [ "once_cell", "opentelemetry", "opentelemetry-jaeger", + "ordered-float 3.7.0", + "parking_lot", "poem", "raphtory", "serde", "serde_json", + "tempfile", + "thiserror", "tokio", "tracing", "tracing-opentelemetry", "tracing-subscriber", + "uuid", + "walkdir", ] [[package]] -name = "raphtory-io" -version = "0.4.0" +name = "raphtory-pymodule" +version = "0.5.7" dependencies = [ - "bzip2", - "chrono", - "csv", - "flate2", - "itertools", - "neo4rs", + "openssl", + "pyo3", + "pyo3-asyncio", + "pyo3-build-config", "raphtory", - "rayon", - "regex", - "reqwest", - "serde", - "serde_json", - "tokio", - "zip", + "raphtory-graphql", ] [[package]] -name = "raphtory-pymodule" -version = "0.4.0" +name = "raphtory-rust-benchmark" +version = "0.5.7" dependencies = [ - "openssl", - "py-raphtory", - "pyo3", - "pyo3-build-config", + "chrono", + "clap 4.3.11", + "csv", + "flate2", + "ordered-float 3.7.0", + "raphtory", + "serde", + "tar", ] [[package]] @@ -2392,7 +3051,7 @@ version = "0.2.16" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "fb5a58c1855b4b6819d59012155603f0b22ad30cad752600aadfcb695265519a" dependencies = [ - "bitflags", + "bitflags 1.3.2", ] [[package]] @@ -2401,18 +3060,18 @@ version = "0.3.5" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "567664f262709473930a4bf9e51bf2ebf3348f2e748ccc50dea20646858f8f29" dependencies = [ - "bitflags", + "bitflags 1.3.2", ] [[package]] name = "regex" -version = "1.8.1" 
+version = "1.8.4" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "af83e617f331cc6ae2da5443c602dfa5af81e517212d9d611a5b3ba1777b5370" +checksum = "d0ab3ca65655bb1e41f2a8c8cd662eb4fb035e67c3f78da1d61dffe89d07300f" dependencies = [ "aho-corasick", "memchr", - "regex-syntax 0.7.1", + "regex-syntax 0.7.2", ] [[package]] @@ -2432,9 +3091,9 @@ checksum = "f162c6dd7b008981e4d40210aca20b4bd0f9b60ca9271061b07f78537722f2e1" [[package]] name = "regex-syntax" -version = "0.7.1" +version = "0.7.2" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "a5996294f19bd3aae0453a862ad728f60e6600695733dd5df01da90c54363a3c" +checksum = "436b050e76ed2903236f032a59761c1eb99e1b0aead2c257922771dab1fc8c78" [[package]] name = "remove_dir_all" @@ -2453,11 +3112,11 @@ checksum = "e3a8614ee435691de62bcffcf4a66d91b3594bf1428a5722e79103249a095690" [[package]] name = "reqwest" -version = "0.11.17" +version = "0.11.18" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "13293b639a097af28fc8a90f22add145a9c954e49d77da06263d58cf44d5fb91" +checksum = "cde824a14b7c14f85caff81225f411faacc04a2013f41670f41443742b1c1c55" dependencies = [ - "base64 0.21.0", + "base64 0.21.2", "bytes", "encoding_rs", "futures-core", @@ -2466,28 +3125,52 @@ dependencies = [ "http", "http-body", "hyper", + "hyper-rustls", "hyper-tls", "ipnet", "js-sys", "log", "mime", + "mime_guess", "native-tls", "once_cell", "percent-encoding", "pin-project-lite", + "rustls", + "rustls-native-certs", + "rustls-pemfile", "serde", "serde_json", "serde_urlencoded", "tokio", "tokio-native-tls", + "tokio-rustls", + "tokio-util", "tower-service", "url", "wasm-bindgen", "wasm-bindgen-futures", + "wasm-streams", "web-sys", "winreg", ] +[[package]] +name = "reqwest-eventsource" +version = "0.4.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "8f03f570355882dd8d15acc3a313841e6e90eddbc76a93c748fd82cc13ba9f51" +dependencies = [ + 
"eventsource-stream", + "futures-core", + "futures-timer", + "mime", + "nom", + "pin-project-lite", + "reqwest", + "thiserror", +] + [[package]] name = "retain_mut" version = "0.1.7" @@ -2503,6 +3186,21 @@ dependencies = [ "uncased", ] +[[package]] +name = "ring" +version = "0.16.20" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "3053cf52e236a3ed746dfc745aa9cacf1b791d846bdaf412f60a8d7d6e17c8fc" +dependencies = [ + "cc", + "libc", + "once_cell", + "spin 0.5.2", + "untrusted", + "web-sys", + "winapi", +] + [[package]] name = "roaring" version = "0.10.1" @@ -2515,26 +3213,107 @@ dependencies = [ "serde", ] +[[package]] +name = "rust-stemmers" +version = "1.2.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "e46a2036019fdb888131db7a4c847a1063a7493f971ed94ea82c67eada63ca54" +dependencies = [ + "serde", + "serde_derive", +] + [[package]] name = "rustc-hash" version = "1.1.0" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "08d43f7aa6b08d49f382cde6a7982047c3426db949b1424bc4b7ec9ae12c6ce2" +[[package]] +name = "rustc_version" +version = "0.4.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "bfa0f585226d2e68097d4f95d113b15b83a82e819ab25717ec0590d9584ef366" +dependencies = [ + "semver", +] + [[package]] name = "rustix" -version = "0.37.19" +version = "0.37.20" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "acf8729d8542766f1b2cf77eb034d52f40d375bb8b615d0b147089946e16613d" +checksum = "b96e891d04aa506a6d1f318d2771bcb1c7dfda84e126660ace067c9b474bb2c0" dependencies = [ - "bitflags", + "bitflags 1.3.2", "errno", "io-lifetimes", "libc", - "linux-raw-sys", + "linux-raw-sys 0.3.8", + "windows-sys 0.48.0", +] + +[[package]] +name = "rustix" +version = "0.38.2" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "aabcb0461ebd01d6b79945797c27f8529082226cb630a9865a71870ff63532a4" +dependencies = [ + "bitflags 
2.3.3", + "errno", + "libc", + "linux-raw-sys 0.4.3", "windows-sys 0.48.0", ] +[[package]] +name = "rustls" +version = "0.21.2" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "e32ca28af694bc1bbf399c33a516dbdf1c90090b8ab23c2bc24f834aa2247f5f" +dependencies = [ + "log", + "ring", + "rustls-webpki", + "sct", +] + +[[package]] +name = "rustls-native-certs" +version = "0.6.3" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "a9aace74cb666635c918e9c12bc0d348266037aa8eb599b5cba565709a8dff00" +dependencies = [ + "openssl-probe", + "rustls-pemfile", + "schannel", + "security-framework", +] + +[[package]] +name = "rustls-pemfile" +version = "1.0.3" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "2d3987094b1d07b653b7dfdc3f70ce9a1da9c51ac18c1b06b662e4f9a0e9f4b2" +dependencies = [ + "base64 0.21.2", +] + +[[package]] +name = "rustls-webpki" +version = "0.100.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "d6207cd5ed3d8dca7816f8f3725513a34609c0c765bf652b8c3cb4cfd87db46b" +dependencies = [ + "ring", + "untrusted", +] + +[[package]] +name = "rustversion" +version = "1.0.13" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "dc31bd9b61a32c31f9650d18add92aa83a49ba979c143eefd27fe7177b05bd5f" + [[package]] name = "ryu" version = "1.0.13" @@ -2572,18 +3351,22 @@ source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "d29ab0c6d3fc0ee92fe66e2d99f700eab17a8d57d1c1d3b748380fb20baa78cd" [[package]] -name = "scratch" -version = "1.0.5" +name = "sct" +version = "0.7.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "1792db035ce95be60c3f8853017b3999209281c24e2ba5bc8e59bf97a0c590c1" +checksum = "d53dcdb7c9f8158937a7981b48accfd39a43af418591a5d008c7b22b5e1b7ca4" +dependencies = [ + "ring", + "untrusted", +] [[package]] name = "security-framework" -version = "2.8.2" +version = "2.9.1" source = 
"registry+https://github.com/rust-lang/crates.io-index" -checksum = "a332be01508d814fed64bf28f798a146d73792121129962fdf335bb3c49a4254" +checksum = "1fc758eb7bffce5b308734e9b0c1468893cae9ff70ebf13e7090be8dcbcc83a8" dependencies = [ - "bitflags", + "bitflags 1.3.2", "core-foundation", "core-foundation-sys", "libc", @@ -2592,39 +3375,56 @@ dependencies = [ [[package]] name = "security-framework-sys" -version = "2.8.0" +version = "2.9.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "31c9bb296072e961fcbd8853511dd39c2d8be2deb1e17c6860b1d30732b323b4" +checksum = "f51d0c0d83bec45f16480d0ce0058397a69e48fcdc52d1dc8855fb68acbd31a7" dependencies = [ "core-foundation-sys", "libc", ] +[[package]] +name = "semver" +version = "1.0.17" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "bebd363326d05ec3e2f532ab7660680f3b02130d780c299bca73469d521bc0ed" + [[package]] name = "serde" -version = "1.0.160" +version = "1.0.164" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "bb2f3770c8bce3bcda7e149193a069a0f4365bda1fa5cd88e03bca26afc1216c" +checksum = "9e8c8cf938e98f769bc164923b06dce91cea1751522f46f8466461af04c9027d" dependencies = [ "serde_derive", ] +[[package]] +name = "serde-wasm-bindgen" +version = "0.5.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "f3b143e2833c57ab9ad3ea280d21fd34e285a42837aeb0ee301f4f41890fa00e" +dependencies = [ + "js-sys", + "serde", + "wasm-bindgen", +] + [[package]] name = "serde_derive" -version = "1.0.160" +version = "1.0.164" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "291a097c63d8497e00160b166a967a4a79c64f3facdd01cbd7502231688d77df" +checksum = "d9735b638ccc51c28bf6914d90a2e9725b377144fc612c49a611fddd1b631d68" dependencies = [ "proc-macro2", "quote", - "syn 2.0.15", + "syn 2.0.28", ] [[package]] name = "serde_json" -version = "1.0.96" +version = "1.0.99" source = 
"registry+https://github.com/rust-lang/crates.io-index" -checksum = "057d394a50403bcac12672b2b18fb387ab6d289d957dab67dd201875391e52f1" +checksum = "46266871c240a00b8f503b877622fe33430b3c7d963bdc0f2adc511e54a1eae3" dependencies = [ "itoa", "ryu", @@ -2637,10 +3437,39 @@ version = "0.7.1" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "d3491c14715ca2294c4d6a88f15e84739788c1d030eed8c110436aafdaa2f3fd" dependencies = [ - "form_urlencoded", - "itoa", - "ryu", - "serde", + "form_urlencoded", + "itoa", + "ryu", + "serde", +] + +[[package]] +name = "serde_with" +version = "3.3.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "1ca3b16a3d82c4088f343b7480a93550b3eabe1a358569c2dfe38bbcead07237" +dependencies = [ + "base64 0.21.2", + "chrono", + "hex", + "indexmap 1.9.3", + "indexmap 2.0.0", + "serde", + "serde_json", + "serde_with_macros", + "time 0.3.22", +] + +[[package]] +name = "serde_with_macros" +version = "3.3.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "2e6be15c453eb305019bfa438b1593c731f36a289a7853f7707ee29e870b3b3c" +dependencies = [ + "darling 0.20.3", + "proc-macro2", + "quote", + "syn 2.0.28", ] [[package]] @@ -2656,9 +3485,9 @@ dependencies = [ [[package]] name = "sha2" -version = "0.10.6" +version = "0.10.7" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "82e6b795fe2e3b1e845bafcb27aa35405c4d47cdfc92af5fc8d3002f76cebdc0" +checksum = "479fb9d862239e610720565ca91403019f2f00410f1864c5aa7479b950a76ed8" dependencies = [ "cfg-if 1.0.0", "cpufeatures", @@ -2683,6 +3512,21 @@ dependencies = [ "libc", ] +[[package]] +name = "simdutf8" +version = "0.1.4" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "f27f6278552951f1f2b8cf9da965d10969b2efdea95a6ec47987ab46edfe263a" + +[[package]] +name = "sketches-ddsketch" +version = "0.2.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = 
"68a406c1882ed7f29cd5e248c9848a80e7cb6ae0fea82346d2746f2f941c07e1" +dependencies = [ + "serde", +] + [[package]] name = "slab" version = "0.4.8" @@ -2717,6 +3561,12 @@ dependencies = [ "quickcheck 0.9.2", ] +[[package]] +name = "spin" +version = "0.5.2" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "6e63cff320ae2c57904679ba7cb63280a3dc4613885beafb148ee7bf9aa9042d" + [[package]] name = "spin" version = "0.9.8" @@ -2726,6 +3576,12 @@ dependencies = [ "lock_api", ] +[[package]] +name = "stable_deref_trait" +version = "1.2.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "a8f112729512f8e442d81f95a8a7ddf2b7c6b8a1a6f509a95864142b30cab2d3" + [[package]] name = "static_assertions" version = "1.1.0" @@ -2738,6 +3594,12 @@ version = "0.10.0" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "73473c0e59e6d5812c5dfe2a064a6444949f089e20eec9a2e5506596494e4623" +[[package]] +name = "subtle" +version = "2.5.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "81cdd64d312baedb58e21336b31bc043b77e01cc99033ce76ef539f78e965ebc" + [[package]] name = "syn" version = "1.0.109" @@ -2751,9 +3613,9 @@ dependencies = [ [[package]] name = "syn" -version = "2.0.15" +version = "2.0.28" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "a34fcf3e8b60f57e6a14301a2e916d323af98b0ea63c599441eec8558660c822" +checksum = "04361975b3f5e348b2189d8dc55bc942f278b2d482a6a0365de5bdd62d351567" dependencies = [ "proc-macro2", "quote", @@ -2771,11 +3633,165 @@ dependencies = [ "syn 1.0.109", ] +[[package]] +name = "tantivy" +version = "0.20.2" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "aec540e9cebc88f523f67f596dee213e491f0c55961de013566f267a0c31f5e9" +dependencies = [ + "aho-corasick", + "arc-swap", + "async-trait", + "base64 0.21.2", + "bitpacking", + "byteorder", + "census", + "crc32fast", + "crossbeam-channel", + "downcast-rs", + 
"fail", + "fastdivide", + "fs4", + "htmlescape", + "itertools", + "levenshtein_automata", + "log", + "lru", + "lz4_flex", + "measure_time", + "memmap2", + "murmurhash32", + "num_cpus", + "once_cell", + "oneshot", + "rayon", + "regex", + "rust-stemmers", + "rustc-hash", + "serde", + "serde_json", + "sketches-ddsketch", + "smallvec", + "tantivy-bitpacker", + "tantivy-columnar", + "tantivy-common", + "tantivy-fst", + "tantivy-query-grammar", + "tantivy-stacker", + "tantivy-tokenizer-api", + "tempfile", + "thiserror", + "time 0.3.22", + "uuid", + "winapi", +] + +[[package]] +name = "tantivy-bitpacker" +version = "0.4.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "16099e96f0ede682084469b80d6909dc170aa2b11d2a45538b5b36b2a90090b9" +dependencies = [ + "bitpacking", +] + +[[package]] +name = "tantivy-columnar" +version = "0.1.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "56e32b024b26eab93eb8648faf08004356bf9d47376557ee4409f4b210163656" +dependencies = [ + "fastdivide", + "fnv", + "itertools", + "serde", + "tantivy-bitpacker", + "tantivy-common", + "tantivy-sstable", + "tantivy-stacker", +] + +[[package]] +name = "tantivy-common" +version = "0.5.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "e7d12fdd6ec0f7e0962f129c03c696a85ec567734950cbb2b89af4a293ce342f" +dependencies = [ + "async-trait", + "byteorder", + "ownedbytes", + "serde", + "time 0.3.22", +] + +[[package]] +name = "tantivy-fst" +version = "0.4.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "fc3c506b1a8443a3a65352df6382a1fb6a7afe1a02e871cee0d25e2c3d5f3944" +dependencies = [ + "byteorder", + "regex-syntax 0.6.29", + "utf8-ranges", +] + +[[package]] +name = "tantivy-query-grammar" +version = "0.20.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "106d8f78ad1da4f0fdd526a0760c326c0573510d4dedabeb1962d35a35879797" +dependencies = [ + "combine", + 
"once_cell", + "regex", +] + +[[package]] +name = "tantivy-sstable" +version = "0.1.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "eda34243d3ee64bd8f9ba74a3b0d05f4d07beff7767a727212e9b5a19c13dde7" +dependencies = [ + "tantivy-common", + "tantivy-fst", + "zstd 0.12.3+zstd.1.5.2", +] + +[[package]] +name = "tantivy-stacker" +version = "0.1.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "67b9e9470301b026ad3b95f79a791a2a3ee81f3ab16fbe412a9dd81ff834acf5" +dependencies = [ + "murmurhash32", + "tantivy-common", +] + +[[package]] +name = "tantivy-tokenizer-api" +version = "0.1.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "64186801b6e06b3a1c4275e23b517835ff4ecbb707318b838dc9de457c062200" +dependencies = [ + "serde", +] + +[[package]] +name = "tar" +version = "0.4.38" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "4b55807c0344e1e6c04d7c965f5289c39a8d94ae23ed5c0b57aabac549f871c6" +dependencies = [ + "filetime", + "libc", + "xattr", +] + [[package]] name = "target-lexicon" -version = "0.12.7" +version = "0.12.8" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "fd1ba337640d60c3e96bc6f0638a939b9c9a7f2c316a1598c279828b3d1dc8c5" +checksum = "1b1c7f239eb94671427157bd93b3694320f3668d4e1eff08c7285366fd777fac" [[package]] name = "tempdir" @@ -2789,24 +3805,26 @@ dependencies = [ [[package]] name = "tempfile" -version = "3.5.0" +version = "3.6.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "b9fbec84f381d5795b08656e4912bec604d162bff9291d6189a78f4c8ab87998" +checksum = "31c0432476357e58790aaa47a8efb0c5138f137343f3b5f23bd36a27e3b0a6d6" dependencies = [ + "autocfg", "cfg-if 1.0.0", "fastrand", "redox_syscall 0.3.5", - "rustix", - "windows-sys 0.45.0", + "rustix 0.37.20", + "windows-sys 0.48.0", ] [[package]] -name = "termcolor" -version = "1.2.0" +name = "terminal_size" +version = "0.2.6" 
source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "be55cf8942feac5c765c2c993422806843c9a9a45d4d5c407ad6dd2ea95eb9b6" +checksum = "8e6bf6f19e9f8ed8d4048dc22981458ebcf406d67e94cd422e5ecd73d63b3237" dependencies = [ - "winapi-util", + "rustix 0.37.20", + "windows-sys 0.48.0", ] [[package]] @@ -2817,22 +3835,22 @@ checksum = "222a222a5bfe1bba4a77b45ec488a741b3cb8872e5e499451fd7d0129c9c7c3d" [[package]] name = "thiserror" -version = "1.0.40" +version = "1.0.46" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "978c9a314bd8dc99be594bc3c175faaa9794be04a5a5e153caba6915336cebac" +checksum = "d9207952ae1a003f42d3d5e892dac3c6ba42aa6ac0c79a6a91a2b5cb4253e75c" dependencies = [ "thiserror-impl", ] [[package]] name = "thiserror-impl" -version = "1.0.40" +version = "1.0.46" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "f9456a42c5b0d803c8cd86e73dd7cc9edd429499f37a3550d286d5e86720569f" +checksum = "f1728216d3244de4f14f14f8c15c79be1a7c67867d28d69b719690e2a19fb445" dependencies = [ "proc-macro2", "quote", - "syn 2.0.15", + "syn 2.0.28", ] [[package]] @@ -2863,7 +3881,7 @@ dependencies = [ "byteorder", "integer-encoding", "log", - "ordered-float", + "ordered-float 1.1.1", "threadpool", ] @@ -2878,6 +3896,33 @@ dependencies = [ "winapi", ] +[[package]] +name = "time" +version = "0.3.22" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "ea9e1b3cf1243ae005d9e74085d4d542f3125458f3a81af210d901dcd7411efd" +dependencies = [ + "itoa", + "serde", + "time-core", + "time-macros", +] + +[[package]] +name = "time-core" +version = "0.1.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "7300fbefb4dadc1af235a9cef3737cea692a9d97e1b9cbcd4ebdae6f8868e6fb" + +[[package]] +name = "time-macros" +version = "0.2.9" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "372950940a5f07bf38dbe211d7283c9e6d7327df53794992d293e534c733d09b" 
+dependencies = [ + "time-core", +] + [[package]] name = "tinytemplate" version = "1.2.1" @@ -2905,9 +3950,9 @@ checksum = "1f3ccbac311fea05f86f61904b462b55fb3df8837a366dfc601a0161d0532f20" [[package]] name = "tokio" -version = "1.27.0" +version = "1.28.2" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "d0de47a4eecbe11f498978a9b29d792f0d2692d1dd003650c24c76510e3bc001" +checksum = "94d7b1cfd2aa4011f2de74c2c4c63665e27a71006b0a192dcd2710272e73dfa2" dependencies = [ "autocfg", "bytes", @@ -2919,18 +3964,18 @@ dependencies = [ "signal-hook-registry", "socket2", "tokio-macros", - "windows-sys 0.45.0", + "windows-sys 0.48.0", ] [[package]] name = "tokio-macros" -version = "2.0.0" +version = "2.1.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "61a573bdc87985e9d6ddeed1b3d864e8a302c847e40d647746df2f1de209d1ce" +checksum = "630bdcf245f78637c13ec01ffae6187cca34625e8c63150d424b59e55af2675e" dependencies = [ "proc-macro2", "quote", - "syn 2.0.15", + "syn 2.0.28", ] [[package]] @@ -2943,6 +3988,16 @@ dependencies = [ "tokio", ] +[[package]] +name = "tokio-rustls" +version = "0.24.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "c28327cf380ac148141087fbfb9de9d7bd4e84ab5d2c28fbc911d753de8a7081" +dependencies = [ + "rustls", + "tokio", +] + [[package]] name = "tokio-stream" version = "0.1.14" @@ -2983,17 +4038,17 @@ dependencies = [ [[package]] name = "toml_datetime" -version = "0.6.1" +version = "0.6.3" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "3ab8ed2edee10b50132aed5f331333428b011c99402b5a534154ed15746f9622" +checksum = "7cda73e2f1397b1262d6dfdcef8aafae14d1de7748d66822d3bfeeb6d03e5e4b" [[package]] name = "toml_edit" -version = "0.19.8" +version = "0.19.11" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "239410c8609e8125456927e6707163a3b1fdb40561e4b803bc041f466ccfdc13" +checksum = 
"266f016b7f039eec8a1a80dfe6156b633d208b9fccca5e4db1d6775b0c4e34a7" dependencies = [ - "indexmap", + "indexmap 2.0.0", "toml_datetime", "winnow", ] @@ -3018,13 +4073,13 @@ dependencies = [ [[package]] name = "tracing-attributes" -version = "0.1.24" +version = "0.1.26" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "0f57e3ca2a01450b1a921183a9c9cbfda207fd822cef4ccb00a65402cbba7a74" +checksum = "5f4f31f56159e98206da9efd823404b79b6ef3143b4a7ab76e67b1751b25a4ab" dependencies = [ "proc-macro2", "quote", - "syn 2.0.15", + "syn 2.0.28", ] [[package]] @@ -3137,6 +4192,15 @@ dependencies = [ "version_check", ] +[[package]] +name = "unicase" +version = "2.7.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "f7d2d4dafb69621809a81864c9c1b864479e1235c0dd4e199924b9742439ed89" +dependencies = [ + "version_check", +] + [[package]] name = "unicode-bidi" version = "0.3.13" @@ -3145,9 +4209,9 @@ checksum = "92888ba5573ff080736b3648696b70cafad7d250551175acbaa4e0385b3e1460" [[package]] name = "unicode-ident" -version = "1.0.8" +version = "1.0.9" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "e5464a87b239f13a63a501f2701565754bae92d243d4bb7eb12f6d57d2269bf4" +checksum = "b15811caf2415fb889178633e7724bad2509101cde276048e013b9def5e51fa0" [[package]] name = "unicode-normalization" @@ -3158,23 +4222,23 @@ dependencies = [ "tinyvec", ] -[[package]] -name = "unicode-width" -version = "0.1.10" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "c0edd1e5b14653f783770bce4a4dabb4a5108a5370a5f5d8cfe8710c361f6c8b" - [[package]] name = "unindent" version = "0.1.11" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "e1766d682d402817b5ac4490b3c3002d91dfa0d22812f341609f97b08757359c" +[[package]] +name = "untrusted" +version = "0.7.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = 
"a156c684c91ea7d62626509bce3cb4e1d9ed5c4d978f7b4352658f96a4c26b4a" + [[package]] name = "url" -version = "2.3.1" +version = "2.4.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "0d68c799ae75762b8c3fe375feb6600ef5602c883c5d21eb51c09f22b83c4643" +checksum = "50bff7831e19200a85b17131d085c25d7811bc4e186efdaf54bbd132994a88cb" dependencies = [ "form_urlencoded", "idna", @@ -3187,13 +4251,26 @@ version = "0.7.6" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "09cc8ee72d2a9becf2f2febe0205bbed8fc6615b7cb429ad062dc7b7ddd036a9" +[[package]] +name = "utf8-ranges" +version = "1.0.5" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "7fcfc827f90e53a02eaef5e535ee14266c1d569214c6aa70133a624d8a3164ba" + +[[package]] +name = "utf8parse" +version = "0.2.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "711b9620af191e0cdc7468a8d14e709c3dcdb115b36f838e601583af800a370a" + [[package]] name = "uuid" -version = "1.3.1" +version = "1.4.1" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "5b55a3fef2a1e3b3a00ce878640918820d3c51081576ac657d23af9fc7928fdb" +checksum = "79daa5ed5740825c40b389c5e50312b9c86df53fccd33f281df655642b43869d" dependencies = [ - "getrandom 0.2.9", + "getrandom 0.2.10", + "serde", ] [[package]] @@ -3226,11 +4303,10 @@ dependencies = [ [[package]] name = "want" -version = "0.3.0" +version = "0.3.1" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "1ce8a968cb1cd110d136ff8b819a556d6fb6d919363c61534f6860c7eb172ba0" +checksum = "bfa7760aed19e106de2c7c0b581b509f2f25d3dacaf737cb82ac61bc6d760b0e" dependencies = [ - "log", "try-lock", ] @@ -3254,9 +4330,9 @@ checksum = "9c8d87e72b64a3b4db28d11ce29237c246188f4f51057d65a7eab63b7987e423" [[package]] name = "wasm-bindgen" -version = "0.2.86" +version = "0.2.87" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = 
"5bba0e8cb82ba49ff4e229459ff22a191bbe9a1cb3a341610c9c33efc27ddf73" +checksum = "7706a72ab36d8cb1f80ffbf0e071533974a60d0a308d01a5d0375bf60499a342" dependencies = [ "cfg-if 1.0.0", "wasm-bindgen-macro", @@ -3264,24 +4340,24 @@ dependencies = [ [[package]] name = "wasm-bindgen-backend" -version = "0.2.86" +version = "0.2.87" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "19b04bc93f9d6bdee709f6bd2118f57dd6679cf1176a1af464fca3ab0d66d8fb" +checksum = "5ef2b6d3c510e9625e5fe6f509ab07d66a760f0885d858736483c32ed7809abd" dependencies = [ "bumpalo", "log", "once_cell", "proc-macro2", "quote", - "syn 2.0.15", + "syn 2.0.28", "wasm-bindgen-shared", ] [[package]] name = "wasm-bindgen-futures" -version = "0.4.36" +version = "0.4.37" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "2d1985d03709c53167ce907ff394f5316aa22cb4e12761295c5dc57dacb6297e" +checksum = "c02dbc21516f9f1f04f187958890d7e6026df8d16540b7ad9492bc34a67cea03" dependencies = [ "cfg-if 1.0.0", "js-sys", @@ -3291,9 +4367,9 @@ dependencies = [ [[package]] name = "wasm-bindgen-macro" -version = "0.2.86" +version = "0.2.87" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "14d6b024f1a526bb0234f52840389927257beb670610081360e5a03c5df9c258" +checksum = "dee495e55982a3bd48105a7b947fd2a9b4a8ae3010041b9e0faab3f9cd028f1d" dependencies = [ "quote", "wasm-bindgen-macro-support", @@ -3301,28 +4377,28 @@ dependencies = [ [[package]] name = "wasm-bindgen-macro-support" -version = "0.2.86" +version = "0.2.87" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "e128beba882dd1eb6200e1dc92ae6c5dbaa4311aa7bb211ca035779e5efc39f8" +checksum = "54681b18a46765f095758388f2d0cf16eb8d4169b639ab575a8f5693af210c7b" dependencies = [ "proc-macro2", "quote", - "syn 2.0.15", + "syn 2.0.28", "wasm-bindgen-backend", "wasm-bindgen-shared", ] [[package]] name = "wasm-bindgen-shared" -version = "0.2.86" +version = "0.2.87" source = 
"registry+https://github.com/rust-lang/crates.io-index" -checksum = "ed9d5b4305409d1fc9482fee2d7f9bcbf24b3972bf59817ef757e23982242a93" +checksum = "ca6ad05a4870b2bf5fe995117d3728437bd27d7cd5f06f13c17443ef369775a1" [[package]] name = "wasm-bindgen-test" -version = "0.3.36" +version = "0.3.37" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "c9e636f3a428ff62b3742ebc3c70e254dfe12b8c2b469d688ea59cdd4abcf502" +checksum = "6e6e302a7ea94f83a6d09e78e7dc7d9ca7b186bc2829c24a22d0753efd680671" dependencies = [ "console_error_panic_hook", "js-sys", @@ -3334,24 +4410,46 @@ dependencies = [ [[package]] name = "wasm-bindgen-test-macro" -version = "0.3.36" +version = "0.3.37" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "f18c1fad2f7c4958e7bcce014fa212f59a65d5e3721d0f77e6c0b27ede936ba3" +checksum = "ecb993dd8c836930ed130e020e77d9b2e65dd0fbab1b67c790b0f5d80b11a575" dependencies = [ "proc-macro2", "quote", ] +[[package]] +name = "wasm-streams" +version = "0.2.3" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "6bbae3363c08332cadccd13b67db371814cd214c2524020932f0804b8cf7c078" +dependencies = [ + "futures-util", + "js-sys", + "wasm-bindgen", + "wasm-bindgen-futures", + "web-sys", +] + [[package]] name = "web-sys" -version = "0.3.61" +version = "0.3.64" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "e33b99f4b23ba3eec1a53ac264e35a755f00e966e0065077d6027c0f575b0b97" +checksum = "9b85cbef8c220a6abc02aefd892dfc0fc23afb1c6a426316ec33253a3877249b" dependencies = [ "js-sys", "wasm-bindgen", ] +[[package]] +name = "webpki-roots" +version = "0.23.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "b03058f88386e5ff5310d9111d53f48b17d732b401aeb83a8d5190f2ac459338" +dependencies = [ + "rustls-webpki", +] + [[package]] name = "wee_alloc" version = "0.4.5" @@ -3401,7 +4499,7 @@ version = "0.48.0" source = 
"registry+https://github.com/rust-lang/crates.io-index" checksum = "e686886bc078bc1b0b600cac0147aadb815089b6e4da64016cbd754b6342700f" dependencies = [ - "windows-targets 0.48.0", + "windows-targets", ] [[package]] @@ -3419,37 +4517,13 @@ dependencies = [ "windows_x86_64_msvc 0.42.2", ] -[[package]] -name = "windows-sys" -version = "0.45.0" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "75283be5efb2831d37ea142365f009c02ec203cd29a3ebecbc093d52315b66d0" -dependencies = [ - "windows-targets 0.42.2", -] - [[package]] name = "windows-sys" version = "0.48.0" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "677d2418bec65e3338edb076e806bc1ec15693c5d0104683f2efe857f61056a9" dependencies = [ - "windows-targets 0.48.0", -] - -[[package]] -name = "windows-targets" -version = "0.42.2" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "8e5180c00cd44c9b1c88adb3693291f1cd93605ded80c250a75d472756b4d071" -dependencies = [ - "windows_aarch64_gnullvm 0.42.2", - "windows_aarch64_msvc 0.42.2", - "windows_i686_gnu 0.42.2", - "windows_i686_msvc 0.42.2", - "windows_x86_64_gnu 0.42.2", - "windows_x86_64_gnullvm 0.42.2", - "windows_x86_64_msvc 0.42.2", + "windows-targets", ] [[package]] @@ -3553,9 +4627,9 @@ checksum = "1a515f5799fe4961cb532f983ce2b23082366b898e52ffbce459c86f67c8378a" [[package]] name = "winnow" -version = "0.4.6" +version = "0.4.7" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "61de7bac303dc551fe038e2b3cef0f571087a47571ea6e79a87692ac99b99699" +checksum = "ca0ace3845f0d96209f0375e6d367e3eb87eb65d27d445bdc9f1843a26f39448" dependencies = [ "memchr", ] @@ -3569,6 +4643,15 @@ dependencies = [ "winapi", ] +[[package]] +name = "xattr" +version = "0.2.3" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "6d1526bbe5aaeb5eb06885f4d987bcdfa5e23187055de9b83fe00156a821fabc" +dependencies = [ + "libc", +] + [[package]] name = "yansi" version = 
"0.5.1" @@ -3577,14 +4660,69 @@ checksum = "09041cd90cf85f7f8b2df60c646f853b7f535ce68f85244eb6731cf89fa498ec" [[package]] name = "zip" -version = "0.5.13" +version = "0.6.6" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "93ab48844d61251bb3835145c521d88aa4031d7139e8485990f60ca911fa0815" +checksum = "760394e246e4c28189f19d488c058bf16f564016aefac5d32bb1f3b51d5e9261" dependencies = [ + "aes", "byteorder", "bzip2", + "constant_time_eq", "crc32fast", + "crossbeam-utils", "flate2", - "thiserror", - "time", + "hmac", + "pbkdf2", + "sha1", + "time 0.3.22", + "zstd 0.11.2+zstd.1.5.2", +] + +[[package]] +name = "zstd" +version = "0.11.2+zstd.1.5.2" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "20cc960326ece64f010d2d2107537f26dc589a6573a316bd5b1dba685fa5fde4" +dependencies = [ + "zstd-safe 5.0.2+zstd.1.5.2", +] + +[[package]] +name = "zstd" +version = "0.12.3+zstd.1.5.2" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "76eea132fb024e0e13fd9c2f5d5d595d8a967aa72382ac2f9d39fcc95afd0806" +dependencies = [ + "zstd-safe 6.0.5+zstd.1.5.4", +] + +[[package]] +name = "zstd-safe" +version = "5.0.2+zstd.1.5.2" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "1d2a5585e04f9eea4b2a3d1eca508c4dee9592a89ef6f450c11719da0726f4db" +dependencies = [ + "libc", + "zstd-sys", +] + +[[package]] +name = "zstd-safe" +version = "6.0.5+zstd.1.5.4" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "d56d9e60b4b1758206c238a10165fbcae3ca37b01744e394c463463f6529d23b" +dependencies = [ + "libc", + "zstd-sys", +] + +[[package]] +name = "zstd-sys" +version = "2.0.8+zstd.1.5.5" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "5556e6ee25d32df2586c098bbfa278803692a20d0ab9565e049480d52707ec8c" +dependencies = [ + "cc", + "libc", + "pkg-config", ] diff --git a/Cargo.toml b/Cargo.toml index 1ce676d890..5b07049519 100644 --- a/Cargo.toml 
+++ b/Cargo.toml @@ -1,18 +1,18 @@ [workspace] members = [ "raphtory", - "raphtory-io", "raphtory-benchmark", "examples/rust", + "examples/custom_python_extension", "python", - "py-raphtory", "js-raphtory", "raphtory-graphql", + "comparison-benchmark/rust/raphtory-rust-benchmark" ] default-members = ["raphtory"] [workspace.package] -version = "0.4.0" +version = "0.5.7" documentation = "https://raphtory.readthedocs.io/en/latest/" repository = "https://github.com/Raphtory/raphtory/" license = "GPL-3.0" diff --git a/Makefile b/Makefile index c8f17ad30d..0f48dd1771 100644 --- a/Makefile +++ b/Makefile @@ -1,5 +1,8 @@ RUST_READTHEDOCS_DOCS_TARGET=docs/source/_rustdoc +rust-fmt: + cargo +nightly fmt + rust-build: cargo build -q @@ -25,4 +28,4 @@ install-python: cd python && maturin build && pip install ../target/wheels/*.whl run-graphql: - cargo run --release -p raphtory-graphql \ No newline at end of file + cargo run --release -p raphtory-graphql diff --git a/README.md b/README.md index 932c2e4715..989cb5696a 100644 --- a/README.md +++ b/README.md @@ -21,7 +21,10 @@ PyPI - + +PyPI Downloads + + Launch Notebook @@ -33,7 +36,7 @@   Pometry   -🧙🏻‍ Tutorial +🧙🏻‍ Tutorial   🐛 Report a Bug   @@ -42,10 +45,10 @@
-Raphtory is an in-memory graph tool written in Rust with friendly Python APIs on top. It is blazingly fast, scales to hundreds of millions of edges +Raphtory is an in-memory vectorised graph database written in Rust with friendly Python APIs on top. It is blazingly fast, scales to hundreds of millions of edges on your laptop, and can be dropped into your existing pipelines with a simple `pip install raphtory`. -It supports time traveling, multilayer modelling, and advanced analytics beyond simple querying like community evolution, dynamic scoring, and mining temporal motifs. +It supports time traveling, full-text search, multilayer modelling, and advanced analytics beyond simple querying like automatic risk detection, dynamic scoring, and temporal motifs. If you wish to contribute, check out the open [list of issues](https://github.com/Pometry/Raphtory/issues), [bounty board](https://github.com/Raphtory/Raphtory/discussions/categories/bounty-board) or hit us up directly on [slack](https://join.slack.com/t/raphtory/shared_invite/zt-xbebws9j-VgPIFRleJFJBwmpf81tvxA). Successful contributions will be reward with swizzling swag! 
@@ -54,6 +57,7 @@ If you wish to contribute, check out the open [list of issues](https://github.co ```python from raphtory import Graph +from raphtory import algorithms as algo import pandas as pd # Create a new graph @@ -82,12 +86,16 @@ print(pd.DataFrame(results[1:], columns=results[0])) # Grab an edge, explore the history of its 'weight' cb_edge = graph.edge("Bob","Charlie") -weight_history = cb_edge.property_history("weight") +weight_history = cb_edge.properties.temporal.get("weight").items() print("The edge between Bob and Charlie has the following weight history:", weight_history) # Compare this weight between time 2 and time 3 weight_change = cb_edge.at(2)["weight"] - cb_edge.at(3)["weight"] print("The weight of the edge between Bob and Charlie has changed by",weight_change,"pts") + +# Run pagerank and ask for the top ranked node +top_node = algo.pagerank(graph).top_k(1) +print("The most important node in the graph is",top_node[0][0],"with a score of",top_node[0][1]) ``` ```a @@ -107,8 +115,113 @@ Graph(number_of_edges=2, number_of_vertices=3, earliest_time=1, latest_time=3) The edge between Bob and Charlie has the following weight history: [(2, 5.0), (3, -15.0)] The weight of the edge between Bob and Charlie has changed by 20.0 pts + +The most important node in the graph is Charlie with a score of 0.4744116163405977 ``` +## GraphQL + +### Create/Load a graph + +Save a raphtory graph and set the `GRAPH_DIRECTORY` environment variable to point to the directory containing the graph. + +
+ + +Alternatively you can run the code below to generate a graph. + + +```bash +mkdir -p /tmp/graphs +mkdir -p examples/rust/src/bin/lotr/data/ +tail -n +2 resource/lotr.csv > examples/rust/src/bin/lotr/data/lotr.csv + +cd examples/rust && cargo run --bin lotr -r + +cp examples/rust/src/bin/lotr/data/graphdb.bincode /tmp/graphs/lotr.bincode +``` + +
+ + +### Run the GraphQL server + +The code below will run GraphQL with a UI at `localhost:1736`. + +GraphQL will look for graph files in `/tmp/graphs` or in the path set in the `GRAPH_DIRECTORY` environment variable. + +```bash +cd raphtory-graphql && cargo run -r +``` + +
+ℹ️ Warning: Server must have the same version + environment +The GraphQL server must be running in the same environment (i.e. debug or release) and the same Raphtory version as the generated graph; otherwise it will throw errors due to incompatible graph metadata across versions. +
+ +
+The following will be output upon a successful launch: + +```bash +warning: `raphtory` (lib) generated 17 warnings (run `cargo fix --lib -p raphtory` to apply 13 suggestions) + Finished release [optimized] target(s) in 0.91s + Running `Raphtory/target/release/raphtory-graphql` +loading graph from /tmp/graphs/lotr.bincode +Playground: http://localhost:1736 + 2023-08-11T14:36:52.444203Z INFO poem::server: listening, addr: socket://0.0.0.0:1736 + at /Users/pometry/.cargo/registry/src/github.com-1ecc6299db9ec823/poem-1.3.56/src/server.rs:109 + + 2023-08-11T14:36:52.444257Z INFO poem::server: server started + at /Users/pometry/.cargo/registry/src/github.com-1ecc6299db9ec823/poem-1.3.56/src/server.rs:111 +``` +
+ + +### Execute a query + +Go to the Playground at `http://localhost:1736` and execute the following commands: + +Query: +```bash + query GetNodes($graphName: String!) { + graph(name: $graphName) { + nodes { + name + } + } + } +``` + +Query Variables: +```bash +{ + "graphName": "lotr.bincode" +} +``` + +Expected Result: +```bash +{ + "data": { + "graph": { + "nodes": [ + { + "name": "Gandalf" + }, + { + "name": "Elrond" + }, + { + "name": "Frodo" + }, + { + "name": "Bilbo" + }, + ... +``` + + + ## Installing Raphtory diff --git a/benchmark/benchmark_base.py b/comparison-benchmark/python/benchmark_base.py similarity index 69% rename from benchmark/benchmark_base.py rename to comparison-benchmark/python/benchmark_base.py index a3d53c9e6a..b8ad8ae793 100755 --- a/benchmark/benchmark_base.py +++ b/comparison-benchmark/python/benchmark_base.py @@ -2,25 +2,38 @@ ### This class is used by the benchmarking scripts to benchmark the graph tools import time from abc import ABC, abstractmethod -import docker + +try: + import docker +except ImportError as e: + print("IMPORT ERROR, docker not found...") import os import multiprocessing class BenchmarkBase(ABC): - - def start_docker(self, image_name, container_folder, exec_commands, envs={}, ports={}, image_path=None, wait=0, start_cmd=None): + def start_docker( + self, + image_name, + container_folder, + exec_commands, + envs={}, + ports={}, + image_path=None, + wait=0, + start_cmd=None, + ): if envs is None: envs = {} - print('Creating Docker client...') + print("Creating Docker client...") self.docker = docker.from_env() - print('Pulling Docker image...') + print("Pulling Docker image...") self.docker.images.pull(image_name) - print('Defining volumes...') + print("Defining volumes...") local_folder = os.path.abspath(os.getcwd()) - volumes = {local_folder: {'bind': container_folder, 'mode': 'z'}} + volumes = {local_folder: {"bind": container_folder, "mode": "z"}} if image_path: image, build_logs = self.docker.images.build( @@ 
-28,18 +41,18 @@ def start_docker(self, image_name, container_folder, exec_commands, envs={}, por ) image_name = image.id - print('Running Docker container & benchmark...') + print("Running Docker container & benchmark...") if start_cmd is None: self.container = self.docker.containers.run( image_name, volumes=volumes, detach=True, - stdin_open = True, + stdin_open=True, tty=True, environment=envs, ports=ports, - mem_limit='4g', + mem_limit="4g", ) else: self.container = self.docker.containers.run( @@ -47,21 +60,21 @@ def start_docker(self, image_name, container_folder, exec_commands, envs={}, por command=start_cmd, volumes=volumes, detach=True, - stdin_open = True, + stdin_open=True, tty=True, environment=envs, ports=ports, - mem_limit='4g', + mem_limit="4g", ) time.sleep(wait) try: for cmd in exec_commands: - print(f'Running command {cmd}...') + print(f"Running command {cmd}...") _, stream = self.container.exec_run(cmd, stream=True) for data in stream: - print(data.decode(), end='') + print(data.decode(), end="") print() del stream # print(exec_command) @@ -74,16 +87,20 @@ def start_docker(self, image_name, container_folder, exec_commands, envs={}, por print("Completed command...") except Exception as e: print(e) - print('Error running command') + print("Error running command") self.container.stop() self.container.remove() - return 1, 'Error running command' + return 1, "Error running command" - print('Benchmark completed, retrieving results...') - file_path = '/tmp/bench-*.csv' - file_contents = self.container.exec_run(['/bin/bash', '-c', f'cat {file_path}']).output.decode('utf-8').strip() + print("Benchmark completed, retrieving results...") + file_path = "/tmp/bench-*.csv" + file_contents = ( + self.container.exec_run(["/bin/bash", "-c", f"cat {file_path}"]) + .output.decode("utf-8") + .strip() + ) - print('Removing container...') + print("Removing container...") self.container.stop() self.container.remove() diff --git a/benchmark/benchmark_driver.py 
b/comparison-benchmark/python/benchmark_driver.py similarity index 65% rename from benchmark/benchmark_driver.py rename to comparison-benchmark/python/benchmark_driver.py index a7ed78ccf2..cf00467771 100755 --- a/benchmark/benchmark_driver.py +++ b/comparison-benchmark/python/benchmark_driver.py @@ -8,14 +8,22 @@ import os from io import StringIO -fns = ['setup', 'degree', 'out_neighbours', 'page_rank', 'connected_components'] +fns = ["setup", "degree", "out_neighbours", "page_rank", "connected_components"] def process_arguments(): - parser = argparse.ArgumentParser(description='benchmark args') - parser.add_argument('--docker', action=argparse.BooleanOptionalAction, - help='Launch with docker containers, --no-docker to run locally', default=True) - parser.add_argument('-b', '--bench', type=str, help=""" + parser = argparse.ArgumentParser(description="benchmark args") + parser.add_argument( + "--docker", + action=argparse.BooleanOptionalAction, + help="Launch with docker containers, --no-docker to run locally", + default=True, + ) + parser.add_argument( + "-b", + "--bench", + type=str, + help=""" Run specific benchmark, default: Goes to Menu (if docker runs all), all: Run All @@ -28,7 +36,9 @@ def process_arguments(): mem: Run Memgraph Benchmark cozo: Run CozoDB Benchmark exit: Exit - """, default='menu') + """, + default="menu", + ) return parser.parse_args() @@ -51,26 +61,26 @@ def display_menu(): def setup(): return { - 'all': 'ALL', - 'download': 'DOWNLOAD', - 'r': RaphtoryBench, - 'gt': GraphToolBench, - 'k': KuzuBench, - 'nx': NetworkXBench, - 'neo': Neo4jBench, - 'mem': MemgraphBench, - 'cozo': CozoDBBench + "all": "ALL", + "download": "DOWNLOAD", + "r": RaphtoryBench, + "gt": GraphToolBench, + "k": KuzuBench, + "nx": NetworkXBench, + "neo": Neo4jBench, + "mem": MemgraphBench, + "cozo": CozoDBBench, } def run_benchmark(choice, docker=False): benchmarks_to_run = [] - if choice.lower() == 'all': + if choice.lower() == "all": for key in setup().keys(): - if key 
== 'menu' or key == 'all' or key == 'download': + if key == "menu" or key == "all" or key == "download": continue benchmarks_to_run.append(key) - elif choice == 'download' or choice == 'menu': + elif choice == "download" or choice == "menu": return elif choice in setup().keys(): benchmarks_to_run.append(choice) @@ -79,6 +89,8 @@ def run_benchmark(choice, docker=False): print("Running benchmarks: " + str(benchmarks_to_run)) for key in benchmarks_to_run: driver = setup()[key] + print(key) + print(setup()) if docker: print("** Running dockerized benchmark " + str(key) + "...") print("Starting docker container...") @@ -88,23 +100,25 @@ def run_benchmark(choice, docker=False): results[driver.name()] = logs else: print("** Running for " + driver.name() + "...") - times = '' - fn_header = '' + times = "" + fn_header = "" for fn in fns: print("** Running " + fn + "...") start_time = time.time() getattr(driver, fn)() end_time = time.time() print(fn + " time: " + str(end_time - start_time)) - fn_header += fn + ',' - if driver.name() == 'Neo4j' and fn == 'setup': + fn_header += fn + "," + if driver.name() == "Neo4j" and fn == "setup": # take away 15 seconds for the sleep time when restarting the database end_time = end_time - 50 - times += str(end_time - start_time) + ',' + times += str(end_time - start_time) + "," fn_header = fn_header[:-1] times = times[:-1] - results[driver.name()] = fn_header + '\n' + times - pd.DataFrame([times.split(',')], columns=fns).to_csv('/tmp/bench-'+driver.name()+'-'+str(time.time())+'.csv') + results[driver.name()] = fn_header + "\n" + times + pd.DataFrame([times.split(",")], columns=fns).to_csv( + "/tmp/bench-" + driver.name() + "-" + str(time.time()) + ".csv" + ) return results @@ -116,10 +130,10 @@ def print_table(data): _data[key] = pd.read_csv(StringIO(value)) merged_df = pd.concat([df.assign(key=key) for key, df in _data.items()]) col = merged_df.pop("key") - if 'Unnamed: 0' in merged_df.columns: - merged_df.drop('Unnamed: 0', axis=1, 
inplace=True) - merged_df.insert(0, 'System', col) - print(merged_df.to_string(index=False, justify='left')) + if "Unnamed: 0" in merged_df.columns: + merged_df.drop("Unnamed: 0", axis=1, inplace=True) + merged_df.insert(0, "System", col) + print(merged_df.to_string(index=False, justify="left")) def dl_file(url, path): @@ -127,7 +141,7 @@ def dl_file(url, path): print("Downloading " + url + "...") r = requests.get(url, stream=True) if r.status_code == 200: - with open(path, 'wb') as f: + with open(path, "wb") as f: f.write(r.raw.read()) else: print("Error downloading data") @@ -146,38 +160,38 @@ def download_data(): # Download the data print("Downloading data...") urls = { - 'simple-profiles.csv.gz': 'https://raw.githubusercontent.com/Raphtory/Data/main/simple-profiles.csv.gz', - 'simple-relationships.csv.gz': 'https://media.githubusercontent.com/media/Raphtory/Data/main/simple-relationships.csv.gz' + "simple-profiles.csv.gz": "https://osf.io/download/w2xns/", + "simple-relationships.csv.gz": "https://osf.io/download/nbq6h/", } # make the data directory - create_directory('data') + create_directory("data") for name, url in urls.items(): - dl_file(url, 'data/' + name) + dl_file(url, "data/" + name) # Unzip the files for name in urls.keys(): print("Unzipping " + name + "...") - with gzip.open('data/' + name, 'rb') as f_in: - with open('data/' + name[:-3], 'wb') as f_out: + with gzip.open("data/" + name, "rb") as f_in: + with open("data/" + name[:-3], "wb") as f_out: shutil.copyfileobj(f_in, f_out) print("Done unzipping " + name + "...") - os.remove('data/' + name) + os.remove("data/" + name) # return the file paths - return 'data/simple-profiles.csv', 'data/simple-relationships.csv' + return "data/simple-profiles.csv", "data/simple-relationships.csv" def main(docker, choice): print("Welcome to the Raphtory Benchmarking Tool") results = {} try: - if choice == 'menu': + if choice == "menu": choice = display_menu() - if choice == 'download' or choice == 1: + if choice 
== "download" or choice == 1: download_data() - elif choice == 'exit' or choice not in setup(): + elif choice == "exit" or choice not in setup(): print(str(choice) + ". Exiting...") else: results = run_benchmark(choice, docker) diff --git a/benchmark/benchmark_imports.py b/comparison-benchmark/python/benchmark_imports.py similarity index 98% rename from benchmark/benchmark_imports.py rename to comparison-benchmark/python/benchmark_imports.py index 8191457e3b..843052c688 100755 --- a/benchmark/benchmark_imports.py +++ b/comparison-benchmark/python/benchmark_imports.py @@ -8,42 +8,49 @@ try: from raphtory_bench import RaphtoryBench + RaphtoryBench = RaphtoryBench() except ImportError as e: pass try: from kuzu_bench import KuzuBench + KuzuBench = KuzuBench() except ImportError: pass try: from networkx_bench import NetworkXBench + NetworkXBench = NetworkXBench() except ImportError as e: pass try: from neo4j_bench import Neo4jBench + Neo4jBench = Neo4jBench() except ImportError: pass try: from graphtool_bench import GraphToolBench + GraphToolBench = GraphToolBench() except ImportError as e: pass try: from memgraph_bench import MemgraphBench + MemgraphBench = MemgraphBench() except ImportError as e: pass try: from cozo_bench import CozoDBBench + CozoDBBench = CozoDBBench() except ImportError: - pass \ No newline at end of file + pass diff --git a/benchmark/cozo_bench.py b/comparison-benchmark/python/cozo_bench.py similarity index 70% rename from benchmark/cozo_bench.py rename to comparison-benchmark/python/cozo_bench.py index c83ae9e19e..19d968d2ff 100755 --- a/benchmark/cozo_bench.py +++ b/comparison-benchmark/python/cozo_bench.py @@ -7,15 +7,16 @@ class CozoDBBench(BenchmarkBase): - def start_docker(self, **kwargs): - image_name = 'python:3.10-bullseye' - container_folder = '/app/data' + image_name = "python:3.10-bullseye" + container_folder = "/app/data" exec_commands = [ - 'pip install requests docker pycozo[embedded,pandas]', - '/bin/bash -c "cd /app/data;python 
benchmark_driver.py --no-docker --bench cozo"' + "pip install requests docker pycozo[embedded,pandas]", + '/bin/bash -c "cd /app/data;python benchmark_driver.py --no-docker --bench cozo"', ] - code, contents = super().start_docker(image_name, container_folder, exec_commands) + code, contents = super().start_docker( + image_name, container_folder, exec_commands + ) return code, contents def shutdown(self): @@ -33,7 +34,8 @@ def setup(self): self.client = Client() self.client.run("{:create user { code: Int }}") self.client.run("{:create friend { fr: Int, to: Int }}") - self.client.run(""" + self.client.run( + """ res[user] <~ CsvReader(types: ['Int'], url: 'file://./data/simple-profiles.csv', @@ -45,8 +47,10 @@ def setup(self): :replace user { code: Int } - """) - self.client.run(""" + """ + ) + self.client.run( + """ res[] <~ CsvReader(types: ['Int', 'Int'], url: 'file://./data/simple-relationships.csv', @@ -56,10 +60,13 @@ def setup(self): res[fr, to] :replace friend { fr: Int, to: Int } - """) + """ + ) def degree(self): - return self.client.run("?[user_id, total_degree, out_degree, in_degree] <~ DegreeCentrality(*friend[])") + return self.client.run( + "?[user_id, total_degree, out_degree, in_degree] <~ DegreeCentrality(*friend[])" + ) def out_neighbours(self): return self.degree() @@ -68,4 +75,6 @@ def page_rank(self): return self.client.run("?[user_id, page_rank] <~ PageRank(*friend[])") def connected_components(self): - return self.client.run("?[user_id, component] <~ ConnectedComponents(*friend[])") + return self.client.run( + "?[user_id, component] <~ ConnectedComponents(*friend[])" + ) diff --git a/benchmark/graphtool_bench.py b/comparison-benchmark/python/graphtool_bench.py similarity index 69% rename from benchmark/graphtool_bench.py rename to comparison-benchmark/python/graphtool_bench.py index de0b008a93..86e4ac7a8e 100755 --- a/benchmark/graphtool_bench.py +++ b/comparison-benchmark/python/graphtool_bench.py @@ -12,14 +12,16 @@ class 
GraphToolBench(BenchmarkBase): def start_docker(self, **kwargs): - image_name = 'tiagopeixoto/graph-tool:latest' - container_folder = '/app/data' + image_name = "tiagopeixoto/graph-tool:latest" + container_folder = "/app/data" exec_commands = [ - 'python -m ensurepip --upgrade', - 'python -m pip install requests tqdm docker pandas', - '/bin/bash -c "cd /app/data;python benchmark_driver.py --no-docker --bench gt"' + "python -m ensurepip --upgrade", + "python -m pip install requests tqdm docker pandas", + '/bin/bash -c "cd /app/data;python benchmark_driver.py --no-docker --bench gt"', ] - code, contents = super().start_docker(image_name, container_folder, exec_commands) + code, contents = super().start_docker( + image_name, container_folder, exec_commands + ) return code, contents def shutdown(self): @@ -34,13 +36,13 @@ def name(self): def setup(self): self.graph = gt.Graph() # with gzip.open(relationships_file, 'rt') as f: - with open(simple_relationship_file, 'r') as f: - reader = csv.reader(f, delimiter='\t') + with open(simple_relationship_file, "r") as f: + reader = csv.reader(f, delimiter="\t") for row in reader: # , total=30622564): self.graph.add_edge(int(row[0]), int(row[1])) def degree(self): - self.graph.degree_property_map('total').get_array() + self.graph.degree_property_map("total").get_array() def out_neighbours(self): [len(list(v.out_neighbours())) for v in self.graph.vertices()] diff --git a/benchmark/kuzu_bench.py b/comparison-benchmark/python/kuzu_bench.py similarity index 67% rename from benchmark/kuzu_bench.py rename to comparison-benchmark/python/kuzu_bench.py index cd42e435e4..45596b1468 100755 --- a/benchmark/kuzu_bench.py +++ b/comparison-benchmark/python/kuzu_bench.py @@ -1,4 +1,5 @@ from benchmark_base import BenchmarkBase + # Dont fail if not installed try: import kuzu @@ -7,15 +8,16 @@ class KuzuBench(BenchmarkBase): - def start_docker(self): - image_name = 'python:3.10-bullseye' - container_folder = '/app/data' + image_name = 
"python:3.10-bullseye" + container_folder = "/app/data" exec_commands = [ - 'pip install requests tqdm docker kuzu pandas numpy scipy', - '/bin/bash -c "cd /app/data;python benchmark_driver.py --no-docker --bench k"' + "pip install requests tqdm docker kuzu pandas numpy scipy", + '/bin/bash -c "cd /app/data;python benchmark_driver.py --no-docker --bench k"', ] - code, contents = super().start_docker(image_name, container_folder, exec_commands) + code, contents = super().start_docker( + image_name, container_folder, exec_commands + ) return code, contents def shutdown(self): @@ -33,7 +35,7 @@ def run_query(self, query): return res def setup(self): - self.db = kuzu.Database('/tmp/testdb') + self.db = kuzu.Database("/tmp/testdb") self.conn = kuzu.Connection(self.db) self.run_query("CREATE NODE TABLE User(id INT64, PRIMARY KEY (id))") self.run_query("CREATE REL TABLE Follows(FROM User TO User)") @@ -41,14 +43,15 @@ def setup(self): self.run_query('COPY Follows FROM "data/simple-relationships.csv" (DELIM="\t")') def degree(self): - res = self.run_query('MATCH (a:User)-[f:Follows]->(b:User) RETURN a.id,COUNT(f)') + res = self.run_query( + "MATCH (a:User)-[f:Follows]->(b:User) RETURN a.id,COUNT(f)" + ) df = res.get_as_df() def out_neighbours(self): - self.conn.set_query_timeout(300000) # 300 seconds - res = self.run_query('MATCH (u:User)-[:Follows]->(n)' - 'RETURN COUNT(n.id)') - # 'RETURN u.id, COLLECT(n.id) AS out_neighbours') + self.conn.set_query_timeout(300000) # 300 seconds + res = self.run_query("MATCH (u:User)-[:Follows]->(n)" "RETURN COUNT(n.id)") + # 'RETURN u.id, COLLECT(n.id) AS out_neighbours') df = res.get_as_df() def page_rank(self): diff --git a/benchmark/memgraph_bench.py b/comparison-benchmark/python/memgraph_bench.py similarity index 77% rename from benchmark/memgraph_bench.py rename to comparison-benchmark/python/memgraph_bench.py index 6a90d25bc2..d065d452fa 100755 --- a/benchmark/memgraph_bench.py +++ b/comparison-benchmark/python/memgraph_bench.py 
@@ -12,13 +12,13 @@ class MemgraphBench(BenchmarkBase): def start_docker(self, **kwargs): - image_name = 'memgraph/memgraph-platform:latest' - container_folder = '/app/data' + image_name = "memgraph/memgraph-platform:latest" + container_folder = "/app/data" exec_commands = [ '/bin/bash -c "apt update && apt install -y libssl-dev"', '/bin/bash -c "python3 -m pip install gqlalchemy requests tqdm docker pandas"', '/bin/bash -c "cp -R /app/data/data /tmp/;chmod 777 -R /tmp/data"', - '/bin/bash -c "cd /app/data;python3 benchmark_driver.py --no-docker --bench mem"' + '/bin/bash -c "cd /app/data;python3 benchmark_driver.py --no-docker --bench mem"', ] # ports = { # '7444': '7444', @@ -30,7 +30,6 @@ def start_docker(self, **kwargs): container_folder=container_folder, exec_commands=exec_commands, # ports=ports, - ) return code, contents @@ -45,19 +44,23 @@ def __init__(self): def import_data(self): print("loading nodes") - query = 'LOAD CSV FROM "/tmp/data/simple-profiles.csv" NO HEADER DELIMITER "\t" AS row '\ - 'CREATE (n:Node {id: row[0]});' + query = ( + 'LOAD CSV FROM "/tmp/data/simple-profiles.csv" NO HEADER DELIMITER "\t" AS row ' + "CREATE (n:Node {id: row[0]});" + ) self.graph.execute(query) print("Creating index") - query = 'CREATE INDEX ON :Node(id);' + query = "CREATE INDEX ON :Node(id);" self.graph.execute(query) print("loading relationships") - query = 'LOAD CSV FROM "/tmp/data/simple-relationships.csv" NO HEADER DELIMITER "\t" AS row ' \ - 'MATCH (n1:Node {id: row[0]}), (n2:Node {id: row[1]}) CREATE (n1)-[:FOLLOWS]->(n2);' + query = ( + 'LOAD CSV FROM "/tmp/data/simple-relationships.csv" NO HEADER DELIMITER "\t" AS row ' + "MATCH (n1:Node {id: row[0]}), (n2:Node {id: row[1]}) CREATE (n1)-[:FOLLOWS]->(n2);" + ) self.graph.execute(query) def setup(self): - self.graph = Memgraph(host='127.0.0.1', port=7687) + self.graph = Memgraph(host="127.0.0.1", port=7687) # query = "MATCH (n) DETACH DELETE n" # self.graph.execute(query) self.import_data() diff --git 
a/benchmark/neo4j_bench.py b/comparison-benchmark/python/neo4j_bench.py similarity index 60% rename from benchmark/neo4j_bench.py rename to comparison-benchmark/python/neo4j_bench.py index e99f5ee6e9..3570bddf8a 100755 --- a/benchmark/neo4j_bench.py +++ b/comparison-benchmark/python/neo4j_bench.py @@ -14,28 +14,34 @@ def create_graph_projection(tx): - tx.run(""" + tx.run( + """ CALL gds.graph.project.cypher( 'social', 'MATCH (n) RETURN id(n) AS id', 'MATCH (n)-[r:FOLLOWS]->(m) RETURN id(n) AS source, id(m) AS target') YIELD graphName AS graph, nodeQuery, nodeCount AS nodes, relationshipQuery, relationshipCount AS rels - """) + """ + ) def query_degree(tx): - result = tx.run(""" + result = tx.run( + """ MATCH p=(n)-[r:FOLLOWS]->() RETURN n.id, COUNT(p) - """) + """ + ) return list(result) def get_out_neighbors(tx): - result = tx.run(""" + result = tx.run( + """ MATCH p=(n)-[:FOLLOWS]->(neighbor) RETURN n.id, COUNT(p) - """) + """ + ) return list(result) @@ -45,58 +51,77 @@ def run_pagerank(tx): def run_connected_components(tx): - result = tx.run(""" + result = tx.run( + """ CALL gds.wcc.stream("social") - """) + """ + ) return list(result) def execute_bash_command(command, background=False): print("Executing command: ", command) if background: - subprocess.Popen(command, shell=True, stdout=subprocess.PIPE, stderr=subprocess.PIPE) + subprocess.Popen( + command, shell=True, stdout=subprocess.PIPE, stderr=subprocess.PIPE + ) return - process = subprocess.Popen(command, shell=True, stdout=subprocess.PIPE, stderr=subprocess.PIPE) + process = subprocess.Popen( + command, shell=True, stdout=subprocess.PIPE, stderr=subprocess.PIPE + ) stdout, stderr = process.communicate() - return stdout.decode('utf-8'), stderr.decode('utf-8') + return stdout.decode("utf-8"), stderr.decode("utf-8") def write_array_to_csv(arr, file_path): - with open(file_path, 'w', newline='') as csv_file: - writer = csv.writer(csv_file, delimiter='\t') + with open(file_path, "w", newline="") as csv_file: 
+ writer = csv.writer(csv_file, delimiter="\t") writer.writerows(arr) def modify_data(): print("Generating data...") - file_dir = os.path.abspath(os.getcwd()) + '/data/' + file_dir = os.path.abspath(os.getcwd()) + "/data/" print("File dir: ", file_dir) - if 'simple-profiles-header-neo4j.csv' not in os.listdir(file_dir): + if "simple-profiles-header-neo4j.csv" not in os.listdir(file_dir): print("Generating node header") - write_array_to_csv([['node:ID', 'name']], file_dir + 'simple-profiles-header-neo4j.csv') + write_array_to_csv( + [["node:ID", "name"]], file_dir + "simple-profiles-header-neo4j.csv" + ) print("Generating relationship header") - write_array_to_csv([['node:START_ID', 'node:END_ID', ':TYPE']], - file_dir + 'simple-relationships-headers-neo4j.csv') + write_array_to_csv( + [["node:START_ID", "node:END_ID", ":TYPE"]], + file_dir + "simple-relationships-headers-neo4j.csv", + ) print("Generating node data") - df = pd.read_csv(file_dir + 'simple-profiles.csv', sep='\t', header=None) - df['copy'] = df[0].copy() - df.to_csv(file_dir + 'simple-profiles-neo4j.csv', index=None, header=None, sep='\t') + df = pd.read_csv(file_dir + "simple-profiles.csv", sep="\t", header=None) + df["copy"] = df[0].copy() + df.to_csv( + file_dir + "simple-profiles-neo4j.csv", index=None, header=None, sep="\t" + ) print("Generating relationship data") - df = pd.read_csv(file_dir + 'simple-relationships.csv', sep='\t', header=None) - df['type'] = 'FOLLOWS' - df.to_csv(file_dir + 'simple-relationships-neo4j.csv', sep='\t', index=None, header=None) + df = pd.read_csv(file_dir + "simple-relationships.csv", sep="\t", header=None) + df["type"] = "FOLLOWS" + df.to_csv( + file_dir + "simple-relationships-neo4j.csv", + sep="\t", + index=None, + header=None, + ) print("Done") def import_data(): - return execute_bash_command("neo4j-admin database import full --overwrite-destination --delimiter='TAB' " - "--nodes=/var/lib/neo4j/import/data2/data/simple-profiles-header-neo4j.csv," - 
"/var/lib/neo4j/import/data2/data/simple-profiles-neo4j.csv " - "--relationships=/var/lib/neo4j/import/data2/data/simple-relationships-headers-neo4j.csv," - "/var/lib/neo4j/import/data2/data/simple-relationships-neo4j.csv neo4j") + return execute_bash_command( + "neo4j-admin database import full --overwrite-destination --delimiter='TAB' " + "--nodes=/var/lib/neo4j/import/data2/data/simple-profiles-header-neo4j.csv," + "/var/lib/neo4j/import/data2/data/simple-profiles-neo4j.csv " + "--relationships=/var/lib/neo4j/import/data2/data/simple-relationships-headers-neo4j.csv," + "/var/lib/neo4j/import/data2/data/simple-relationships-neo4j.csv neo4j" + ) # tx.run(""" # LOAD CSV FROM 'file:///data2/data/simple-relationships.csv' AS row # FIELDTERMINATOR '\t' @@ -110,16 +135,13 @@ def import_data(): class Neo4jBench(BenchmarkBase): def start_docker(self, **kwargs): modify_data() - image_name = 'neo4j:5.8.0' - container_folder = '/var/lib/neo4j/import/data2/' + image_name = "neo4j:5.8.0" + container_folder = "/var/lib/neo4j/import/data2/" envs = { - 'NEO4J_AUTH': 'neo4j/password', - 'NEO4J_PLUGINS': '["graph-data-science"]' - } - ports = { - '7474': '7474', - '7687': '7687' + "NEO4J_AUTH": "neo4j/password", + "NEO4J_PLUGINS": '["graph-data-science"]', } + ports = {"7474": "7474", "7687": "7687"} exec_commands = [ '/bin/bash -c "apt update && apt install python3-pip -y"', '/bin/bash -c "python3 -m pip install neo4j requests tqdm pandas numpy docker"', @@ -128,9 +150,15 @@ def start_docker(self, **kwargs): '/bin/bash -c "cd /var/lib/neo4j/import/data2/; python3 benchmark_driver.py --no-docker --bench neo"', ] # image_path = 'DockerFiles/pyneo' image_path ports - code, contents = super().start_docker(image_name=image_name, container_folder=container_folder, - exec_commands=exec_commands, envs=envs, wait=35, ports=ports, - start_cmd='tail -f /dev/null') + code, contents = super().start_docker( + image_name=image_name, + container_folder=container_folder, + 
exec_commands=exec_commands, + envs=envs, + wait=35, + ports=ports, + start_cmd="tail -f /dev/null", + ) return code, contents def shutdown(self): @@ -139,7 +167,6 @@ def shutdown(self): def __init__(self): self.driver = None - def name(self): return "Neo4j" @@ -154,9 +181,12 @@ def setup(self): print("status: ", stout) print("error: ", sterr) print("Starting neo4j") - execute_bash_command('export NEO4J_AUTH="neo4j/password"; export NEO4J_PLUGINS=\'[' - '"graph-data-science"]\';/bin/bash -c "tini -s -g -- ' - '/startup/docker-entrypoint.sh neo4j start &"', background=True) + execute_bash_command( + 'export NEO4J_AUTH="neo4j/password"; export NEO4J_PLUGINS=\'[' + '"graph-data-science"]\';/bin/bash -c "tini -s -g -- ' + '/startup/docker-entrypoint.sh neo4j start &"', + background=True, + ) print("Sleeping for 50 seconds...") time.sleep(50) # print("Updating password") diff --git a/benchmark/networkx_bench.py b/comparison-benchmark/python/networkx_bench.py similarity index 68% rename from benchmark/networkx_bench.py rename to comparison-benchmark/python/networkx_bench.py index 03aede1713..28b9894ee8 100755 --- a/benchmark/networkx_bench.py +++ b/comparison-benchmark/python/networkx_bench.py @@ -1,5 +1,6 @@ from benchmark_base import BenchmarkBase import csv + # Dont fail if not imported locally try: import networkx as nx @@ -12,13 +13,15 @@ class NetworkXBench(BenchmarkBase): def start_docker(self, **kwargs): - image_name = 'python:3.10-bullseye' - container_folder = '/app/data' + image_name = "python:3.10-bullseye" + container_folder = "/app/data" exec_commands = [ - 'pip install requests tqdm docker networkx pandas numpy scipy', - '/bin/bash -c "cd /app/data;python benchmark_driver.py --no-docker --bench nx"' + "pip install requests tqdm docker networkx pandas numpy scipy", + '/bin/bash -c "cd /app/data;python benchmark_driver.py --no-docker --bench nx"', ] - code, contents = super().start_docker(image_name, container_folder, exec_commands) + code, contents = 
super().start_docker( + image_name, container_folder, exec_commands + ) return code, contents def shutdown(self): @@ -33,8 +36,8 @@ def name(self): def setup(self): self.graph = nx.DiGraph() - with open(simple_relationship_file, 'r') as f: - reader = csv.reader(f, delimiter='\t') + with open(simple_relationship_file, "r") as f: + reader = csv.reader(f, delimiter="\t") for row in reader: self.graph.add_edge(int(row[0]), int(row[1])) @@ -52,4 +55,6 @@ def page_rank(self): return nx.pagerank(self.graph) def connected_components(self): - return [len(comp) for comp in nx.connected_components(self.graph.to_undirected())] + return [ + len(comp) for comp in nx.connected_components(self.graph.to_undirected()) + ] diff --git a/benchmark/profile_bench.py b/comparison-benchmark/python/profile_bench.py similarity index 91% rename from benchmark/profile_bench.py rename to comparison-benchmark/python/profile_bench.py index 3ceb85c2ac..09e32a13a1 100755 --- a/benchmark/profile_bench.py +++ b/comparison-benchmark/python/profile_bench.py @@ -28,13 +28,13 @@ def setup(): 3: KuzuBench(), 4: NetworkXBench(), 5: Neo4jBench(), - 6: MemgraphBench() + 6: MemgraphBench(), } def run_benchmark(choice): driver = setup()[choice] - fns = ['setup', 'degree', 'out_neighbours', 'page_rank', 'connected_components'] + fns = ["setup", "degree", "out_neighbours", "page_rank", "connected_components"] for fn in fns: print("** Running " + fn + "...") start_time = time.time() diff --git a/benchmark/raphtory_bench.py b/comparison-benchmark/python/raphtory_bench.py similarity index 66% rename from benchmark/raphtory_bench.py rename to comparison-benchmark/python/raphtory_bench.py index 462dec9906..180eafa9dd 100755 --- a/benchmark/raphtory_bench.py +++ b/comparison-benchmark/python/raphtory_bench.py @@ -7,22 +7,28 @@ import raphtory from tqdm import tqdm from raphtory.algorithms import pagerank, weakly_connected_components -except ImportError: - pass +except ImportError as e: + print("IMPORT ERROR") + 
print(e) + print("Cannot continue. Exiting") + import sys + + sys.exit(1) simple_relationship_file = "data/simple-relationships.csv" class RaphtoryBench(BenchmarkBase): - def start_docker(self, **kwargs): - image_name = 'python:3.10-bullseye' - container_folder = '/app/data' + image_name = "python:3.10-bullseye" + container_folder = "/app/data" exec_commands = [ - 'pip install raphtory requests tqdm pandas numpy docker', - '/bin/bash -c "cd /app/data;python benchmark_driver.py --no-docker --bench r"' + "pip install raphtory requests tqdm pandas numpy docker", + '/bin/bash -c "cd /app/data;python benchmark_driver.py --no-docker --bench r"', ] - code, contents = super().start_docker(image_name, container_folder, exec_commands) + code, contents = super().start_docker( + image_name, container_folder, exec_commands + ) return code, contents def shutdown(self): @@ -36,9 +42,9 @@ def __init__(self): def setup(self): # Load edges - self.graph = raphtory.Graph(multiprocessing.cpu_count()) - with open(simple_relationship_file, 'r') as f: - reader = csv.reader(f, delimiter='\t') + self.graph = raphtory.Graph() + with open(simple_relationship_file, "r") as f: + reader = csv.reader(f, delimiter="\t") for row in reader: self.graph.add_edge(1, row[0], row[1], {}) diff --git a/benchmark/readme.md b/comparison-benchmark/readme.md similarity index 70% rename from benchmark/readme.md rename to comparison-benchmark/readme.md index 0c3ad2a36f..c4b9437518 100755 --- a/benchmark/readme.md +++ b/comparison-benchmark/readme.md @@ -3,6 +3,66 @@ This is the raphtory benchmarking suite. It is designed to test the performance of raphtory against other graph processing systems. +There are two benchmarks suites, one for python with support for multiple systems, and one for rust with support for + raphtory only. + + +## Rust Suite + +This only does a light benchmark of raphtory, as it is designed to be used standalone. 
+ + Raphtory Quick Benchmark + + Usage: raphtory-rust-benchmark [OPTIONS] + + Options: + --header Set if the file has a header, default is False + --delimiter Delimiter of the csv file [default: "\t"] + --file-path Path to a csv file [default: ] + --from-column Position of the from column in the csv [default: 0] + --to-column Position of the to column in the csv [default: 1] + --time-column Position of the time column in the csv, default will ignore time [default: -1] + --download Download default files + --debug Debug to print more info to the screen + -h, --help Print help + -V, --version Print version + + +First download the example file by cd'ing into the `raphtory-rust-benchmark` folder and running + + cargo run -- --download + +This will download the example file into tmp folder on your system, it will give you the file path. + +You can then run the benchmark by running, with the file path it has given you + + cargo run -- --file-path + +You can also provide your own file path, but please ensure you have set the correct arguments. +I.e Whether it has a header, what the delimiter is, and what columns are what. + +e.g. + + cargo run -- --file-path="/Users/1337/Documents/dev/Data/lotr.csv" --delimiter="," --from-column=0 --to-column=1 + +The results for a 1000 edge file are below + + Raphtory Quick Benchmark + Running setup... + Setup took 0.015264357 seconds + Graph has 864 vertices and 1000 edges + Degree: 0.001719875 seconds + Out neighbours: 0.000247832 seconds + Page rank: 0.012001127 seconds + Connected components: 0.025755603 seconds + + + +## Python Suite + +This benchmarks the python version of raphtory. +Please ensure your python environment has raphtory installed. 
+ Systems currently supported are: - [raphtory](https://github.com/Pometry/Raphtory) - [neo4j](https://neo4j.com/) @@ -29,7 +89,6 @@ More information available [here](https://snap.stanford.edu/data/soc-pokec.html) - pandas - raphtory - neo4j - - # How to run @@ -135,4 +194,4 @@ Some key notes: https://memgraph.com/docs/memgraph/import-data/load-csv-clause#one-type-of-nodes-and-relationships - Cozo - - Triggered a segmentation fault when running the connected components algorithm \ No newline at end of file + - Triggered a segmentation fault when running the connected components algorithm diff --git a/raphtory-io/Cargo.toml b/comparison-benchmark/rust/raphtory-rust-benchmark/Cargo.toml similarity index 50% rename from raphtory-io/Cargo.toml rename to comparison-benchmark/rust/raphtory-rust-benchmark/Cargo.toml index e9bbe9375a..83d0bff70a 100644 --- a/raphtory-io/Cargo.toml +++ b/comparison-benchmark/rust/raphtory-rust-benchmark/Cargo.toml @@ -1,6 +1,6 @@ [package] -name = "raphtory-io" -description = "raphtory-io, contains all connectors and example datasets for raphtory" +name = "raphtory-rust-benchmark" +description = "Raphtory Quick Rust Benchmark" edition.workspace = true rust-version.workspace = true version.workspace = true @@ -15,20 +15,11 @@ homepage.workspace = true # See more keys and their definitions at https://doc.rust-lang.org/cargo/reference/manifest.html [dependencies] -raphtory = { path = "../raphtory", version = "0.4.0" } -reqwest = { version = "0.11.14", features = ["blocking"] } -neo4rs = "0.6.0" -csv = "1.1.6" +raphtory = { path = "../../../raphtory", version = "0.5.7", package = "raphtory", features = ["io"] } +chrono = { version = "0.4", features = ["serde"] } serde = { version = "1", features = ["derive","rc"] } -serde_json = "1" -rayon = "1" -regex = "1" -chrono = "0.4" -itertools="0.10" - -zip = "0.5" -bzip2 = "0.4" -flate2 = "1.0" - -[dev-dependencies] -tokio = { version = "1.27.0", features = ["full"] } +clap = { version = "4.3.11", 
features = ["derive"] } +csv = "1.2.2" +tar = "0.4.38" +flate2 = "1.0.26" +ordered-float = "3.7.0" diff --git a/comparison-benchmark/rust/raphtory-rust-benchmark/src/main.rs b/comparison-benchmark/rust/raphtory-rust-benchmark/src/main.rs new file mode 100644 index 0000000000..7b8616eed8 --- /dev/null +++ b/comparison-benchmark/rust/raphtory-rust-benchmark/src/main.rs @@ -0,0 +1,212 @@ +use chrono::NaiveDateTime; +use clap::{ArgAction, Parser}; +use csv::StringRecord; +use flate2::read::GzDecoder; +use raphtory::{ + algorithms::{ + algorithm_result::AlgorithmResult, connected_components::weakly_connected_components, + pagerank::unweighted_page_rank, + }, + graph_loader::{fetch_file, source::csv_loader::CsvLoader}, + prelude::{AdditionOps, Graph, GraphViewOps, VertexViewOps, NO_PROPS}, +}; +use std::{ + fs::File, + io::{self, Read, Write}, + path::Path, + time::Instant, +}; + +#[derive(Parser, Debug)] +#[command(author, version, about, long_about = None )] +struct Args { + /// Set if the file has a header, default is False + #[arg(long, action=ArgAction::SetTrue)] + header: bool, + + /// Delimiter of the csv file + #[arg(long, default_value = "\t")] + delimiter: String, + + /// Path to a csv file + #[arg(long, default_value = "")] + file_path: String, + + /// Position of the from column in the csv + #[arg(long, default_value = "0")] + from_column: usize, + + /// Position of the to column in the csv + #[arg(long, default_value = "1")] + to_column: usize, + + /// Position of the time column in the csv, Expected time is in unix ms, default will ignore time and set it to 1 + #[arg(long, default_value = "-1")] + time_column: i32, + + /// Download default files + #[arg(long, action=ArgAction::SetTrue)] + download: bool, + + /// Debug to print more info to the screen + #[arg(long, action=ArgAction::SetTrue)] + debug: bool, +} + +fn main() { + println!( + " +██████╗ ███████╗███╗ ██╗ ██████╗██╗ ██╗███╗ ███╗ █████╗ ██████╗ ██╗ ██╗ +██╔══██╗██╔════╝████╗ ██║██╔════╝██║ ██║████╗ 
████║██╔══██╗██╔══██╗██║ ██╔╝ +██████╔╝█████╗ ██╔██╗ ██║██║ ███████║██╔████╔██║███████║██████╔╝█████╔╝ +██╔══██╗██╔══╝ ██║╚██╗██║██║ ██╔══██║██║╚██╔╝██║██╔══██║██╔══██╗██╔═██╗ +██████╔╝███████╗██║ ╚████║╚██████╗██║ ██║██║ ╚═╝ ██║██║ ██║██║ ██║██║ ██╗ +╚═════╝ ╚══════╝╚═╝ ╚═══╝ ╚═════╝╚═╝ ╚═╝╚═╝ ╚═╝╚═╝ ╚═╝╚═╝ ╚═╝╚═╝ ╚═╝ +" + ); + let args = Args::parse(); + // Set default values + let debug = args.debug; + if debug { + println!( + " + .___ .____ ____ . . ___ __ __ ___ .___ .____ + / ` / / \\ / / .' \\ | | .' `. / ` / + | | |__. |,_-< | | | |\\ /| | | | | |__. + | | | | ` | | | _ | \\/ | | | | | | + /---/ /----/ `----' `._.' `.___| / / `.__.' /---/ /----/ + " + ); + println!("Debug mode enabled.\nArguments: {:?}", args); + } + let header = args.header; + let delimiter = args.delimiter; + let file_path = args.file_path; + let from_column = args.from_column; + let to_column = args.to_column; + let time_column = args.time_column; + let download = args.download; + + if download { + let url = "https://osf.io/download/nbq6h/"; + println!("Downloading default file from url {}...", url); + // make err msg from url and custom string + let err_msg = format!("Failed to download file from {}", url); + let path = fetch_file("simple-relationships.csv.gz", true, url, 1200).expect(&err_msg); + println!("Downloaded file to {}", path.to_str().unwrap()); + println!("Unpacking file..."); + // extract a file from a gz archive + // Open the input .csv.gz file + let input_file = File::open(&path).expect("Failed to open downloaded file"); + let gz_decoder = GzDecoder::new(input_file); + let path_str = path.to_str().unwrap(); + let dst_file = if path_str.len() >= 3 { + let new_length = path_str.len() - 3; + path_str[..new_length].to_owned() + } else { + path_str.to_owned() + }; + let mut output_file = File::create(&dst_file) + .expect("Failed to create new file to decompress downloaded data"); + // Decompress and write the content to the output file + let mut buffer = vec![0; 4096]; + let 
mut gz_reader = io::BufReader::new(gz_decoder); + loop { + let bytes_read = gz_reader.read(&mut buffer).unwrap_or(0); + if bytes_read == 0 { + break; + } + output_file.write_all(&buffer[..bytes_read]).unwrap(); + } + + // exit program + println!("Downloaded+Unpacked file, please run again without --download flag and with --file-path={}", dst_file); + return; + } + + if file_path.is_empty() { + println!("You did not set a file path"); + return; + } + if !Path::new(&file_path).exists() { + println!("File path does not exist or is not a file {}", &file_path); + return; + } + + if debug { + println!("Reading file {}", &file_path); + } + + println!("Running setup..."); + let mut now = Instant::now(); + // Iterate over the CSV records + let g = { + let g = Graph::new(); + CsvLoader::new(file_path) + .set_header(header) + .set_delimiter(&delimiter) + .load_rec_into_graph(&g, |generic_loader: StringRecord, g: &Graph| { + let src_id = generic_loader + .get(from_column) + .map(|s| s.to_owned()) + .unwrap(); + let dst_id = generic_loader.get(to_column).map(|s| s.to_owned()).unwrap(); + let mut edge_time = NaiveDateTime::from_timestamp_opt(1, 0).unwrap(); + if time_column != -1 { + edge_time = NaiveDateTime::from_timestamp_millis( + generic_loader + .get(time_column as usize) + .unwrap() + .parse() + .unwrap(), + ) + .unwrap(); + } + if debug { + println!("Adding edge {} -> {} at time {}", src_id, dst_id, edge_time); + } + g.add_edge(edge_time, src_id, dst_id, NO_PROPS, None) + .expect("Failed to add edge"); + }) + .expect("Failed to load graph from CSV data files"); + g + }; + println!("Setup took {} seconds", now.elapsed().as_secs_f64()); + + if debug { + println!( + "Graph has {} vertices and {} edges", + g.count_vertices(), + g.count_edges() + ) + } + + // Degree of all nodes + now = Instant::now(); + let _degree = g.vertices().iter().map(|v| v.degree()).collect::>(); + println!("Degree: {} seconds", now.elapsed().as_secs_f64()); + + // Out neighbours of all nodes with 
time + now = Instant::now(); + let _out_neighbours = g + .vertices() + .iter() + .map(|v| v.out_neighbours()) + .collect::>(); + println!("Out neighbours: {} seconds", now.elapsed().as_secs_f64()); + + // page rank with time + now = Instant::now(); + let _page_rank: Vec<_> = unweighted_page_rank(&g, 1000, None, None, true) + .into_iter() + .collect(); + println!("Page rank: {} seconds", now.elapsed().as_secs_f64()); + + // connected components with time + now = Instant::now(); + let _cc: AlgorithmResult = weakly_connected_components(&g, usize::MAX, None); + println!( + "Connected components: {} seconds", + now.elapsed().as_secs_f64() + ); +} diff --git a/dev/bootstrap.sh b/dev/bootstrap.sh new file mode 100755 index 0000000000..afb7121944 --- /dev/null +++ b/dev/bootstrap.sh @@ -0,0 +1,23 @@ +#!/bin/bash + +DIR="$( cd "$( dirname "${BASH_SOURCE[0]}" )" && pwd )" + +cd "$DIR/.." + +log() { + echo "$(basename ${BASH_SOURCE[0]}): $@" +} + +install_hooks() { + git config core.hooksPath \ + || git config core.hooksPath ./dev/hooks +} + +install_rust_nightly() { + rustup toolchain install nightly +} + +log 'installing rust nightly...' +install_rust_nightly +log 'configuring hooks...' +install_hooks \ No newline at end of file diff --git a/dev/hooks/pre-commit b/dev/hooks/pre-commit new file mode 100755 index 0000000000..3731928a78 --- /dev/null +++ b/dev/hooks/pre-commit @@ -0,0 +1,18 @@ +#!/bin/bash + +# Run rustfmt on the whole repository using nightly toolchain +cargo +nightly fmt --all -- --check + +# Capture the exit code of the previous command +RESULT=$? + +# If the result is non-zero (i.e., there were formatting errors), abort the commit +if [ $RESULT -ne 0 ]; then + if [ -z "$(git ls-files --others --modified --exclude-standard)" ]; then + echo "There are formatting errors. Running cargo fmt. Please check the formatting changes and add them before committing." + cargo +nightly fmt --all + else + echo "There are formatting errors and un-staged files. 
Please run 'cargo +nightly fmt --all' to fix the formatting before committing." + fi + exit 1 +fi diff --git a/dev/readme.md b/dev/readme.md new file mode 100644 index 0000000000..93961ea3b0 --- /dev/null +++ b/dev/readme.md @@ -0,0 +1,40 @@ +# Quick start dev setup + +If you run `./dev/bootstrap.sh` it will setup the environment for you. + +In this case it will + +- Install a rust nightly +- setup your git hooks to point to the dev hooks in `./dev/hooks` + +You need to run this only once, you will have to `chmod +x ./dev/bootstrap.sh` first. + +## how to run + +From the raphtory root folder + + chmod +x ./dev/bootstrap.sh + ./dev/bootstrap.sh + +## dev hooks + +### pre-commit hook + +The pre-commit hook will run `cargo fmt` on all staged files. If the formatting fails, the commit will be aborted. + + + #!/bin/bash + + # Run rustfmt on the whole repository using nightly toolchain + cargo +nightly fmt --all -- --check + + # Capture the exit code of the previous command + RESULT=$? + + # If the result is non-zero (i.e., there were formatting errors), abort the commit + if [ $RESULT -ne 0 ]; then + echo "There are formatting errors. Please run 'cargo +nightly fmt' and fix them before committing." 
+ exit 1 + fi + + diff --git a/docs/requirements.txt b/docs/requirements.txt index 4335d9d446..3f33f163cb 100644 --- a/docs/requirements.txt +++ b/docs/requirements.txt @@ -3,56 +3,58 @@ alabaster==0.7.13 appnope==0.1.3 asttokens==2.2.1 attrs==23.1.0 +autodocsumm==0.2.11 Babel==2.12.1 backcall==0.2.0 beautifulsoup4==4.12.2 bleach==6.0.0 -certifi==2023.5.7 +certifi==2023.7.22 charset-normalizer==3.1.0 -contourpy==1.0.7 +contourpy==1.1.0 cycler==0.11.0 decorator==5.1.1 defusedxml==0.7.1 docutils==0.19 executing==1.2.0 fastjsonschema==2.17.1 -fonttools==4.39.4 +fonttools==4.40.0 idna==3.4 imagesize==1.4.1 -ipython==8.13.2 +ipython==8.14.0 jedi==0.18.2 Jinja2==3.1.2 jsonpickle==3.0.1 jsonschema==4.17.3 -jupyter_client==8.2.0 -jupyter_core==5.3.0 +jupyter_client==8.3.0 +jupyter_core==5.3.1 jupyterlab-pygments==0.2.2 kiwisolver==1.4.4 -MarkupSafe==2.1.2 +MarkupSafe==2.1.3 matplotlib==3.7.1 matplotlib-inline==0.1.6 -mistune==2.0.5 +maturin==1.1.0 +mistune==3.0.1 nbclient==0.8.0 -nbconvert==7.4.0 -nbformat==5.8.0 +nbconvert==7.6.0 +nbformat==5.9.0 nbsphinx==0.9.2 networkx==3.1 -numpy==1.24.3 +numpy==1.25.0 numpydoc==1.5.0 packaging==23.1 -pandas==2.0.2 +pandas==2.0.3 pandocfilters==1.5.0 parso==0.8.3 pexpect==4.8.0 pickleshare==0.7.5 -Pillow==9.5.0 -platformdirs==3.5.1 -prompt-toolkit==3.0.38 +Pillow==10.0.0 +platformdirs==3.8.0 +prompt-toolkit==3.0.39 ptyprocess==0.7.0 pure-eval==0.2.2 pydata-sphinx-theme==0.13.3 Pygments==2.15.1 -pyparsing==3.0.9 +pyparsing==3.1.0 pyrsistent==0.19.3 python-dateutil==2.8.2 pytz==2023.3 @@ -62,7 +64,7 @@ requests==2.31.0 six==1.16.0 snowballstemmer==2.2.0 soupsieve==2.4.1 -Sphinx==6.2.1 +sphinx==6.2.1 sphinx-copybutton==0.5.2 sphinx-toggleprompt==0.4.0 sphinx_design==0.4.1 @@ -74,10 +76,11 @@ sphinxcontrib-qthelp==1.0.3 sphinxcontrib-serializinghtml==1.1.5 stack-data==0.6.2 tinycss2==1.2.1 -tornado==6.3.2 +tomli==2.0.1 +tornado==6.3.3 traitlets==5.9.0 -typing_extensions==4.6.2 +typing_extensions==4.7.1 tzdata==2023.3 -urllib3==2.0.2 
+urllib3==2.0.3 wcwidth==0.2.6 webencodings==0.5.1 diff --git a/docs/source/_static/css/getting_started.css b/docs/source/_static/css/getting_started.css index 5537711779..c5397780b7 100644 --- a/docs/source/_static/css/getting_started.css +++ b/docs/source/_static/css/getting_started.css @@ -146,13 +146,13 @@ ul.task-bullet > li > p:first-child { } .comparison-card .sd-btn-secondary { - background-color: #6c757d !important; - border-color: #6c757d !important; + background-color: #AE0D22 !important; + border-color: #AE0D22 !important; } .comparison-card .sd-btn-secondary:hover { - background-color: #5a6268 !important; - border-color: #545b62 !important; + background-color: #AE0D22 !important; + border-color: #AE0D22 !important; } .comparison-card .card-footer { diff --git a/docs/source/_static/css/raphtory.css b/docs/source/_static/css/raphtory.css index f48a17e899..d60d948f58 100644 --- a/docs/source/_static/css/raphtory.css +++ b/docs/source/_static/css/raphtory.css @@ -38,13 +38,13 @@ table { } .intro-card .sd-btn-secondary { - background-color: #CC0808 !important; - border-color: #CC0808 !important; + background-color: #AE0D22 !important; + border-color: #AE0D22 !important; } .intro-card .sd-btn-secondary:hover { - background-color: #E0311D !important; - border-color: #E0311D !important; + background-color: #AE0D22 !important; + border-color: #AE0D22 !important; } .card, .card img { @@ -56,19 +56,19 @@ table { } h1, h2 { - color: #f04040; + color: #AE0D22; } html[data-theme="light"] { - --pst-color-primary: #f04040; + --pst-color-primary: #AE0D22; } html[data-theme="dark"] { - --pst-color-primary: #f04040; + --pst-color-primary: #AE0D22; } :root { - --pst-color-primary: #f04040; + --pst-color-primary: #AE0D22; --pst-color-link: #eb6060; - --pst-color-primary-light: #f04040; + --pst-color-primary-light: #AE0D22; } \ No newline at end of file diff --git a/docs/source/_static/logo.svg b/docs/source/_static/logo.svg new file mode 100644 index 0000000000..92ae28a812 
--- /dev/null +++ b/docs/source/_static/logo.svg @@ -0,0 +1,155 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/docs/source/_static/rust-crate.jpg b/docs/source/_static/rust-crate.jpg new file mode 100644 index 0000000000..693436767a Binary files /dev/null and b/docs/source/_static/rust-crate.jpg differ diff --git a/docs/source/api/index.rst b/docs/source/api/index.rst deleted file mode 100644 index 38936f4510..0000000000 --- a/docs/source/api/index.rst +++ /dev/null @@ -1,16 +0,0 @@ -{{ header }} - -.. _api: - -============= -API -============= - -.. toctree:: - :maxdepth: 2 - - - raphtory - rust - - diff --git a/docs/source/api/raphtory.rst b/docs/source/api/raphtory.rst deleted file mode 100644 index 311937c49a..0000000000 --- a/docs/source/api/raphtory.rst +++ /dev/null @@ -1,67 +0,0 @@ -.. _overview: - -{{ header }} - -**************** -Raphtory -**************** - -.. automodule:: raphtory - :members: - :undoc-members: - :show-inheritance: - :private-members: - :inherited-members: - -raphtory.algorithms -------------------- - -.. automodule:: raphtory.algorithms - :members: - :undoc-members: - :show-inheritance: - :private-members: - :inherited-members: - - -raphtory.vis -------------------- - -.. automodule:: raphtory.vis - :members: - :undoc-members: - :show-inheritance: - :private-members: - :inherited-members: - - -raphtory.nullmodels --------------------------- - -.. 
automodule:: raphtory.nullmodels - :members: - :undoc-members: - :show-inheritance: - :private-members: - :inherited-members: - - - - - - - - - - - - - - - - - - - - - diff --git a/docs/source/api/rust.rst b/docs/source/api/rust.rst deleted file mode 100644 index cd796635f2..0000000000 --- a/docs/source/api/rust.rst +++ /dev/null @@ -1,4 +0,0 @@ -Rust -================ - -Our rust module is hosted on docs.rs, and can be found `here `__. \ No newline at end of file diff --git a/docs/source/conf.py b/docs/source/conf.py index f47f661b71..aa51d6f068 100644 --- a/docs/source/conf.py +++ b/docs/source/conf.py @@ -1,13 +1,24 @@ +# do not add from __future__ import annotations as it will break the typehints parsing +# (I think this is a bug in autodoc and may be fixed at some point) + # Configuration file for the Sphinx documentation builder. # # For the full list of built-in configuration values, see the documentation: # https://www.sphinx-doc.org/en/master/usage/configuration.html + from sphinx.ext.autosummary import _import_by_name import os +import re import sys import warnings import raphtory +from sphinx.util.typing import stringify_annotation +from sphinx.util import inspect + +# for type annotations resolution (need to actually import everything that we want to use in a type hint in the docs) +from typing import * +from raphtory import * import jinja2 @@ -17,7 +28,11 @@ project = 'Raphtory' copyright = '2023, Pometry' author = 'Pometry' -release = '2020' +release = '2023' + + + + # -- General configuration --------------------------------------------------- # https://www.sphinx-doc.org/en/master/usage/configuration.html#general-configuration @@ -26,7 +41,6 @@ "IPython.sphinxext.ipython_directive", "IPython.sphinxext.ipython_console_highlighting", "matplotlib.sphinxext.plot_directive", - "numpydoc", "sphinx_copybutton", "sphinx_design", "sphinx_toggleprompt", @@ -41,6 +55,7 @@ "sphinx.ext.mathjax", "sphinx.ext.todo", "nbsphinx", + "autodocsumm", ] templates_path = 
['_templates'] @@ -55,30 +70,28 @@ :suppress: import raphtory - from raphtory import vis + from raphtory import export import os os.chdir(r'{os.path.dirname(os.path.dirname(__file__))}') """ - html_context = { "header": header, } - # -- Options for HTML output ------------------------------------------------- # https://www.sphinx-doc.org/en/master/usage/configuration.html#options-for-html-output html_theme = "pydata_sphinx_theme" - -html_logo = "_static/logo.svg" html_static_path = ['_static', 'images'] html_css_files = [ + "css/custom.css", "css/getting_started.css", "css/raphtory.css", ] +html_logo = "_static/logo.svg" html_use_modindex = True htmlhelp_basename = "raphtory" @@ -91,8 +104,14 @@ "issue": ("https://github.com/pometry/raphtory/issues/%s", "GH %s"), } +intersphinx_mapping = {'python': ('https://docs.python.org/3', None)} + autosummary_generate = True autosummary_imported_members = True +autodoc_typehints = "both" +autodoc_typehints_description_target = "documented" +autodoc_type_aliases = {} + # numpydoc def rstjinja(app, docname, source): @@ -107,6 +126,70 @@ def rstjinja(app, docname, source): rendered = app.builder.templates.render_string(src, app.config.html_context) source[0] = rendered + +def add_typehints(app, objtype: str, name: str, obj, + options: dict, args: str, retann: str) -> tuple[str | Any, str | Any] | tuple[str, None]: + """Record type hints to env object. + + This function does the same as the sphinx.ext.autodoc.typehints extension but for + signatures that are defined in the docstring. 
+ """ + if not hasattr(obj, "__annotations__"): + # If an object has annotations, typehints extension will handle it, otherwise, + # we need to look at the signature for the type hints + + # make sure we set the configuration option in the same way + if app.config.autodoc_typehints_format == 'short': + mode = 'smart' + else: + mode = 'fully-qualified' + + try: + if callable(obj): + # build a mock function from the signature to get the correct annotations + exec_parts = [f"def _annotations_moc"] + if args is not None: + exec_parts.append(args) + else: + exec_parts.append("()") + if retann: + exec_parts.append(f" -> {retann}") + exec_parts.append(":\n pass") + res = globals() + exec("".join(exec_parts), res) + + # extract type hints and store them in the appropriate temp data + # (this is the same as what the typehints extension does) + annotations = app.env.temp_data.setdefault('annotations', {}) + annotation = annotations.setdefault(name, {}) + sig = inspect.signature(res["_annotations_moc"], type_aliases=app.config.autodoc_type_aliases) + for param in sig.parameters.values(): + if param.annotation is not param.empty: + annotation[param.name] = stringify_annotation(param.annotation, mode) + if sig.return_annotation is not sig.empty: + retann = stringify_annotation(sig.return_annotation, mode) + annotation['return'] = retann + kwargs = {} + if app.config.autodoc_typehints in ('none', 'description'): + kwargs.setdefault('show_annotation', False) + if app.config.autodoc_typehints_format == "short": + kwargs.setdefault('unqualified_typehints', True) + + # we need to reparse the signature to get the correct formatting for links to work + # and to enable the 'description' option to strip the type hints from the signature + args = inspect.stringify_signature(sig, **kwargs) + if args: + matched = re.match(r'^(\(.*\))\s+->\s+(.*)$', args) + if matched: + args = matched.group(1) + retann = matched.group(2) + return args, retann + else: + return args, None + except 
(TypeError, ValueError): + pass + + def setup(app): app.connect("source-read", rstjinja) - + app.connect('autodoc-process-signature', add_typehints, priority=0) diff --git a/docs/source/development/community.rst b/docs/source/development/community.rst deleted file mode 100644 index 061094b4a6..0000000000 --- a/docs/source/development/community.rst +++ /dev/null @@ -1,17 +0,0 @@ -.. _develop.community: - -********** -Community -********** - -.. _community.version: - - -Join the growing community of open-source enthusiasts using Raphtory to power their graph analysis projects! - -- Follow `Twitter`_ for the latest Raphtory news and development - -- Join our `Slack`_ to chat with us and get answers to your questions! - -.. _Twitter: https://twitter.com/raphtory -.. _Slack: https://join.slack.com/t/raphtory/shared_invite/zt-xbebws9j-VgPIFRleJFJBwmpf81tvxA diff --git a/docs/source/development/contributing.rst b/docs/source/development/contributing.rst deleted file mode 100644 index 88aad4ddc6..0000000000 --- a/docs/source/development/contributing.rst +++ /dev/null @@ -1,78 +0,0 @@ -{{ header }} - -.. _contributing: - -============= -Contributing -============= - -We're happy that you're considering contributing! - -To help you get started we've prepared the following guidelines. - -How Do I Contribute? 
-~~~~~~~~~~~~~~~~~~~~ - -There are many ways to contribute: - -- Report a bug -- Request a feature/enhancement -- Fix bugs -- Work on requested/approved features -- Refactor codebase -- Write tests -- Fix documentation - -Project Layout -~~~~~~~~~~~~~~~ - -- `raphtory`: Raphtory Core written in rust -- `py-raphtory`: Raphtory python library (written in rust, converted to python with PyO3) -- `python`: Raphtory python helper scripts -- `benchmark`: Benchmarking scripts used to compare Raphtory to other platforms -- `raphtory-benchmark`: Benchmarking scripts run in the CI/CD pipeline -- `raphtory-graphql`: GraphQL server for raphtory -- `raphtory-io`: IO module for raphtory -- `js-raphtory`: Raphtory javascript library - - -- `docs`: Documentation (built and hosted using sphinx and readthedocs) -- `examples`: Example raphtory projects in both python and rust -- `resource`: Sample CSV files - - -Documentation -============== - -Raphtory documentations can be found in `docs` directory. -They are built using `Sphinx `__ and hosted by readthedocs. - -After making your changes, you're good to build them. - -- Ensure that all development dependencies are already installed. - ```bash - $ cd docs && pip install -q -r requirements.txt - ``` - -- Build docs - ```bash - $ cd docs && make html - ``` - -- View docs - ```bash - $ open build/html/index.html - ``` - -Community Guidelines -===================== - -This project follows `Google's Open Source Community Guidelines `__. - - -License -======== - -Raphtory it licensed under `GNU General Public License v3.0`. - -This docs page is licensed under `BSD 3-Clause License`. \ No newline at end of file diff --git a/docs/source/development/index.rst b/docs/source/development/index.rst deleted file mode 100644 index f331ba21b5..0000000000 --- a/docs/source/development/index.rst +++ /dev/null @@ -1,18 +0,0 @@ -{{ header }} - -.. _development: - -=========== -Development -=========== - - -.. 
toctree:: - :maxdepth: 2 - - contributing - policies - roadmap - community - - diff --git a/docs/source/development/policies.rst b/docs/source/development/policies.rst deleted file mode 100644 index a7a59eea76..0000000000 --- a/docs/source/development/policies.rst +++ /dev/null @@ -1,47 +0,0 @@ -.. _develop.policies: - -******** -Policies -******** - -.. _policies.version: - -Raphtory uses a loose variant of semantic versioning (`SemVer`_) to govern -deprecations, API compatibility, and version numbering. - -A raphtory release number is made up of ``MAJOR.MINOR.PATCH``. - -API breaking changes should only occur in **major** releases. These changes -will be documented, with clear guidance on what is changing, why it's changing, -and how to migrate existing code to the new behavior. - -Whenever possible, a deprecation path will be provided rather than an outright -breaking change. - -raphtory will introduce deprecations in **minor** releases. These deprecations -will preserve the existing behavior while emitting a warning that provide -guidance on: - -* How to achieve similar behavior if an alternative is available -* The raphtory version in which the deprecation will be enforced. - -We will not introduce new deprecations in patch releases. - -Deprecations will only be enforced in **major** releases. For example, if a -behavior is deprecated in raphtory 1.2.0, it will continue to work, with a -warning, for all releases in the 1.x series. The behavior will change and the -deprecation removed in the next major release (2.0.0). - -.. note:: - - raphtory will sometimes make *behavior changing* bug fixes, as part of - minor or patch releases. Whether or not a change is a bug fix or an - API-breaking change is a judgement call. We'll do our best, and we - invite you to participate in development discussion on the issue - tracker or mailing list. - -These policies do not apply to features marked as **experimental** in the documentation. 
-Raphtory may change the behavior of experimental features at any time. - - -.. _SemVer: https://semver.org diff --git a/docs/source/development/roadmap.rst b/docs/source/development/roadmap.rst deleted file mode 100644 index c2c9aca6cc..0000000000 --- a/docs/source/development/roadmap.rst +++ /dev/null @@ -1,19 +0,0 @@ -.. _develop.roadmap: - -******** -Roadmap -******** - -.. _roadmap.version: - - -As an open-source project, our project roadmap is public and open to -suggestions. We welcome your feedback and contributions to the project. - -We work in 2-week sprints, and our roadmap is organized by sprint on Github. -View the current sprint and the next sprint on our `Github project`_ - -Each sprint is organized by issues, which are organized by priority in our fortnightly sprint planning meetings. -These are assigned to team members, and tracked on the Github project board, completed upon merging a pull request. - -.. _Github project: https://github.com/orgs/Pometry/projects/1/ \ No newline at end of file diff --git a/docs/source/getting_started/images/lotr-graphic.png b/docs/source/getting_started/images/lotr-graphic.png deleted file mode 100644 index 3386b8325f..0000000000 Binary files a/docs/source/getting_started/images/lotr-graphic.png and /dev/null differ diff --git a/docs/source/getting_started/index.rst b/docs/source/getting_started/index.rst deleted file mode 100644 index efdbf03301..0000000000 --- a/docs/source/getting_started/index.rst +++ /dev/null @@ -1,158 +0,0 @@ -{{ header }} - -.. _getting_started: - -=============== -Getting started -=============== - - -Installation (python) ----------------------- - -.. grid:: 1 2 2 2 - :gutter: 2 - - .. grid-item-card:: Install via pip? - :class-card: install-card - :columns: 12 12 6 6 - :padding: 3 - - Raphtory can be installed via pip from `PyPI `__. - - ++++ - - .. code-block:: bash - - pip install raphtory - - .. grid-item-card:: Prefer rust? 
- :class-card: install-card - :columns: 12 12 6 6 - :padding: 3 - - Install into you rust project via crates from `Crates `__. - - ++++ - - .. code-block:: bash - - cargo add raphtory - - -Building / Source ------------------ - -.. grid:: 1 2 2 2 - :gutter: 2 - - .. grid-item-card:: Python from source? - :class-card: install-card - :columns: 12 - :padding: 3 - - Building a specific version? Installing from source? Developing? - Check the python advanced installation pages. - - +++ - - .. button-ref:: install-python - :ref-type: ref - :click-parent: - :color: secondary - :expand: - - Advanced python installation - - .. grid-item-card:: Rust from source? - :class-card: install-card - :columns: 12 - :padding: 3 - - Developing a new functionality? You prefer rust over python? - - +++ - - .. button-ref:: install-rust - :ref-type: ref - :click-parent: - :color: secondary - :expand: - - Advanced rust installation - - -.. _gentle_intro: - -Intro to Raphtory ------------------- - -.. raw:: html - -
-
- -
- -
-
- -Blah Blah Blah Blah. - -.. raw:: html - -
-
-
- -
- -
-
- -Nlah Nlah Nlah Nlah. - -.. raw:: html - -
-
-
-
-
- -
-
- -Tutorials ---------- - -.. If you update this toctree, also update the manual toctree in the - main index.rst.template - -.. toctree:: - :maxdepth: 2 - :hidden: - - overview - installation/index - intro_tutorials/index diff --git a/docs/source/getting_started/installation/index.rst b/docs/source/getting_started/installation/index.rst deleted file mode 100644 index 820b9aa4eb..0000000000 --- a/docs/source/getting_started/installation/index.rst +++ /dev/null @@ -1,9 +0,0 @@ -========================= -Installation -========================= - -.. toctree:: - :maxdepth: 1 - - install_python - install_rust diff --git a/docs/source/getting_started/installation/install_python.rst b/docs/source/getting_started/installation/install_python.rst deleted file mode 100644 index ec9a8f1cb8..0000000000 --- a/docs/source/getting_started/installation/install_python.rst +++ /dev/null @@ -1,98 +0,0 @@ -.. _install-python: - -{{ header }} - -===================== -Python -===================== - -The easiest way to install raphtory is to install it -via pip, `pip install raphtory`. -This is the recommended installation method for most users. - -.. _install.version: - -Python version support ----------------------- - -Officially Python 3.10. - -Installing raphtory -------------------- - -Installing from PyPI -~~~~~~~~~~~~~~~~~~~~ - -Raphtory can be installed via pip from -`PyPI `__. - -.. note:: - You must have ``pip>=23`` to install from PyPI. - -:: - - pip install raphtory - - -Installing from source -~~~~~~~~~~~~~~~~~~~~~~ - -Installing from source is the quickest way to: - -* Try a new feature that will be shipped in the next release (that is, a feature from a pull-request that was recently merged to the main branch). -* Check whether a bug you encountered has been fixed since the last release. 
- -Note that first uninstalling raphtory might be required to be able to install from source, as version numbers may not be up to date:: - - pip uninstall raphtory -y - -Requirements ------------- - -To install raphtory from source, you need the following: - -* `git `__ to clone the repository. -* `rust `__ to build the rust modules. -* `python `__ to run the setup script. -* `pip `__ to install the python package. -* `virtualenv` to create a virtual environment for the python package or `conda` -* `maturin `__ to build the python package. -* `requirements` listed in the requirements.txt file. - -Installing directly from github source --------------------------------------- - -The following will pull the raphtory repository from git and install the python package from source. - - pip install -e 'git+https://github.com/Pometry/Raphtory.git#egg=raphtory&subdirectory=python' - - -Installing directly from source -------------------------------- - -If you are developing raphtory and want to build & install the python package locally, you can do so with the following command: - - make build-all - or - cd python && maturin develop - - -Running the test suite ----------------------- - -Raphtory is equipped with an exhaustive set of unit tests. -To run it on your machine to verify that everything is working -(and that you have all of the dependencies installed), make sure you have `pytest -`__ >= 7.0 - -Test dependencies: - - python -m pip install -q pytest networkx numpy seaborn pandas nbmake pytest-xdist matplotlib - -To run `raphtory` python tests: - - cd python && pytest - -To run notebook tests: - - cd python/tests && pytest --nbmake --nbmake-timeout=1200 . diff --git a/docs/source/getting_started/installation/install_rust.rst b/docs/source/getting_started/installation/install_rust.rst deleted file mode 100644 index 088904be9d..0000000000 --- a/docs/source/getting_started/installation/install_rust.rst +++ /dev/null @@ -1,99 +0,0 @@ -.. 
_install-rust: - -{{ header }} - -=================== -Rust -=================== - -The easiest way to install raphtory is to install it -via cargo, `cargo add raphtory`. -This is the recommended installation method for most users. - -.. _install.version-rust: - -Rust version support ----------------------- - -Officially Rust 1.67.1 - -Installing raphtory -------------------- - -Installing from Cargo -~~~~~~~~~~~~~~~~~~~~~ - -Raphtory can be installed via pip from -`Cargo `__. - -.. note:: - You must have ``rust>=1.67.1`` to install from cargo. - -:: - - cargo add raphtory - - -Installing from source -~~~~~~~~~~~~~~~~~~~~~~ - -Installing from source is the quickest way to: - -* Try a new feature that will be shipped in the next release (that is, a feature from a pull-request that was recently merged to the main branch). -* Check whether a bug you encountered has been fixed since the last release. - -Note that first uninstalling raphtory might be required to be able to install from source, as version numbers may not be up to date:: - - cargo remove raphtory - -Requirements ------------- - -To install raphtory from source, you need the following: - -* `git `__ to clone the repository. -* `rust `__ to build the rust modules. -* `make `__ to run the build script. - -Installing directly from source -------------------------------- - -Building the rust core is done using cargo. The following command will build the core. - - make rust-build - -or - - cargo build - -Import the raphtory package into a rust project ------------------------------------------------ - -To use the raphtory core in a rust project, add the following to your Cargo.toml file: -Note: The path should be the path to the raphtory directory - - - - [dependencies] - - raphtory = {path = "../raphtory", version = "0.3.0" } - - -or - - - [dependencies] - - raphtory = "0.3.0" - - -Running the test suite ----------------------- - -Raphtory is equipped with an exhaustive set of unit tests. 
-To run it on your machine to verify that everything is working -(and that you have all of the dependencies installed) - -To run `raphtory` rust tests: - - cargo test \ No newline at end of file diff --git a/docs/source/getting_started/intro_tutorials/01_quickstart.rst b/docs/source/getting_started/intro_tutorials/01_quickstart.rst deleted file mode 100644 index 33d3e98370..0000000000 --- a/docs/source/getting_started/intro_tutorials/01_quickstart.rst +++ /dev/null @@ -1,143 +0,0 @@ -.. _gettingstarted_quickstart: - -{{ header }} - -How do I create a graph, add nodes/edges, add properties, run algorithms? -========================================================================== - -.. raw:: html - -
    -
  • - -I want to create a graph - -.. ipython:: python - - import raphtory - g = raphtory.Graph() - -To load the raphtory package and start working with it, import the -package. We recommend to import the package under the alias ``raphtory``. - - -.. raw:: html - -
  • -
- -How do I add nodes and edges? -===================================== - -.. raw:: html - -
    -
  • - -I want to add two nodes and an edge into the graph. - -.. ipython:: python - - g.add_vertex(0, "Ben") - g.add_vertex(1, "Hamza") - g.add_edge(2, "Ben", "Hamza") - - -Here we have added a node called "Ben" a time 0, and a node called "Hamza" at time 1. -Next we added an edge between "Ben" and "Hamza" at time 2. - -.. raw:: html - -
  • -
- -.. note:: - These don't have any properties, but we will add them below! - - - -How do I add nodes and edges with properties? -============================================== - -.. raw:: html - -
    -
  • - -I want to add properties with my nodes and edges. - -.. ipython:: python - - g.add_vertex(3, "Rachel", {"class": "student", "age": 20}) - g.add_vertex(4, "Shivam", {"class": "student", "age": 21}) - g.add_edge(5, "Rachel", "Shivam", {"class": "friendship"}) - - -Here we have added a node called "Rachel" a time 3, with the properies class and age. -Similarly, we have doen the same for a node called "Shivam" at time 4. -Next we added an edge between "Rachel" and "Shivam" at time 5 with the property name "class" and the value "friendship". - -.. raw:: html - -
  • -
- - - -How do I run an algorithm? -===================================== - -.. raw:: html - -
    -
  • - -I'd like to run a Max Out Degree algorithm. - -.. ipython:: python - - from raphtory import algorithms - print("Graph - Max out degree: %i" % algorithms.max_out_degree(g)) - -Here we have imported the algorithms package, and then run the max out degree algorithm on the graph. - - -.. raw:: html - -
  • -
- - - -How do I view / visualise my graph? -===================================== - -.. raw:: html - -
    -
  • - -I'd like to view my graph. - -.. ipython:: python - - from raphtory import vis - vis.to_networkx(g) - -or you can show it with pyvis vis - - -.. ipython:: python - - from raphtory import vis - v = vis.to_pyvis(g) - v.show('graph.html') - -Here we have imported the vis package, and then converted the graph to a networkx / pyvis graph. -We can then view the graph in a notebook, or save it to a file. - -.. raw:: html - -
  • -
- diff --git a/docs/source/getting_started/intro_tutorials/index.rst b/docs/source/getting_started/intro_tutorials/index.rst deleted file mode 100644 index 2420671f35..0000000000 --- a/docs/source/getting_started/intro_tutorials/index.rst +++ /dev/null @@ -1,14 +0,0 @@ -{{ header }} - -.. _gettingstarted: - -========================= -Getting started tutorials -========================= - -.. toctree:: - :maxdepth: 1 - - 01_quickstart - lotr.ipynb - diff --git a/docs/source/getting_started/intro_tutorials/lotr.csv b/docs/source/getting_started/intro_tutorials/lotr.csv deleted file mode 100644 index 7515aed3e2..0000000000 --- a/docs/source/getting_started/intro_tutorials/lotr.csv +++ /dev/null @@ -1,2650 +0,0 @@ -SRC,DST,TIME -Gandalf,Elrond,33 -Frodo,Bilbo,114 -Blanco,Marcho,146 -Frodo,Bilbo,205 -Thorin,Gandalf,270 -Thorin,Bilbo,270 -Gandalf,Bilbo,270 -Gollum,Bilbo,286 -Gollum,Bilbo,306 -Gollum,Bilbo,308 -Bilbo,Elrond,317 -Frodo,Samwise,319 -Gandalf,Bilbo,320 -Gollum,Bilbo,324 -Frodo,Gandalf,329 -Peregrin,Elessar,356 -Arwen,Aragorn,358 -Barahir,Faramir,359 -Bilbo,Findegil,360 -Meriadoc,Peregrin,363 -Peregrin,Elendil,368 -Galadriel,Celeborn,374 -Frodo,Bilbo,387 -Frodo,Bilbo,388 -Frodo,Bilbo,389 -Frodo,Bilbo,390 -Frodo,Bilbo,393 -Frodo,Bilbo,399 -Hamfast,Bilbo,402 -Gandalf,Bilbo,483 -Gandalf,Bilbo,543 -Frodo,Gandalf,555 -Frodo,Bilbo,555 -Gandalf,Bilbo,555 -Frodo,Bilbo,562 -Gandalf,Bilbo,730 -Frodo,Bilbo,808 -Frodo,Bilbo,815 -Gandalf,Bilbo,843 -Frodo,Gandalf,861 -Frodo,Bilbo,898 -Frodo,Merry,929 -Frodo,Merry,930 -Frodo,Bilbo,942 -Frodo,Bilbo,944 -Odo,Frodo,959 -Frodo,Bilbo,1038 -Meriadoc,Peregrin,1042 -Meriadoc,Merry,1042 -Meriadoc,Pippin,1042 -Meriadoc,Fredegar,1042 -Peregrin,Merry,1042 -Peregrin,Pippin,1042 -Peregrin,Fredegar,1042 -Merry,Pippin,1042 -Merry,Fredegar,1042 -Pippin,Fredegar,1042 -Pippin,Merry,1044 -Pippin,Bilbo,1044 -Merry,Bilbo,1044 -Frodo,Gandalf,1056 -Sam,Halfast,1089 -Frodo,Bilbo,1106 -Frodo,Gandalf,1130 -Gandalf,Bilbo,1135 -Gandalf,Bilbo,1156 
-Frodo,Gandalf,1160 -Frodo,Saruman,1185 -Gandalf,Bilbo,1229 -Frodo,Gandalf,1234 -Frodo,Gandalf,1241 -Isildur,Elendil,1309 -Isildur,Gil-galad,1309 -Isildur,Sauron,1309 -Elendil,Gil-galad,1309 -Elendil,Sauron,1309 -Gil-galad,Sauron,1309 -Sméagol,Déagol,1324 -Sméagol,Déagol,1330 -Sméagol,Déagol,1331 -Sméagol,Déagol,1336 -Frodo,Gollum,1356 -Frodo,Gollum,1359 -Frodo,Gandalf,1390 -Frodo,Gollum,1400 -Frodo,Bilbo,1401 -Isildur,Gollum,1407 -Isildur,Déagol,1407 -Gollum,Déagol,1407 -Frodo,Gandalf,1417 -Isildur,Elendil,1420 -Frodo,Gollum,1429 -Gollum,Déagol,1441 -Gollum,Bilbo,1459 -Gandalf,Bilbo,1469 -Frodo,Bilbo,1484 -Frodo,Gollum,1484 -Bilbo,Gollum,1484 -Frodo,Bilbo,1567 -Frodo,Gollum,1567 -Bilbo,Gollum,1567 -Gandalf,Bilbo,1654 -Frodo,Gandalf,1656 -Sam,Gandalf,1677 -Sam,Frodo,1687 -Sam,Frodo,1705 -Sam,Gandalf,1710 -Sam,Gandalf,1711 -Sam,Frodo,1714 -Gandalf,Bilbo,1721 -Frodo,Gandalf,1741 -Gandalf,Bilbo,1748 -Sam,Elrond,1756 -Frodo,Gandalf,1783 -Frodo,Gandalf,1785 -Pippin,Frodo,1789 -Pippin,Merry,1789 -Pippin,Fredegar,1789 -Frodo,Merry,1789 -Frodo,Fredegar,1789 -Merry,Fredegar,1789 -Frodo,Gandalf,1792 -Frodo,Bilbo,1802 -Frodo,Gandalf,1804 -Merry,Fredegar,1806 -Frodo,Gandalf,1809 -Lobelia,Frodo,1816 -Lobelia,Lotho,1816 -Frodo,Lotho,1816 -Pippin,Sam,1825 -Lobelia,Sam,1826 -Lobelia,Frodo,1826 -Sam,Frodo,1826 -Pippin,Sam,1829 -Sam,Frodo,1869 -Sam,Frodo,1871 -Peregrin,Bilbo,1879 -Pippin,Sam,1888 -Pippin,Frodo,1951 -Pippin,Sam,1955 -Pippin,Bilbo,1981 -Frodo,Gandalf,1999 -Pippin,Frodo,2024 -Pippin,Sam,2024 -Frodo,Sam,2024 -Frodo,Gandalf,2056 -Frodo,Bilbo,2083 -Pippin,Frodo,2110 -Pippin,Sam,2110 -Frodo,Sam,2110 -Frodo,Bilbo,2175 -Sam,Frodo,2204 -Pippin,Frodo,2242 -Frodo,Bilbo,2246 -Frodo,Bilbo,2250 -Sam,Frodo,2254 -Sam,Gandalf,2254 -Frodo,Gandalf,2254 -Sam,Frodo,2318 -Sam,Frodo,2358 -Sam,Frodo,2393 -Pippin,Sam,2446 -Pippin,Frodo,2488 -Maggot,Pippin,2490 -Pippin,Frodo,2511 -Pippin,Sam,2511 -Frodo,Sam,2511 -Pippin,Sam,2513 -Maggot,Pippin,2519 -Pippin,Peregrin,2521 -Sam,Frodo,2541 
-Maggot,Frodo,2607 -Frodo,Bilbo,2613 -Frodo,Peregrin,2628 -Pippin,Frodo,2633 -Pippin,Sam,2633 -Frodo,Sam,2633 -Pippin,Sam,2659 -Sam,Frodo,2668 -Frodo,Merry,2694 -Pippin,Frodo,2742 -Pippin,Merry,2742 -Pippin,Sam,2742 -Frodo,Merry,2742 -Frodo,Sam,2742 -Merry,Sam,2742 -Maggot,Frodo,2756 -Meriadoc,Frodo,2786 -Pippin,Bilbo,2794 -Maggot,Frodo,2821 -Pippin,Frodo,2829 -Maggot,Merry,2834 -Pippin,Frodo,2835 -Maggot,Frodo,2837 -Maggot,Bilbo,2837 -Frodo,Bilbo,2837 -Maggot,Merry,2838 -Pippin,Merry,2845 -Frodo,Merry,2850 -Pippin,Frodo,2857 -Sam,Frodo,2882 -Sam,Merry,2919 -Sam,Frodo,2922 -Frodo,Gandalf,2925 -Sam,Frodo,2938 -Pippin,Merry,2949 -Gandalf,Merry,2972 -Frodo,Gandalf,2999 -Gandalf,Fredegar,3060 -Pippin,Merry,3239 -Sam,Frodo,3265 -Pippin,Frodo,3271 -Pippin,Sam,3271 -Frodo,Sam,3271 -Sam,Frodo,3278 -Pippin,Sam,3282 -Pippin,Merry,3291 -Sam,Frodo,3316 -Sam,Frodo,3337 -Sam,Frodo,3345 -Sam,Merry,3356 -Frodo,Goldberry,3461 -Tom,Goldberry,3482 -Tom,Goldberry,3499 -Tom,Goldberry,3514 -Tom,Frodo,3526 -Pippin,Merry,3544 -Tom,Goldberry,3616 -Tom,Goldberry,3686 -Tom,Frodo,3702 -Tom,Frodo,3703 -Tom,Gandalf,3703 -Tom,Bilbo,3703 -Frodo,Gandalf,3703 -Frodo,Bilbo,3703 -Gandalf,Bilbo,3703 -Tom,Frodo,3705 -Tom,Frodo,3714 -Tom,Gandalf,3718 -Frodo,Merry,3721 -Tom,Frodo,3733 -Pippin,Sam,3837 -Pippin,Merry,3837 -Sam,Merry,3837 -Frodo,Gandalf,3914 -Frodo,Bilbo,3914 -Gandalf,Bilbo,3914 -Pippin,Sam,3919 -Pippin,Merry,3919 -Sam,Merry,3919 -Pippin,Sam,3938 -Pippin,Merry,3938 -Sam,Merry,3938 -Frodo,Merry,3946 -Tom,Frodo,3960 -Pippin,Sam,3976 -Pippin,Merry,3976 -Sam,Merry,3976 -Tom,Frodo,3988 -Tom,Merry,4037 -Pippin,Sam,4046 -Pippin,Merry,4046 -Sam,Merry,4046 -Tom,Goldberry,4060 -Butterbur,Barliman,4126 -Tom,Goldberry,4131 -Butterbur,Barliman,4261 -Sam,Frodo,4269 -Nob,Butterbur,4332 -Pippin,Frodo,4342 -Pippin,Sam,4342 -Frodo,Sam,4342 -Butterbur,Barliman,4353 -Pippin,Sam,4380 -Frodo,Butterbur,4389 -Frodo,Bilbo,4418 -Butterbur,Bilbo,4421 -Pippin,Sam,4482 -Pippin,Frodo,4565 -Pippin,Sam,4565 
-Frodo,Sam,4565 -Sam,Frodo,4620 -Pippin,Frodo,4629 -Pippin,Sam,4629 -Frodo,Sam,4629 -Sam,Frodo,4692 -Sam,Frodo,4697 -Nob,Butterbur,4714 -Pippin,Sam,4734 -Pippin,Butterbur,4736 -Frodo,Butterbur,4749 -Pippin,Frodo,4902 -Pippin,Sam,4902 -Frodo,Sam,4902 -Frodo,Gandalf,4910 -Pippin,Gandalf,4926 -Pippin,Sam,4930 -Nob,Merry,5012 -Frodo,Merry,5089 -Nob,Merry,5090 -Nob,Gandalf,5090 -Merry,Gandalf,5090 -Bob,Bill,5228 -Bob,Bill,5229 -Butterbur,Merry,5242 -Tom,Butterbur,5249 -Nob,Butterbur,5268 -Nob,Bob,5268 -Butterbur,Bob,5268 -Pippin,Frodo,5274 -Pippin,Merry,5274 -Pippin,Sam,5274 -Frodo,Merry,5274 -Frodo,Sam,5274 -Merry,Sam,5274 -Nob,Bob,5276 -Pippin,Frodo,5410 -Elendil,Gil-galad,5434 -Pippin,Sam,5468 -Frodo,Merry,5470 -Merry,Gandalf,5500 -Frodo,Merry,5534 -Sam,Peregrin,5538 -Pippin,Gandalf,5544 -Merry,Gil-galad,5615 -Pippin,Frodo,5619 -Pippin,Merry,5619 -Frodo,Merry,5619 -Frodo,Gandalf,5620 -Lúthien,Beren,5653 -Lúthien,Barahir,5653 -Beren,Barahir,5653 -Beren,Lúthien,5654 -Beren,Thingol,5654 -Lúthien,Thingol,5654 -Beren,Barahir,5657 -Beren,Thingol,5657 -Barahir,Thingol,5657 -Beren,Lúthien,5660 -Beren,Sauron,5660 -Beren,Thingol,5660 -Lúthien,Sauron,5660 -Lúthien,Thingol,5660 -Sauron,Thingol,5660 -Beren,Thingol,5667 -Beren,Elwing,5667 -Beren,Eärendil,5667 -Beren,Lúthien,5667 -Beren,Dior,5667 -Thingol,Elwing,5667 -Thingol,Eärendil,5667 -Thingol,Lúthien,5667 -Thingol,Dior,5667 -Elwing,Eärendil,5667 -Elwing,Lúthien,5667 -Elwing,Dior,5667 -Eärendil,Lúthien,5667 -Eärendil,Dior,5667 -Lúthien,Dior,5667 -Sam,Merry,5682 -Pippin,Frodo,5683 -Pippin,Merry,5713 -Sam,Frodo,5714 -Sam,Frodo,5752 -Pippin,Merry,5758 -Frodo,Gandalf,5775 -Sam,Merry,5999 -Pippin,Merry,6010 -Sam,Frodo,6011 -Pippin,Merry,6012 -Sam,Frodo,6020 -Frodo,Bilbo,6037 -Frodo,Bilbo,6044 -Gandalf,Bilbo,6118 -Frodo,Bilbo,6126 -Frodo,Bilbo,6127 -Glorfindel,Elrond,6161 -Glorfindel,Frodo,6195 -Elrond,Aragorn,6200 -Glorfindel,Frodo,6220 -Pippin,Sam,6225 -Pippin,Merry,6225 -Sam,Merry,6225 -Glorfindel,Frodo,6267 -Frodo,Lúthien,6325 
-Frodo,Gandalf,6381 -Butterbur,Bill,6429 -Gandalf,Barliman,6431 -Frodo,Gandalf,6531 -Glorfindel,Aragorn,6549 -Frodo,Gandalf,6578 -Glorfindel,Elrond,6583 -Sam,Frodo,6628 -Glorfindel,Gandalf,6660 -Glorfindel,Elrond,6660 -Gandalf,Elrond,6660 -Glorfindel,Frodo,6661 -Glorfindel,Gandalf,6661 -Glorfindel,Elrond,6661 -Frodo,Gandalf,6661 -Frodo,Elrond,6661 -Gandalf,Elrond,6661 -Frodo,Elrond,6669 -Arwen,Frodo,6673 -Arwen,Lúthien,6673 -Arwen,Elrond,6673 -Frodo,Lúthien,6673 -Frodo,Elrond,6673 -Lúthien,Elrond,6673 -Frodo,Elrond,6676 -Pippin,Frodo,6682 -Pippin,Merry,6682 -Frodo,Merry,6682 -Thorin,Glóin,6693 -Gandalf,Elrond,6701 -Frodo,Glóin,6709 -Frodo,Beorn,6710 -Frodo,Grimbeorn,6710 -Beorn,Grimbeorn,6710 -Bard,Bain,6717 -Bard,Brand,6717 -Bain,Brand,6717 -Dwalin,Bombur,6728 -Dwalin,Glóin,6728 -Dwalin,Bofur,6728 -Bombur,Glóin,6728 -Bombur,Bofur,6728 -Glóin,Bofur,6728 -Ori,Balin,6730 -Ori,Óin,6730 -Balin,Óin,6730 -Frodo,Glóin,6736 -Smaug,Bilbo,6747 -Frodo,Glóin,6748 -Arwen,Elrond,6754 -Frodo,Gandalf,6757 -Sam,Frodo,6810 -Sam,Bilbo,6810 -Frodo,Bilbo,6810 -Gandalf,Elrond,6833 -Gandalf,Bilbo,6835 -Frodo,Bilbo,6855 -Frodo,Bilbo,6935 -Eärendil,Elrond,6969 -Frodo,Bilbo,6987 -Frodo,Aragorn,6994 -Arwen,Frodo,6995 -Sam,Bilbo,7006 -Sam,Bilbo,7009 -Frodo,Elrond,7018 -Gandalf,Bilbo,7024 -Gandalf,Elrond,7037 -Sam,Frodo,7040 -Sam,Bilbo,7040 -Frodo,Bilbo,7040 -Frodo,Gandalf,7041 -Glorfindel,Glóin,7047 -Glorfindel,Frodo,7047 -Glóin,Frodo,7047 -Frodo,Elrond,7048 -Gimli,Glóin,7051 -Elrond,Glorfindel,7052 -Elrond,Galdor,7052 -Elrond,Erestor,7052 -Elrond,Círdan,7052 -Glorfindel,Galdor,7052 -Glorfindel,Erestor,7052 -Glorfindel,Círdan,7052 -Galdor,Erestor,7052 -Galdor,Círdan,7052 -Erestor,Círdan,7052 -Legolas,Thranduil,7053 -Frodo,Bilbo,7058 -Gandalf,Elrond,7059 -Gandalf,Boromir,7059 -Elrond,Boromir,7059 -Frodo,Glóin,7064 -Balin,Óin,7077 -Balin,Ori,7077 -Óin,Ori,7077 -Elrond,Sauron,7127 -Elrond,Sauron,7128 -Isildur,Elendil,7134 -Isildur,Anárion,7134 -Elendil,Anárion,7134 -Elendil,Gil-galad,7135 
-Elendil,Sauron,7135 -Gil-galad,Sauron,7135 -Gil-galad,Elrond,7142 -Elwing,Eärendil,7145 -Elwing,Lúthien,7145 -Elwing,Dior,7145 -Eärendil,Lúthien,7145 -Eärendil,Dior,7145 -Lúthien,Dior,7145 -Elendil,Gil-galad,7148 -Isildur,Elendil,7149 -Isildur,Gil-galad,7149 -Isildur,Sauron,7149 -Elendil,Gil-galad,7149 -Elendil,Sauron,7149 -Gil-galad,Sauron,7149 -Gil-galad,Círdan,7162 -Isildur,Valandil,7170 -Isildur,Elendil,7170 -Isildur,Ohtar,7170 -Valandil,Elendil,7170 -Valandil,Ohtar,7170 -Elendil,Ohtar,7170 -Isildur,Elendil,7179 -Isildur,Gil-galad,7179 -Isildur,Anárion,7179 -Elendil,Gil-galad,7179 -Elendil,Anárion,7179 -Gil-galad,Anárion,7179 -Meneldil,Anárion,7192 -Elrond,Aragorn,7235 -Isildur,Elendil,7241 -Isildur,Elrond,7241 -Isildur,Aragorn,7241 -Elendil,Elrond,7241 -Elendil,Aragorn,7241 -Elrond,Aragorn,7241 -Frodo,Bilbo,7270 -Aragorn,Boromir,7279 -Isildur,Elendil,7281 -Isildur,Denethor,7281 -Elendil,Denethor,7281 -Gollum,Bilbo,7330 -Frodo,Bilbo,7336 -Galdor,Elrond,7353 -Frodo,Gandalf,7356 -Frodo,Galdor,7356 -Frodo,Glóin,7356 -Gandalf,Galdor,7356 -Gandalf,Glóin,7356 -Galdor,Glóin,7356 -Gollum,Gandalf,7391 -Isildur,Aragorn,7404 -Gollum,Aragorn,7405 -Isildur,Gandalf,7407 -Isildur,Saruman,7434 -Isildur,Boromir,7434 -Saruman,Boromir,7434 -Isildur,Elendil,7440 -Gil-galad,Sauron,7448 -Celebrimbor,Sauron,7454 -Gollum,Denethor,7455 -Gollum,Aragorn,7455 -Denethor,Aragorn,7455 -Gandalf,Elrond,7484 -Sméagol,Gollum,7509 -Legolas,Glóin,7525 -Saruman,Radagast,7581 -Gandalf,Saruman,7599 -Saruman,Sauron,7714 -Saruman,Radagast,7739 -Sauron,Aragorn,7769 -Glorfindel,Galdor,7904 -Gandalf,Elrond,7911 -Glorfindel,Saruman,7913 -Glorfindel,Erestor,7932 -Frodo,Boromir,7948 -Balin,Thrór,7992 -Glorfindel,Sauron,8028 -Bilbo,Boromir,8060 -Gandalf,Bilbo,8062 -Frodo,Elrond,8097 -Beren,Túrin,8105 -Beren,Hador,8105 -Beren,Húrin,8105 -Túrin,Hador,8105 -Túrin,Húrin,8105 -Hador,Húrin,8105 -Pippin,Frodo,8117 -Pippin,Merry,8117 -Pippin,Sam,8117 -Frodo,Merry,8117 -Frodo,Sam,8117 -Merry,Sam,8117 
-Legolas,Gollum,8145 -Sam,Frodo,8150 -Sam,Bilbo,8150 -Frodo,Bilbo,8150 -Elrond,Thranduil,8157 -Elrond,Aragorn,8158 -Frodo,Gandalf,8183 -Frodo,Gandalf,8190 -Frodo,Bilbo,8190 -Gandalf,Bilbo,8190 -Gimli,Legolas,8255 -Gimli,Glóin,8255 -Legolas,Glóin,8255 -Isildur,Aragorn,8257 -Frodo,Boromir,8262 -Pippin,Frodo,8276 -Pippin,Gandalf,8276 -Frodo,Gandalf,8276 -Pippin,Elrond,8286 -Elendil,Aragorn,8292 -Gandalf,Elrond,8295 -Gandalf,Aragorn,8295 -Elrond,Aragorn,8295 -Frodo,Bilbo,8296 -Pippin,Merry,8297 -Pippin,Frodo,8297 -Pippin,Beren,8297 -Pippin,Bilbo,8297 -Pippin,Sam,8297 -Pippin,Lúthien,8297 -Merry,Frodo,8297 -Merry,Beren,8297 -Merry,Bilbo,8297 -Merry,Sam,8297 -Merry,Lúthien,8297 -Frodo,Beren,8297 -Frodo,Bilbo,8297 -Frodo,Sam,8297 -Frodo,Lúthien,8297 -Beren,Bilbo,8297 -Beren,Sam,8297 -Beren,Lúthien,8297 -Bilbo,Sam,8297 -Bilbo,Lúthien,8297 -Sam,Lúthien,8297 -Frodo,Bilbo,8300 -Frodo,Bilbo,8336 -Frodo,Bilbo,8341 -Elrond,Boromir,8373 -Frodo,Bilbo,8379 -Thorin,Gandalf,8380 -Sam,Bill,8384 -Pippin,Sam,8386 -Frodo,Bilbo,8390 -Elrond,Aragorn,8391 -Sam,Frodo,8397 -Gandalf,Elrond,8405 -Gandalf,Aragorn,8438 -Frodo,Gandalf,8459 -Gimli,Legolas,8473 -Sam,Aragorn,8525 -Sam,Aragorn,8534 -Sam,Aragorn,8538 -Sam,Frodo,8563 -Frodo,Gandalf,8598 -Frodo,Aragorn,8598 -Gandalf,Aragorn,8598 -Gandalf,Aragorn,8600 -Gandalf,Aragorn,8614 -Frodo,Aragorn,8619 -Gandalf,Aragorn,8647 -Gimli,Sauron,8686 -Frodo,Merry,8690 -Frodo,Bilbo,8710 -Gandalf,Boromir,8712 -Legolas,Gandalf,8765 -Aragorn,Boromir,8779 -Aragorn,Boromir,8791 -Aragorn,Boromir,8796 -Merry,Aragorn,8822 -Pippin,Legolas,8827 -Pippin,Merry,8827 -Legolas,Merry,8827 -Sam,Boromir,8828 -Gimli,Gandalf,8829 -Gimli,Bill,8829 -Gandalf,Bill,8829 -Frodo,Aragorn,8830 -Pippin,Sam,8866 -Pippin,Merry,8866 -Sam,Merry,8866 -Aragorn,Boromir,8867 -Frodo,Gandalf,8871 -Gandalf,Boromir,8892 -Gandalf,Sauron,8912 -Balin,Fundin,8919 -Sam,Frodo,8952 -Pippin,Sam,8978 -Pippin,Elrond,8978 -Sam,Elrond,8978 -Pippin,Sam,8982 -Gandalf,Aragorn,9006 -Boromir,Aragorn,9018 
-Gandalf,Boromir,9059 -Gimli,Frodo,9098 -Gimli,Gandalf,9098 -Frodo,Gandalf,9098 -Sam,Bill,9134 -Gimli,Legolas,9154 -Gandalf,Bill,9162 -Sam,Frodo,9169 -Sam,Bill,9179 -Gandalf,Fëanor,9210 -Gandalf,Aragorn,9240 -Peregrin,Gandalf,9258 -Sam,Bill,9282 -Gimli,Gandalf,9316 -Sam,Frodo,9329 -Sam,Frodo,9334 -Sam,Frodo,9343 -Sam,Gandalf,9343 -Frodo,Gandalf,9343 -Sam,Frodo,9350 -Gimli,Gandalf,9374 -Legolas,Sam,9402 -Legolas,Frodo,9402 -Legolas,Boromir,9402 -Sam,Frodo,9402 -Sam,Boromir,9402 -Frodo,Boromir,9402 -Gimli,Gandalf,9410 -Gimli,Glóin,9413 -Gimli,Gandalf,9417 -Gimli,Legolas,9444 -Gimli,Boromir,9444 -Gimli,Aragorn,9444 -Legolas,Boromir,9444 -Legolas,Aragorn,9444 -Boromir,Aragorn,9444 -Pippin,Gandalf,9468 -Pippin,Merry,9468 -Gandalf,Merry,9468 -Merry,Aragorn,9478 -Thorin,Bilbo,9605 -Gandalf,Daeron,9670 -Balin,Frodo,9676 -Balin,Bilbo,9676 -Frodo,Bilbo,9676 -Gimli,Frodo,9687 -Ori,Gimli,9717 -Balin,Fundin,9755 -Balin,Gimli,9852 -Aragorn,Boromir,9853 -Pippin,Merry,9861 -Frodo,Aragorn,9864 -Aragorn,Boromir,9870 -Pippin,Frodo,9877 -Pippin,Merry,9877 -Pippin,Aragorn,9877 -Frodo,Merry,9877 -Frodo,Aragorn,9877 -Merry,Aragorn,9877 -Balin,Gimli,9878 -Balin,Legolas,9878 -Gimli,Legolas,9878 -Sam,Frodo,9901 -Frodo,Gandalf,9903 -Gandalf,Bilbo,9982 -Gandalf,Boromir,10098 -Gandalf,Aragorn,10098 -Boromir,Aragorn,10098 -Aragorn,Boromir,10144 -Aragorn,Boromir,10152 -Sam,Frodo,10155 -Sam,Frodo,10235 -Pippin,Sam,10251 -Sam,Frodo,10273 -Sam,Aragorn,10273 -Frodo,Aragorn,10273 -Legolas,Aragorn,10279 -Aragorn,Boromir,10280 -Gimli,Frodo,10298 -Gimli,Sam,10298 -Gimli,Aragorn,10298 -Frodo,Sam,10298 -Frodo,Aragorn,10298 -Sam,Aragorn,10298 -Sam,Aragorn,10299 -Merry,Bilbo,10334 -Sam,Frodo,10356 -Sam,Aragorn,10356 -Frodo,Aragorn,10356 -Gimli,Frodo,10360 -Gimli,Aragorn,10478 -Legolas,Sam,10515 -Legolas,Frodo,10515 -Sam,Frodo,10515 -Legolas,Frodo,10518 -Sam,Frodo,10521 -Orophin,Rúmil,10531 -Haldir,Aragorn,10540 -Frodo,Elrond,10550 -Legolas,Aragorn,10555 -Haldir,Pippin,10568 -Haldir,Legolas,10568 
-Haldir,Merry,10568 -Pippin,Legolas,10568 -Pippin,Merry,10568 -Legolas,Merry,10568 -Legolas,Frodo,10591 -Haldir,Rúmil,10645 -Haldir,Amroth,10795 -Frodo,Aragorn,10843 -Frodo,Aragorn,10845 -Frodo,Amroth,10850 -Galadriel,Celeborn,10863 -Haldir,Frodo,10869 -Haldir,Galadriel,10879 -Haldir,Celeborn,10879 -Galadriel,Celeborn,10879 -Legolas,Frodo,10883 -Galadriel,Celeborn,10892 -Haldir,Frodo,10896 -Gimli,Glóin,10909 -Haldir,Legolas,10933 -Balin,Celeborn,10938 -Balin,Aragorn,10938 -Celeborn,Aragorn,10938 -Frodo,Galadriel,10964 -Legolas,Aragorn,10978 -Frodo,Boromir,11009 -Sam,Frodo,11054 -Sam,Frodo,11062 -Sam,Frodo,11095 -Sam,Frodo,11140 -Frodo,Gandalf,11189 -Frodo,Gandalf,11192 -Frodo,Saruman,11192 -Gandalf,Saruman,11192 -Frodo,Galadriel,11248 -Frodo,Gandalf,11279 -Legolas,Boromir,11333 -Legolas,Aragorn,11333 -Boromir,Aragorn,11333 -Celeborn,Aragorn,11344 -Legolas,Galadriel,11359 -Frodo,Aragorn,11362 -Gandalf,Boromir,11363 -Elendil,Sauron,11364 -Frodo,Gandalf,11365 -Frodo,Boromir,11365 -Gandalf,Boromir,11365 -Frodo,Boromir,11367 -Frodo,Boromir,11375 -Frodo,Boromir,11380 -Frodo,Aragorn,11380 -Boromir,Aragorn,11380 -Pippin,Sam,11382 -Pippin,Merry,11382 -Sam,Merry,11382 -Pippin,Merry,11471 -Pippin,Frodo,11471 -Pippin,Boromir,11471 -Pippin,Gimli,11471 -Pippin,Sam,11471 -Pippin,Aragorn,11471 -Pippin,Legolas,11471 -Merry,Frodo,11471 -Merry,Boromir,11471 -Merry,Gimli,11471 -Merry,Sam,11471 -Merry,Aragorn,11471 -Merry,Legolas,11471 -Frodo,Boromir,11471 -Frodo,Gimli,11471 -Frodo,Sam,11471 -Frodo,Aragorn,11471 -Frodo,Legolas,11471 -Boromir,Gimli,11471 -Boromir,Sam,11471 -Boromir,Aragorn,11471 -Boromir,Legolas,11471 -Gimli,Sam,11471 -Gimli,Aragorn,11471 -Gimli,Legolas,11471 -Sam,Aragorn,11471 -Sam,Legolas,11471 -Aragorn,Legolas,11471 -Galadriel,Celeborn,11486 -Aragorn,Boromir,11516 -Galadriel,Celeborn,11528 -Celeborn,Galadriel,11539 -Celeborn,Aragorn,11539 -Galadriel,Aragorn,11539 -Elendil,Elessar,11549 -Arwen,Celebrían,11551 -Pippin,Merry,11553 -Pippin,Boromir,11553 
-Merry,Boromir,11553 -Gimli,Galadriel,11566 -Gimli,Glóin,11572 -Gimli,Galadriel,11575 -Gimli,Glóin,11589 -Gimli,Glóin,11649 -Gimli,Glóin,11655 -Sam,Frodo,11680 -Gimli,Legolas,11730 -Pippin,Merry,11731 -Pippin,Boromir,11731 -Pippin,Aragorn,11731 -Merry,Boromir,11731 -Merry,Aragorn,11731 -Boromir,Aragorn,11731 -Pippin,Frodo,11732 -Frodo,Aragorn,11736 -Sam,Frodo,11739 -Sam,Frodo,11744 -Sam,Frodo,11771 -Sam,Frodo,11794 -Gollum,Aragorn,11841 -Merry,Aragorn,11895 -Sam,Frodo,11903 -Legolas,Galadriel,11943 -Frodo,Boromir,11956 -Frodo,Boromir,12025 -Frodo,Aragorn,12025 -Boromir,Aragorn,12025 -Legolas,Aragorn,12030 -Legolas,Frodo,12042 -Legolas,Aragorn,12042 -Frodo,Aragorn,12042 -Pippin,Merry,12063 -Aragorn,Boromir,12066 -Sam,Frodo,12117 -Isildur,Anárion,12126 -Isildur,Valandil,12127 -Isildur,Elendil,12127 -Isildur,Elessar,12127 -Valandil,Elendil,12127 -Valandil,Elessar,12127 -Elendil,Elessar,12127 -Frodo,Aragorn,12205 -Sam,Frodo,12226 -Sam,Boromir,12226 -Frodo,Boromir,12226 -Gandalf,Bilbo,12236 -Frodo,Boromir,12260 -Frodo,Boromir,12321 -Pippin,Sam,12469 -Pippin,Merry,12469 -Sam,Merry,12469 -Denethor,Elrond,12500 -Gimli,Sam,12520 -Legolas,Meriadoc,12521 -Legolas,Peregrin,12521 -Legolas,Boromir,12521 -Meriadoc,Peregrin,12521 -Meriadoc,Boromir,12521 -Peregrin,Boromir,12521 -Sam,Aragorn,12563 -Aragorn,Boromir,12601 -Frodo,Boromir,12615 -Pippin,Frodo,12634 -Pippin,Merry,12634 -Frodo,Merry,12634 -Gimli,Legolas,12637 -Sam,Aragorn,12645 -Sam,Frodo,12702 -Sam,Frodo,12730 -Sam,Frodo,12736 -Sam,Frodo,12769 -Samwise,Boromir,12805 -Samwise,Aragorn,12805 -Boromir,Aragorn,12805 -Gimli,Legolas,12876 -Gimli,Legolas,12878 -Legolas,Aragorn,12881 -Pippin,Frodo,12893 -Pippin,Merry,12893 -Pippin,Sam,12893 -Frodo,Merry,12893 -Frodo,Sam,12893 -Merry,Sam,12893 -Gimli,Sauron,12935 -Gandalf,Saruman,12946 -Gimli,Legolas,12961 -Denethor,Boromir,12986 -Frodo,Aragorn,13052 -Gimli,Frodo,13056 -Legolas,Aragorn,13191 -Gimli,Legolas,13238 -Gimli,Legolas,13309 -Gimli,Legolas,13429 -Gimli,Aragorn,13429 
-Legolas,Aragorn,13429 -Saruman,Sauron,13474 -Gimli,Gandalf,13478 -Aragorn,Boromir,13479 -Gimli,Legolas,13530 -Sauron,Aragorn,13562 -Isildur,Elendil,13572 -Isildur,Elessar,13572 -Isildur,Aragorn,13572 -Elendil,Elessar,13572 -Elendil,Aragorn,13572 -Elessar,Aragorn,13572 -Gimli,Legolas,13576 -Legolas,Aragorn,13578 -Denethor,Boromir,13585 -Sauron,Thengel,13588 -Denethor,Sauron,13644 -Gandalf,Saruman,13655 -Gandalf,Shadowfax,13660 -Gandalf,Shadowfax,13663 -Gandalf,Aragorn,13663 -Shadowfax,Aragorn,13663 -Gimli,Legolas,13739 -Gimli,Legolas,13794 -Pippin,Merry,13839 -Legolas,Gandalf,13845 -Gimli,Gandalf,13846 -Gandalf,Aragorn,13848 -Legolas,Aragorn,13870 -Celeborn,Aragorn,13882 -Gimli,Saruman,13908 -Legolas,Aragorn,13909 -Gimli,Legolas,13949 -Gimli,Aragorn,13949 -Legolas,Aragorn,13949 -Pippin,Frodo,13952 -Pippin,Merry,13967 -Gandalf,Elrond,13986 -Pippin,Merry,14151 -Pippin,Merry,14177 -Pippin,Merry,14236 -Pippin,Merry,14331 -Frodo,Gandalf,14364 -Gandalf,Shadowfax,14365 -Pippin,Merry,14394 -Pippin,Merry,14436 -Pippin,Merry,14468 -Pippin,Merry,14544 -Pippin,Merry,14621 -Meriadoc,Merry,14799 -Pippin,Peregrin,14800 -Pippin,Merry,14804 -Pippin,Merry,15032 -Tom,Galadriel,15038 -Tom,Elrond,15038 -Galadriel,Elrond,15038 -Treebeard,Gandalf,15049 -Treebeard,Saruman,15049 -Gandalf,Saruman,15049 -Sam,Gandalf,15050 -Gandalf,Galadriel,15059 -Pippin,Merry,15258 -Treebeard,Merry,15265 -Treebeard,Pippin,15265 -Merry,Pippin,15265 -Pippin,Merry,15267 -Pippin,Merry,15292 -Treebeard,Pippin,15294 -Treebeard,Merry,15298 -Treebeard,Pippin,15298 -Merry,Pippin,15298 -Pippin,Merry,15312 -Pippin,Merry,15338 -Sam,Frodo,15374 -Legolas,Aragorn,15600 -Pippin,Merry,15612 -Pippin,Merry,15619 -Pippin,Boromir,15619 -Merry,Boromir,15619 -Gimli,Legolas,15669 -Gimli,Aragorn,15669 -Legolas,Aragorn,15669 -Pippin,Merry,15672 -Aragorn,Boromir,15901 -Pippin,Merry,15958 -Gandalf,Saruman,16001 -Gandalf,Saruman,16002 -Treebeard,Gandalf,16018 -Pippin,Merry,16036 -Gimli,Saruman,16040 -Legolas,Aragorn,16046 
-Gandalf,Aragorn,16109 -Elessar,Aragorn,16187 -Gandalf,Shadowfax,16250 -Legolas,Aragorn,16259 -Gimli,Shadowfax,16260 -Gandalf,Shadowfax,16268 -Gimli,Legolas,16293 -Gimli,Gandalf,16293 -Gimli,Aragorn,16293 -Legolas,Gandalf,16293 -Legolas,Aragorn,16293 -Gandalf,Aragorn,16293 -Gimli,Gandalf,16298 -Gimli,Legolas,16410 -Elendil,Thengel,16455 -Elendil,Aragorn,16455 -Thengel,Aragorn,16455 -Denethor,Aragorn,16456 -Gandalf,Wormtongue,16556 -Gandalf,Thengel,16571 -Gimli,Gandalf,16579 -Gandalf,Wormtongue,16663 -Gandalf,Wormtongue,16851 -Gandalf,Saruman,16910 -Legolas,Aragorn,16949 -Gimli,Gandalf,16951 -Gimli,Legolas,17015 -Gandalf,Shadowfax,17026 -Legolas,Aragorn,17034 -Gimli,Galadriel,17041 -Gandalf,Shadowfax,17059 -Legolas,Gandalf,17094 -Helm,Erkenbrand,17122 -Helm,Erkenbrand,17178 -Gandalf,Wormtongue,17194 -Helm,Gandalf,17196 -Helm,Erkenbrand,17196 -Gandalf,Erkenbrand,17196 -Legolas,Aragorn,17207 -Helm,Erkenbrand,17239 -Helm,Gamling,17258 -Legolas,Aragorn,17457 -Gamling,Saruman,17476 -Gandalf,Aragorn,17581 -Elendil,Aragorn,17650 -Legolas,Erkenbrand,17707 -Legolas,Aragorn,17707 -Erkenbrand,Aragorn,17707 -Gimli,Gamling,17710 -Gandalf,Saruman,17770 -Gimli,Legolas,17785 -Gimli,Gandalf,17785 -Gimli,Aragorn,17785 -Legolas,Gandalf,17785 -Legolas,Aragorn,17785 -Gandalf,Aragorn,17785 -Gimli,Legolas,17820 -Gimli,Gandalf,17820 -Legolas,Gandalf,17820 -Legolas,Gandalf,17821 -Gimli,Legolas,17828 -Legolas,Helm,17848 -Legolas,Galadriel,17857 -Gimli,Legolas,17881 -Gandalf,Shadowfax,17989 -Shadowfax,Gandalf,18002 -Grimbold,Erkenbrand,18006 -Helm,Saruman,18010 -Saruman,Wormtongue,18116 -Saruman,Wormtongue,18157 -Gimli,Legolas,18177 -Pippin,Merry,18196 -Treebeard,Merry,18213 -Treebeard,Gandalf,18230 -Gimli,Legolas,18252 -Gimli,Aragorn,18252 -Legolas,Aragorn,18252 -Gimli,Merry,18299 -Pippin,Aragorn,18431 -Gimli,Gandalf,18452 -Pippin,Saruman,18465 -Treebeard,Saruman,18528 -Gandalf,Galadriel,18554 -Gandalf,Elrond,18554 -Galadriel,Elrond,18554 -Treebeard,Merry,18634 -Treebeard,Gandalf,18654 
-Treebeard,Gandalf,18664 -Treebeard,Gandalf,18669 -Sam,Frodo,18689 -Sam,Boromir,18689 -Frodo,Boromir,18689 -Saruman,Aragorn,18825 -Treebeard,Merry,18829 -Pippin,Merry,18936 -Saruman,Wormtongue,18954 -Gandalf,Saruman,18988 -Gandalf,Saruman,18993 -Gandalf,Saruman,19202 -Gandalf,Saruman,19207 -Saruman,Aragorn,19218 -Gandalf,Saruman,19271 -Gimli,Legolas,19275 -Gimli,Aragorn,19275 -Legolas,Aragorn,19275 -Treebeard,Gandalf,19276 -Gimli,Legolas,19292 -Gimli,Legolas,19300 -Pippin,Merry,19326 -Pippin,Gandalf,19362 -Pippin,Merry,19362 -Pippin,Aragorn,19362 -Gandalf,Merry,19362 -Gandalf,Aragorn,19362 -Merry,Aragorn,19362 -Pippin,Merry,19366 -Pippin,Merry,19437 -Pippin,Merry,19453 -Gandalf,Saruman,19471 -Pippin,Gandalf,19475 -Pippin,Sam,19489 -Pippin,Gandalf,19519 -Gandalf,Aragorn,19687 -Pippin,Gandalf,19756 -Pippin,Gandalf,19762 -Pippin,Aragorn,19762 -Gandalf,Aragorn,19762 -Merry,Aragorn,19771 -Shadowfax,Gandalf,19793 -Elendil,Elrond,19848 -Wormtongue,Aragorn,19918 -Peregrin,Shadowfax,19921 -Pippin,Gandalf,19957 -Sam,Frodo,20041 -Sam,Frodo,20047 -Sam,Frodo,20230 -Sam,Frodo,20267 -Frodo,Bilbo,20483 -Frodo,Gollum,20519 -Sam,Frodo,20598 -Sam,Frodo,20607 -Sam,Gollum,20627 -Frodo,Gollum,20653 -Sam,Frodo,20655 -Sam,Gollum,20686 -Frodo,Gollum,20688 -Sam,Frodo,20735 -Sam,Gollum,20769 -Sam,Frodo,20777 -Sam,Frodo,20792 -Sam,Gollum,20838 -Sam,Frodo,20844 -Sam,Gollum,20844 -Frodo,Gollum,20844 -Sam,Frodo,20849 -Sam,Gollum,20859 -Sam,Gollum,20861 -Sam,Frodo,20888 -Frodo,Gollum,20903 -Sam,Samwise,20916 -Sam,Frodo,20985 -Sam,Gollum,20985 -Frodo,Gollum,20985 -Sam,Frodo,21041 -Sam,Frodo,21066 -Sam,Frodo,21137 -Sam,Frodo,21147 -Sam,Frodo,21153 -Sam,Gollum,21167 -Sam,Frodo,21168 -Sam,Gollum,21172 -Sam,Frodo,21214 -Sam,Frodo,21229 -Frodo,Gollum,21299 -Sam,Gollum,21301 -Frodo,Gollum,21369 -Sam,Gollum,21455 -Frodo,Gollum,21466 -Frodo,Gollum,21490 -Sam,Frodo,21492 -Sam,Gollum,21492 -Frodo,Gollum,21492 -Frodo,Gollum,21501 -Frodo,Gandalf,21551 -Frodo,Bilbo,21551 -Gandalf,Bilbo,21551 
-Frodo,Gollum,21558 -Isildur,Elendil,21588 -Isildur,Frodo,21588 -Elendil,Frodo,21588 -Sam,Frodo,21626 -Sam,Gollum,21626 -Frodo,Gollum,21626 -Gollum,Aragorn,21673 -Frodo,Gollum,21680 -Frodo,Gollum,21683 -Gollum,Aragorn,21687 -Gandalf,Aragorn,21702 -Gandalf,Saruman,21703 -Gandalf,Aragorn,21703 -Saruman,Aragorn,21703 -Frodo,Samwise,21705 -Frodo,Gandalf,21706 -Sam,Frodo,21727 -Frodo,Gollum,21753 -Sam,Frodo,21765 -Frodo,Gollum,21825 -Sam,Frodo,21860 -Sam,Gollum,21860 -Frodo,Gollum,21860 -Sam,Gollum,21887 -Frodo,Elrond,21938 -Sam,Gollum,21945 -Sam,Frodo,21970 -Sam,Gollum,21970 -Frodo,Gollum,21970 -Sam,Frodo,22061 -Sam,Gollum,22081 -Sam,Frodo,22143 -Frodo,Boromir,22150 -Frodo,Hamfast,22183 -Frodo,Samwise,22183 -Hamfast,Samwise,22183 -Boromir,Aragorn,22187 -Denethor,Boromir,22194 -Mablung,Damrod,22233 -Sam,Frodo,22280 -Sam,Faramir,22341 -Frodo,Faramir,22343 -Sam,Frodo,22349 -Sam,Boromir,22349 -Frodo,Boromir,22349 -Elendil,Boromir,22366 -Isildur,Elendil,22367 -Isildur,Aragorn,22367 -Elendil,Aragorn,22367 -Sam,Frodo,22384 -Sam,Faramir,22384 -Frodo,Faramir,22384 -Frodo,Boromir,22391 -Frodo,Denethor,22441 -Frodo,Faramir,22441 -Denethor,Faramir,22441 -Mablung,Damrod,22556 -Samwise,Frodo,22557 -Samwise,Faramir,22557 -Frodo,Faramir,22557 -Sam,Frodo,22568 -Sam,Mablung,22568 -Sam,Damrod,22568 -Sam,Faramir,22568 -Frodo,Mablung,22568 -Frodo,Damrod,22568 -Frodo,Faramir,22568 -Mablung,Damrod,22568 -Mablung,Faramir,22568 -Damrod,Faramir,22568 -Samwise,Faramir,22571 -Isildur,Frodo,22593 -Boromir,Faramir,22687 -Mablung,Damrod,22692 -Mablung,Damrod,22710 -Sam,Frodo,22718 -Mablung,Damrod,22723 -Sam,Frodo,22824 -Sam,Faramir,22824 -Frodo,Faramir,22824 -Sam,Frodo,22832 -Sam,Frodo,22844 -Frodo,Boromir,22845 -Frodo,Aragorn,22849 -Boromir,Faramir,22852 -Sam,Faramir,22890 -Samwise,Faramir,22891 -Bilbo,Aragorn,22908 -Sam,Frodo,22959 -Frodo,Faramir,22986 -Frodo,Faramir,23030 -Sam,Frodo,23064 -Frodo,Faramir,23077 -Frodo,Faramir,23094 -Anborn,Faramir,23143 -Anborn,Frodo,23166 -Frodo,Gandalf,23212 
-Frodo,Gollum,23277 -Frodo,Faramir,23277 -Gollum,Faramir,23277 -Anborn,Gollum,23341 -Frodo,Faramir,23375 -Gollum,Faramir,23389 -Frodo,Gollum,23399 -Frodo,Faramir,23420 -Frodo,Gollum,23435 -Frodo,Faramir,23435 -Gollum,Faramir,23435 -Anborn,Gollum,23477 -Sam,Frodo,23545 -Frodo,Elrond,23572 -Frodo,Gollum,23576 -Frodo,Faramir,23576 -Gollum,Faramir,23576 -Samwise,Faramir,23577 -Frodo,Gollum,23578 -Sam,Frodo,23617 -Sam,Gollum,23624 -Sam,Frodo,23678 -Sam,Gollum,23678 -Frodo,Gollum,23678 -Sam,Frodo,23726 -Sam,Gollum,23726 -Frodo,Gollum,23726 -Sam,Gandalf,23787 -Sam,Gollum,23789 -Sam,Frodo,23816 -Sam,Frodo,23837 -Frodo,Gollum,23855 -Sam,Frodo,23864 -Sam,Gollum,23890 -Sam,Frodo,23896 -Sam,Frodo,23910 -Sam,Frodo,23917 -Sam,Frodo,23940 -Gandalf,Galadriel,24026 -Gandalf,Faramir,24026 -Gandalf,Elrond,24026 -Gandalf,Aragorn,24026 -Galadriel,Faramir,24026 -Galadriel,Elrond,24026 -Galadriel,Aragorn,24026 -Faramir,Elrond,24026 -Faramir,Aragorn,24026 -Elrond,Aragorn,24026 -Sam,Frodo,24050 -Sam,Frodo,24058 -Sam,Frodo,24099 -Sam,Frodo,24138 -Sam,Frodo,24219 -Sam,Frodo,24220 -Sam,Frodo,24253 -Sam,Frodo,24284 -Sam,Frodo,24292 -Sam,Frodo,24334 -Frodo,Gollum,24339 -Sam,Frodo,24355 -Gollum,Shelob,24375 -Sam,Frodo,24413 -Sam,Frodo,24436 -Sam,Frodo,24442 -Sam,Frodo,24515 -Gollum,Faramir,24578 -Ungoliant,Shelob,24618 -Sam,Frodo,24664 -Sam,Gollum,24681 -Sam,Gollum,24687 -Sam,Gollum,24690 -Sam,Gollum,24692 -Sam,Gollum,24693 -Sam,Frodo,24711 -Sam,Frodo,24715 -Sam,Samwise,24715 -Frodo,Samwise,24715 -Sam,Shelob,24736 -Sam,Frodo,24742 -Hamfast,Samwise,24753 -Frodo,Galadriel,24792 -Frodo,Faramir,24816 -Frodo,Bilbo,24817 -Frodo,Bilbo,24857 -Sam,Frodo,24873 -Sam,Shagrat,25066 -Shelob,Shagrat,25096 -Gorbag,Shagrat,25308 -Gorbag,Shagrat,25310 -Pippin,Gandalf,25348 -Pippin,Gandalf,25359 -Pippin,Gandalf,25366 -Pippin,Gandalf,25380 -Pippin,Gandalf,25394 -Gandalf,Denethor,25399 -Gandalf,Boromir,25411 -Amroth,Imrahil,25440 -Pippin,Gandalf,25441 -Pippin,Ecthelion,25446 -Peregrin,Gandalf,25447 
-Gandalf,Shadowfax,25472 -Pippin,Gandalf,25480 -Pippin,Gandalf,25485 -Denethor,Ecthelion,25521 -Pippin,Boromir,25523 -Pippin,Aragorn,25523 -Boromir,Aragorn,25523 -Gandalf,Faramir,25533 -Pippin,Boromir,25541 -Pippin,Denethor,25550 -Meriadoc,Pippin,25560 -Pippin,Denethor,25561 -Pippin,Gandalf,25572 -Pippin,Denethor,25573 -Pippin,Peregrin,25574 -Pippin,Denethor,25574 -Pippin,Ecthelion,25574 -Peregrin,Denethor,25574 -Peregrin,Ecthelion,25574 -Denethor,Ecthelion,25574 -Pippin,Gandalf,25578 -Gandalf,Denethor,25579 -Théoden,Saruman,25583 -Pippin,Gandalf,25584 -Gandalf,Denethor,25585 -Pippin,Gandalf,25586 -Treebeard,Gandalf,25589 -Gandalf,Denethor,25592 -Pippin,Gandalf,25599 -Pippin,Denethor,25600 -Pippin,Gandalf,25621 -Pippin,Gandalf,25629 -Isildur,Denethor,25635 -Isildur,Boromir,25635 -Denethor,Boromir,25635 -Pippin,Boromir,25636 -Pippin,Faramir,25636 -Boromir,Faramir,25636 -Denethor,Faramir,25654 -Beregond,Aragorn,25692 -Pippin,Peregrin,25697 -Gandalf,Shadowfax,25715 -Beregond,Shadowfax,25716 -Pippin,Shadowfax,25723 -Pippin,Shadowfax,25726 -Beregond,Pippin,25741 -Beregond,Pippin,25749 -Beregond,Peregrin,25753 -Beregond,Pippin,25780 -Pippin,Peregrin,25817 -Pippin,Peregrin,25867 -Beregond,Gandalf,25868 -Beregond,Pippin,25868 -Gandalf,Pippin,25868 -Pippin,Beregond,25869 -Pippin,Denethor,25872 -Pippin,Boromir,25872 -Denethor,Boromir,25872 -Beregond,Bergil,25917 -Pippin,Merry,25928 -Pippin,Bergil,25928 -Merry,Bergil,25928 -Pippin,Bergil,25930 -Pippin,Bergil,25935 -Pippin,Forlong,25939 -Forlong,Bergil,25941 -Amroth,Imrahil,25961 -Pippin,Gandalf,25987 -Pippin,Faramir,26001 -Gandalf,Merry,26010 -Gandalf,Shadowfax,26010 -Gandalf,Aragorn,26010 -Merry,Shadowfax,26010 -Merry,Aragorn,26010 -Shadowfax,Aragorn,26010 -Gimli,Legolas,26013 -Merry,Aragorn,26031 -Gimli,Legolas,26034 -Gimli,Merry,26034 -Gimli,Aragorn,26034 -Legolas,Merry,26034 -Legolas,Aragorn,26034 -Merry,Aragorn,26034 -Merry,Aragorn,26042 -Théoden,Saruman,26073 -Halbarad,Aragorn,26089 -Gimli,Legolas,26099 
-Gimli,Merry,26099 -Legolas,Merry,26099 -Gimli,Legolas,26102 -Gimli,Halbarad,26115 -Legolas,Aragorn,26116 -Legolas,Gandalf,26125 -Legolas,Galadriel,26125 -Gandalf,Galadriel,26125 -Gimli,Gandalf,26126 -Meriadoc,Théoden,26151 -Théoden,Merry,26160 -Théoden,Aragorn,26160 -Merry,Aragorn,26160 -Éomer,Elrond,26169 -Éomer,Halbarad,26169 -Éomer,Aragorn,26169 -Elrond,Halbarad,26169 -Elrond,Aragorn,26169 -Halbarad,Aragorn,26169 -Gimli,Legolas,26170 -Merry,Aragorn,26171 -Éomer,Théoden,26176 -Éomer,Merry,26186 -Éomer,Aragorn,26186 -Merry,Aragorn,26186 -Éomer,Aragorn,26188 -Éomer,Théoden,26190 -Éomer,Aragorn,26190 -Théoden,Aragorn,26190 -Gimli,Legolas,26197 -Gimli,Merry,26197 -Legolas,Merry,26197 -Éomer,Théoden,26202 -Gimli,Legolas,26212 -Gandalf,Aragorn,26219 -Isildur,Elendil,26234 -Isildur,Théoden,26234 -Isildur,Sauron,26234 -Elendil,Théoden,26234 -Elendil,Sauron,26234 -Théoden,Sauron,26234 -Gimli,Aragorn,26236 -Legolas,Elrond,26249 -Legolas,Aragorn,26249 -Elrond,Aragorn,26249 -Arvedui,Aragorn,26250 -Gimli,Aragorn,26257 -Gimli,Legolas,26260 -Gimli,Aragorn,26260 -Legolas,Aragorn,26260 -Isildur,Sauron,26263 -Isildur,Sauron,26266 -Gimli,Legolas,26272 -Gimli,Aragorn,26272 -Legolas,Aragorn,26272 -Gimli,Legolas,26274 -Helm,Halbarad,26276 -Éowyn,Elrond,26278 -Éowyn,Aragorn,26278 -Elrond,Aragorn,26278 -Helm,Théoden,26279 -Éowyn,Aragorn,26283 -Gimli,Legolas,26295 -Gimli,Aragorn,26295 -Legolas,Aragorn,26295 -Gimli,Legolas,26330 -Gimli,Glóin,26361 -Gimli,Aragorn,26362 -Gimli,Glóin,26371 -Gimli,Legolas,26398 -Gimli,Legolas,26400 -Gimli,Amroth,26407 -Isildur,Elessar,26428 -Isildur,Halbarad,26428 -Elessar,Halbarad,26428 -Gimli,Legolas,26433 -Pippin,Amroth,26438 -Gimli,Pippin,26465 -Gimli,Legolas,26465 -Gimli,Aragorn,26465 -Pippin,Legolas,26465 -Pippin,Aragorn,26465 -Legolas,Aragorn,26465 -Sam,Frodo,26466 -Éomer,Théoden,26476 -Gandalf,Shadowfax,26497 -Dúnhere,Gandalf,26500 -Éowyn,Théoden,26544 -Éowyn,Merry,26544 -Théoden,Merry,26544 -Éomer,Aragorn,26549 -Pippin,Gandalf,26571 
-Pippin,Frodo,26571 -Pippin,Gimli,26571 -Pippin,Sam,26571 -Pippin,Legolas,26571 -Gandalf,Frodo,26571 -Gandalf,Gimli,26571 -Gandalf,Sam,26571 -Gandalf,Legolas,26571 -Frodo,Gimli,26571 -Frodo,Sam,26571 -Frodo,Legolas,26571 -Gimli,Sam,26571 -Gimli,Legolas,26571 -Sam,Legolas,26571 -Éowyn,Dúnhere,26576 -Éowyn,Éomer,26576 -Éowyn,Théoden,26576 -Dúnhere,Éomer,26576 -Dúnhere,Théoden,26576 -Éomer,Théoden,26576 -Éomer,Aragorn,26584 -Brego,Baldor,26592 -Merry,Aragorn,26598 -Éowyn,Éomer,26599 -Brego,Baldor,26603 -Éomer,Aragorn,26614 -Merry,Boromir,26622 -Hirgon,Denethor,26628 -Théoden,Denethor,26630 -Hirgon,Denethor,26634 -Hirgon,Gandalf,26638 -Hirgon,Denethor,26638 -Gandalf,Denethor,26638 -Éomer,Théoden,26705 -Éomer,Merry,26706 -Éowyn,Merry,26712 -Théoden,Merry,26714 -Éowyn,Aragorn,26721 -Gimli,Merry,26725 -Meriadoc,Merry,26759 -Pippin,Gandalf,26788 -Pippin,Denethor,26800 -Pippin,Gandalf,26801 -Éomer,Gandalf,26819 -Éomer,Denethor,26819 -Gandalf,Denethor,26819 -Pippin,Denethor,26820 -Pippin,Denethor,26821 -Pippin,Gandalf,26862 -Beregond,Pippin,26868 -Beregond,Faramir,26868 -Pippin,Faramir,26868 -Beregond,Faramir,26909 -Beregond,Pippin,26910 -Gandalf,Shadowfax,26929 -Pippin,Faramir,26930 -Pippin,Boromir,26932 -Pippin,Denethor,26949 -Pippin,Faramir,26953 -Pippin,Gandalf,26955 -Pippin,Gandalf,26957 -Pippin,Faramir,26957 -Gandalf,Faramir,26957 -Pippin,Frodo,26958 -Pippin,Gandalf,26958 -Frodo,Gandalf,26958 -Pippin,Gandalf,26959 -Boromir,Denethor,26991 -Boromir,Faramir,26991 -Denethor,Faramir,26991 -Boromir,Denethor,26998 -Boromir,Faramir,26998 -Denethor,Faramir,26998 -Pippin,Gandalf,27035 -Pippin,Denethor,27035 -Gandalf,Denethor,27035 -Pippin,Gandalf,27056 -Pippin,Gandalf,27058 -Pippin,Frodo,27060 -Pippin,Gandalf,27060 -Frodo,Gandalf,27060 -Pippin,Gollum,27090 -Frodo,Gollum,27094 -Boromir,Faramir,27114 -Denethor,Boromir,27125 -Gandalf,Faramir,27128 -Beregond,Faramir,27161 -Nazgûl,Denethor,27184 -Nazgûl,Sauron,27184 -Denethor,Sauron,27184 -Pippin,Gandalf,27187 -Shadowfax,Amroth,27234 
-Shadowfax,Faramir,27234 -Amroth,Faramir,27234 -Denethor,Faramir,27255 -Nazgûl,Faramir,27259 -Imrahil,Faramir,27261 -Denethor,Faramir,27265 -Pippin,Gandalf,27269 -Gandalf,Denethor,27322 -Denethor,Faramir,27350 -Denethor,Faramir,27362 -Denethor,Faramir,27368 -Denethor,Faramir,27387 -Pippin,Denethor,27389 -Denethor,Faramir,27404 -Pippin,Denethor,27422 -Beregond,Pippin,27428 -Beregond,Faramir,27428 -Pippin,Faramir,27428 -Beregond,Pippin,27435 -Beregond,Faramir,27435 -Pippin,Faramir,27435 -Gandalf,Shadowfax,27488 -Pippin,Merry,27536 -Éomer,Merry,27539 -Éomer,Théoden,27567 -Théoden,Ghân-buri-Ghân,27665 -Éomer,Denethor,27690 -Éomer,Théoden,27771 -Théoden,Thengel,27796 -Éowyn,Merry,27873 -Éowyn,Meriadoc,27881 -Éomer,Amroth,27905 -Merry,Gandalf,27906 -Éowyn,Éomer,27908 -Éomer,Théoden,27918 -Éowyn,Théoden,27951 -Imrahil,Amroth,27953 -Éowyn,Éomer,27962 -Éomer,Imrahil,27972 -Éomer,Húrin,27972 -Imrahil,Húrin,27972 -Arwen,Elrond,28013 -Isildur,Elessar,28014 -Isildur,Aragorn,28014 -Elessar,Aragorn,28014 -Gimli,Legolas,28019 -Gimli,Halbarad,28019 -Legolas,Halbarad,28019 -Elendil,Aragorn,28020 -Éomer,Aragorn,28021 -Éomer,Imrahil,28034 -Éomer,Aragorn,28034 -Imrahil,Aragorn,28034 -Grimbold,Halbarad,28038 -Grimbold,Dúnhere,28044 -Grimbold,Fastred,28044 -Grimbold,Horn,28044 -Grimbold,Harding,28044 -Dúnhere,Fastred,28044 -Dúnhere,Horn,28044 -Dúnhere,Harding,28044 -Fastred,Horn,28044 -Fastred,Harding,28044 -Horn,Harding,28044 -Gandalf,Denethor,28049 -Gandalf,Shadowfax,28053 -Pippin,Shadowfax,28055 -Pippin,Faramir,28067 -Pippin,Denethor,28070 -Pippin,Faramir,28070 -Denethor,Faramir,28070 -Pippin,Gandalf,28073 -Gandalf,Faramir,28074 -Pippin,Shadowfax,28077 -Pippin,Beregond,28089 -Beregond,Denethor,28102 -Pippin,Gandalf,28104 -Pippin,Denethor,28104 -Gandalf,Denethor,28104 -Gandalf,Denethor,28109 -Denethor,Faramir,28116 -Beregond,Gandalf,28122 -Beregond,Pippin,28122 -Beregond,Denethor,28122 -Gandalf,Pippin,28122 -Gandalf,Denethor,28122 -Pippin,Denethor,28122 -Gandalf,Denethor,28174 
-Beregond,Faramir,28177 -Beregond,Gandalf,28191 -Beregond,Denethor,28191 -Beregond,Ecthelion,28191 -Gandalf,Denethor,28191 -Gandalf,Ecthelion,28191 -Denethor,Ecthelion,28191 -Beregond,Faramir,28195 -Beregond,Gandalf,28197 -Beregond,Pippin,28197 -Beregond,Faramir,28197 -Gandalf,Pippin,28197 -Gandalf,Faramir,28197 -Pippin,Faramir,28197 -Gandalf,Amroth,28204 -Beregond,Gandalf,28210 -Beregond,Pippin,28210 -Beregond,Faramir,28210 -Gandalf,Pippin,28210 -Gandalf,Faramir,28210 -Pippin,Faramir,28210 -Pippin,Beregond,28212 -Denethor,Sauron,28225 -Beregond,Faramir,28229 -Éowyn,Théoden,28249 -Pippin,Merry,28276 -Beregond,Bergil,28285 -Éowyn,Meriadoc,28301 -Éowyn,Faramir,28301 -Meriadoc,Faramir,28301 -Éomer,Imrahil,28323 -Éomer,Aragorn,28323 -Imrahil,Aragorn,28323 -Éomer,Elendil,28327 -Éomer,Imrahil,28334 -Éowyn,Éomer,28338 -Éowyn,Imrahil,28339 -Éowyn,Gandalf,28345 -Denethor,Faramir,28346 -Galadriel,Aragorn,28350 -Amroth,Faramir,28352 -Éomer,Imrahil,28365 -Elessar,Aragorn,28366 -Éowyn,Meriadoc,28368 -Éowyn,Gandalf,28368 -Meriadoc,Gandalf,28368 -Éowyn,Merry,28370 -Éowyn,Faramir,28370 -Éowyn,Aragorn,28370 -Merry,Faramir,28370 -Merry,Aragorn,28370 -Faramir,Aragorn,28370 -Éomer,Faramir,28373 -Éomer,Elrond,28373 -Éomer,Aragorn,28373 -Faramir,Elrond,28373 -Faramir,Aragorn,28373 -Elrond,Aragorn,28373 -Gandalf,Faramir,28386 -Shadowfax,Aragorn,28387 -Gandalf,Aragorn,28390 -Aragorn,Faramir,28419 -Faramir,Aragorn,28421 -Faramir,Aragorn,28432 -Faramir,Aragorn,28436 -Beregond,Gandalf,28443 -Beregond,Imrahil,28443 -Gandalf,Imrahil,28443 -Pippin,Gandalf,28444 -Éowyn,Aragorn,28448 -Théoden,Wormtongue,28464 -Saruman,Wormtongue,28468 -Éomer,Aragorn,28472 -Éowyn,Aragorn,28483 -Éowyn,Aragorn,28484 -Éomer,Éowyn,28488 -Éowyn,Éomer,28499 -Éomer,Gandalf,28503 -Pippin,Gandalf,28510 -Pippin,Merry,28510 -Pippin,Aragorn,28510 -Gandalf,Merry,28510 -Gandalf,Aragorn,28510 -Merry,Aragorn,28510 -Pippin,Merry,28511 -Merry,Aragorn,28516 -Pippin,Gandalf,28518 -Pippin,Aragorn,28528 -Meriadoc,Saruman,28532 
-Meriadoc,Aragorn,28532 -Saruman,Aragorn,28532 -Merry,Gandalf,28543 -Éowyn,Gandalf,28565 -Éowyn,Faramir,28565 -Éowyn,Aragorn,28565 -Gandalf,Faramir,28565 -Gandalf,Aragorn,28565 -Faramir,Aragorn,28565 -Éowyn,Gandalf,28566 -Éowyn,Faramir,28566 -Éowyn,Aragorn,28566 -Gandalf,Faramir,28566 -Gandalf,Aragorn,28566 -Faramir,Aragorn,28566 -Beregond,Meriadoc,28568 -Elrond,Aragorn,28573 -Gimli,Pippin,28578 -Gimli,Legolas,28578 -Gimli,Merry,28578 -Pippin,Legolas,28578 -Pippin,Merry,28578 -Legolas,Merry,28578 -Gimli,Legolas,28579 -Legolas,Aragorn,28581 -Legolas,Imrahil,28583 -Legolas,Aragorn,28583 -Imrahil,Aragorn,28583 -Legolas,Aragorn,28587 -Meriadoc,Peregrin,28589 -Meriadoc,Imrahil,28589 -Peregrin,Imrahil,28589 -Legolas,Merry,28603 -Legolas,Merry,28619 -Gimli,Glóin,28632 -Éowyn,Merry,28635 -Pippin,Legolas,28639 -Pippin,Merry,28639 -Legolas,Merry,28639 -Angbor,Aragorn,28652 -Lúthien,Sauron,28683 -Isildur,Aragorn,28690 -Gandalf,Aragorn,28715 -Théoden,Imrahil,28719 -Théoden,Gimli,28719 -Théoden,Aragorn,28719 -Théoden,Éomer,28719 -Théoden,Legolas,28719 -Imrahil,Gimli,28719 -Imrahil,Aragorn,28719 -Imrahil,Éomer,28719 -Imrahil,Legolas,28719 -Gimli,Aragorn,28719 -Gimli,Éomer,28719 -Gimli,Legolas,28719 -Aragorn,Éomer,28719 -Aragorn,Legolas,28719 -Éomer,Legolas,28719 -Gandalf,Elrond,28720 -Gandalf,Aragorn,28720 -Elrond,Aragorn,28720 -Amroth,Imrahil,28730 -Gandalf,Sauron,28793 -Imrahil,Aragorn,28799 -Imrahil,Gimli,28818 -Imrahil,Glóin,28818 -Imrahil,Aragorn,28818 -Gimli,Glóin,28818 -Gimli,Aragorn,28818 -Glóin,Aragorn,28818 -Éomer,Elrond,28820 -Éomer,Amroth,28820 -Éomer,Imrahil,28820 -Éomer,Aragorn,28820 -Elrond,Amroth,28820 -Elrond,Imrahil,28820 -Elrond,Aragorn,28820 -Amroth,Imrahil,28820 -Amroth,Aragorn,28820 -Imrahil,Aragorn,28820 -Gimli,Legolas,28836 -Gimli,Gandalf,28836 -Gimli,Elrond,28836 -Gimli,Aragorn,28836 -Legolas,Gandalf,28836 -Legolas,Elrond,28836 -Legolas,Aragorn,28836 -Gandalf,Elrond,28836 -Gandalf,Aragorn,28836 -Elrond,Aragorn,28836 -Gandalf,Imrahil,28872 
-Gandalf,Faramir,28872 -Imrahil,Faramir,28872 -Gandalf,Aragorn,28876 -Nazgûl,Aragorn,28894 -Gandalf,Imrahil,28926 -Gandalf,Gimli,28926 -Gandalf,Peregrin,28926 -Gandalf,Elrond,28926 -Gandalf,Aragorn,28926 -Gandalf,Éomer,28926 -Gandalf,Legolas,28926 -Imrahil,Gimli,28926 -Imrahil,Peregrin,28926 -Imrahil,Elrond,28926 -Imrahil,Aragorn,28926 -Imrahil,Éomer,28926 -Imrahil,Legolas,28926 -Gimli,Peregrin,28926 -Gimli,Elrond,28926 -Gimli,Aragorn,28926 -Gimli,Éomer,28926 -Gimli,Legolas,28926 -Peregrin,Elrond,28926 -Peregrin,Aragorn,28926 -Peregrin,Éomer,28926 -Peregrin,Legolas,28926 -Elrond,Aragorn,28926 -Elrond,Éomer,28926 -Elrond,Legolas,28926 -Aragorn,Éomer,28926 -Aragorn,Legolas,28926 -Éomer,Legolas,28926 -Gandalf,Sauron,28956 -Sam,Frodo,28958 -Pippin,Imrahil,28960 -Saruman,Sauron,28982 -Elrond,Amroth,29020 -Elrond,Imrahil,29020 -Amroth,Imrahil,29020 -Beregond,Frodo,29024 -Beregond,Gandalf,29024 -Beregond,Pippin,29024 -Beregond,Imrahil,29024 -Frodo,Gandalf,29024 -Frodo,Pippin,29024 -Frodo,Imrahil,29024 -Gandalf,Pippin,29024 -Gandalf,Imrahil,29024 -Pippin,Imrahil,29024 -Beregond,Pippin,29040 -Pippin,Merry,29069 -Pippin,Denethor,29069 -Pippin,Aragorn,29069 -Merry,Denethor,29069 -Merry,Aragorn,29069 -Denethor,Aragorn,29069 -Sam,Frodo,29070 -Hamfast,Samwise,29072 -Frodo,Shelob,29084 -Frodo,Shagrat,29084 -Shelob,Shagrat,29084 -Gorbag,Shagrat,29101 -Gorbag,Shagrat,29163 -Gorbag,Shagrat,29164 -Gorbag,Sam,29169 -Sam,Frodo,29207 -Gorbag,Shagrat,29246 -Gorbag,Shagrat,29288 -Nazgûl,Shagrat,29309 -Sam,Shagrat,29317 -Sam,Shagrat,29323 -Sam,Shagrat,29344 -Sam,Shagrat,29350 -Sam,Frodo,29427 -Sam,Frodo,29440 -Sam,Frodo,29449 -Sam,Frodo,29461 -Sam,Frodo,29480 -Sam,Frodo,29499 -Sam,Frodo,29503 -Sam,Frodo,29511 -Sam,Frodo,29521 -Sam,Frodo,29532 -Sam,Frodo,29545 -Gorbag,Sam,29578 -Sam,Frodo,29583 -Sam,Frodo,29584 -Sam,Frodo,29593 -Sam,Faramir,29619 -Sam,Frodo,29623 -Sam,Galadriel,29649 -Sam,Frodo,29654 -Sam,Frodo,29679 -Sam,Frodo,29684 -Sam,Frodo,29689 -Sam,Frodo,29694 -Sam,Frodo,29709 
-Sam,Shagrat,29717 -Sam,Frodo,29739 -Sam,Frodo,29751 -Sam,Frodo,29764 -Sam,Frodo,29780 -Sam,Frodo,29788 -Gorbag,Shagrat,29792 -Sam,Frodo,29795 -Sam,Frodo,29807 -Sam,Frodo,29836 -Sam,Frodo,29851 -Sam,Faramir,29855 -Sam,Frodo,29863 -Sam,Frodo,29874 -Sam,Frodo,29888 -Sam,Frodo,29972 -Sam,Frodo,29987 -Sam,Shelob,29987 -Sam,Gollum,29987 -Frodo,Shelob,29987 -Frodo,Gollum,29987 -Shelob,Gollum,29987 -Sam,Frodo,29988 -Sam,Frodo,30000 -Sam,Frodo,30011 -Sam,Frodo,30029 -Sam,Frodo,30031 -Sam,Frodo,30035 -Sam,Frodo,30042 -Sam,Frodo,30043 -Frodo,Gollum,30061 -Sam,Frodo,30064 -Sam,Frodo,30085 -Sam,Frodo,30118 -Sam,Frodo,30141 -Sam,Frodo,30153 -Sam,Frodo,30170 -Frodo,Gandalf,30173 -Sam,Frodo,30187 -Sam,Frodo,30276 -Sam,Faramir,30276 -Frodo,Faramir,30276 -Sam,Frodo,30316 -Sam,Frodo,30351 -Sam,Frodo,30365 -Sam,Frodo,30368 -Sam,Frodo,30371 -Sam,Frodo,30379 -Sam,Frodo,30413 -Sam,Frodo,30419 -Frodo,Gollum,30437 -Sam,Gollum,30440 -Sam,Frodo,30453 -Sam,Gollum,30453 -Frodo,Gollum,30453 -Sam,Gollum,30488 -Sam,Frodo,30513 -Sam,Gollum,30536 -Sam,Frodo,30547 -Gollum,Gandalf,30571 -Gandalf,Sauron,30601 -Gandalf,Aragorn,30610 -Meneldor,Gandalf,30615 -Sam,Frodo,30618 -Sam,Frodo,30622 -Sam,Frodo,30628 -Sam,Frodo,30630 -Sam,Gandalf,30668 -Gandalf,Sauron,30681 -Sam,Frodo,30694 -Sam,Galadriel,30694 -Frodo,Galadriel,30694 -Frodo,Samwise,30706 -Sam,Frodo,30716 -Sam,Frodo,30721 -Sam,Aragorn,30723 -Sam,Frodo,30725 -Sam,Frodo,30729 -Sam,Frodo,30736 -Frodo,Gandalf,30737 -Sam,Frodo,30741 -Frodo,Gandalf,30744 -Frodo,Bilbo,30744 -Gandalf,Bilbo,30744 -Éomer,Gimli,30745 -Éomer,Legolas,30745 -Éomer,Gandalf,30745 -Éomer,Imrahil,30745 -Gimli,Legolas,30745 -Gimli,Gandalf,30745 -Gimli,Imrahil,30745 -Legolas,Gandalf,30745 -Legolas,Imrahil,30745 -Gandalf,Imrahil,30745 -Peregrin,Merry,30751 -Pippin,Merry,30759 -Pippin,Gandalf,30759 -Pippin,Frodo,30759 -Pippin,Gimli,30759 -Pippin,Sam,30759 -Pippin,Legolas,30759 -Merry,Gandalf,30759 -Merry,Frodo,30759 -Merry,Gimli,30759 -Merry,Sam,30759 -Merry,Legolas,30759 
-Gandalf,Frodo,30759 -Gandalf,Gimli,30759 -Gandalf,Sam,30759 -Gandalf,Legolas,30759 -Frodo,Gimli,30759 -Frodo,Sam,30759 -Frodo,Legolas,30759 -Gimli,Sam,30759 -Gimli,Legolas,30759 -Sam,Legolas,30759 -Sam,Frodo,30760 -Pippin,Frodo,30763 -Pippin,Merry,30763 -Frodo,Merry,30763 -Gandalf,Bilbo,30772 -Gimli,Pippin,30775 -Gimli,Frodo,30775 -Gimli,Sam,30775 -Pippin,Frodo,30775 -Pippin,Sam,30775 -Frodo,Sam,30775 -Sam,Frodo,30798 -Éomer,Théoden,30860 -Éomer,Faramir,30860 -Théoden,Faramir,30860 -Éowyn,Merry,30888 -Éowyn,Faramir,30888 -Merry,Faramir,30888 -Merry,Faramir,30889 -Éowyn,Faramir,30896 -Éowyn,Amroth,30903 -Éowyn,Finduilas,30903 -Amroth,Finduilas,30903 -Éowyn,Faramir,30905 -Merry,Faramir,30945 -Éowyn,Faramir,30949 -Elendil,Aragorn,30950 -Éowyn,Faramir,30960 -Éowyn,Faramir,30981 -Éowyn,Húrin,30991 -Éowyn,Faramir,30991 -Húrin,Faramir,30991 -Éomer,Gandalf,30995 -Éomer,Imrahil,30995 -Gandalf,Imrahil,30995 -Húrin,Faramir,31008 -Faramir,Aragorn,31009 -Isildur,Valandil,31013 -Isildur,Elendil,31013 -Isildur,Elessar,31013 -Isildur,Aragorn,31013 -Valandil,Elendil,31013 -Valandil,Elessar,31013 -Valandil,Aragorn,31013 -Elendil,Elessar,31013 -Elendil,Aragorn,31013 -Elessar,Aragorn,31013 -Eärnur,Faramir,31017 -Faramir,Aragorn,31022 -Frodo,Gandalf,31023 -Frodo,Faramir,31023 -Frodo,Aragorn,31023 -Gandalf,Faramir,31023 -Gandalf,Aragorn,31023 -Faramir,Aragorn,31023 -Húrin,Elessar,31025 -Húrin,Faramir,31025 -Elessar,Faramir,31025 -Beregond,Faramir,31038 -Faramir,Aragorn,31039 -Éomer,Aragorn,31040 -Éowyn,Elrond,31045 -Éowyn,Faramir,31045 -Elrond,Faramir,31045 -Gimli,Legolas,31048 -Gimli,Aragorn,31048 -Legolas,Aragorn,31048 -Frodo,Gandalf,31052 -Frodo,Aragorn,31052 -Gandalf,Aragorn,31052 -Gandalf,Bilbo,31053 -Pippin,Frodo,31054 -Pippin,Gandalf,31054 -Frodo,Gandalf,31054 -Gandalf,Aragorn,31057 -Gandalf,Aragorn,31058 -Gandalf,Aragorn,31067 -Gandalf,Nimloth,31086 -Nimloth,Aragorn,31094 -Glorfindel,Arwen,31102 -Glorfindel,Erestor,31102 -Glorfindel,Elrond,31102 -Glorfindel,Galadriel,31102 
-Glorfindel,Celeborn,31102 -Arwen,Erestor,31102 -Arwen,Elrond,31102 -Arwen,Galadriel,31102 -Arwen,Celeborn,31102 -Erestor,Elrond,31102 -Erestor,Galadriel,31102 -Erestor,Celeborn,31102 -Elrond,Galadriel,31102 -Elrond,Celeborn,31102 -Galadriel,Celeborn,31102 -Frodo,Gandalf,31103 -Arwen,Elessar,31106 -Arwen,Aragorn,31106 -Elessar,Aragorn,31106 -Arwen,Frodo,31108 -Frodo,Aragorn,31109 -Arwen,Bilbo,31113 -Arwen,Elrond,31113 -Bilbo,Elrond,31113 -Éomer,Théoden,31119 -Éomer,Gimli,31129 -Éomer,Glóin,31129 -Gimli,Glóin,31129 -Éomer,Gimli,31131 -Théoden,Merry,31141 -Pippin,Gandalf,31142 -Pippin,Shadowfax,31142 -Pippin,Frodo,31142 -Pippin,Gimli,31142 -Pippin,Aragorn,31142 -Pippin,Legolas,31142 -Pippin,Samwise,31142 -Gandalf,Shadowfax,31142 -Gandalf,Frodo,31142 -Gandalf,Gimli,31142 -Gandalf,Aragorn,31142 -Gandalf,Legolas,31142 -Gandalf,Samwise,31142 -Shadowfax,Frodo,31142 -Shadowfax,Gimli,31142 -Shadowfax,Aragorn,31142 -Shadowfax,Legolas,31142 -Shadowfax,Samwise,31142 -Frodo,Gimli,31142 -Frodo,Aragorn,31142 -Frodo,Legolas,31142 -Frodo,Samwise,31142 -Gimli,Aragorn,31142 -Gimli,Legolas,31142 -Gimli,Samwise,31142 -Aragorn,Legolas,31142 -Aragorn,Samwise,31142 -Legolas,Samwise,31142 -Elrond,Arwen,31143 -Elrond,Galadriel,31143 -Elrond,Amroth,31143 -Elrond,Celeborn,31143 -Arwen,Galadriel,31143 -Arwen,Amroth,31143 -Arwen,Celeborn,31143 -Galadriel,Amroth,31143 -Galadriel,Celeborn,31143 -Amroth,Celeborn,31143 -Théoden,Thengel,31144 -Elessar,Aragorn,31146 -Théoden,Thengel,31152 -Helm,Théoden,31153 -Théoden,Merry,31156 -Éowyn,Éomer,31161 -Fréa,Fengel,31162 -Fréa,Helm,31162 -Fréa,Théoden,31162 -Fréa,Baldor,31162 -Fréa,Déor,31162 -Fréa,Brego,31162 -Fréa,Goldwine,31162 -Fréa,Folcwine,31162 -Fréa,Aldor,31162 -Fréa,Walda,31162 -Fréa,Folca,31162 -Fréa,Thengel,31162 -Fréa,Gram,31162 -Fengel,Helm,31162 -Fengel,Théoden,31162 -Fengel,Baldor,31162 -Fengel,Déor,31162 -Fengel,Brego,31162 -Fengel,Goldwine,31162 -Fengel,Folcwine,31162 -Fengel,Aldor,31162 -Fengel,Walda,31162 -Fengel,Folca,31162 
-Fengel,Thengel,31162 -Fengel,Gram,31162 -Helm,Théoden,31162 -Helm,Baldor,31162 -Helm,Déor,31162 -Helm,Brego,31162 -Helm,Goldwine,31162 -Helm,Folcwine,31162 -Helm,Aldor,31162 -Helm,Walda,31162 -Helm,Folca,31162 -Helm,Thengel,31162 -Helm,Gram,31162 -Théoden,Baldor,31162 -Théoden,Déor,31162 -Théoden,Brego,31162 -Théoden,Goldwine,31162 -Théoden,Folcwine,31162 -Théoden,Aldor,31162 -Théoden,Walda,31162 -Théoden,Folca,31162 -Théoden,Thengel,31162 -Théoden,Gram,31162 -Baldor,Déor,31162 -Baldor,Brego,31162 -Baldor,Goldwine,31162 -Baldor,Folcwine,31162 -Baldor,Aldor,31162 -Baldor,Walda,31162 -Baldor,Folca,31162 -Baldor,Thengel,31162 -Baldor,Gram,31162 -Déor,Brego,31162 -Déor,Goldwine,31162 -Déor,Folcwine,31162 -Déor,Aldor,31162 -Déor,Walda,31162 -Déor,Folca,31162 -Déor,Thengel,31162 -Déor,Gram,31162 -Brego,Goldwine,31162 -Brego,Folcwine,31162 -Brego,Aldor,31162 -Brego,Walda,31162 -Brego,Folca,31162 -Brego,Thengel,31162 -Brego,Gram,31162 -Goldwine,Folcwine,31162 -Goldwine,Aldor,31162 -Goldwine,Walda,31162 -Goldwine,Folca,31162 -Goldwine,Thengel,31162 -Goldwine,Gram,31162 -Folcwine,Aldor,31162 -Folcwine,Walda,31162 -Folcwine,Folca,31162 -Folcwine,Thengel,31162 -Folcwine,Gram,31162 -Aldor,Walda,31162 -Aldor,Folca,31162 -Aldor,Thengel,31162 -Aldor,Gram,31162 -Walda,Folca,31162 -Walda,Thengel,31162 -Walda,Gram,31162 -Folca,Thengel,31162 -Folca,Gram,31162 -Thengel,Gram,31162 -Éomer,Théoden,31163 -Éowyn,Éomer,31164 -Éowyn,Théoden,31164 -Éomer,Théoden,31164 -Éowyn,Faramir,31166 -Éowyn,Faramir,31167 -Éowyn,Éomer,31168 -Éowyn,Aragorn,31168 -Éomer,Aragorn,31168 -Arwen,Faramir,31170 -Arwen,Imrahil,31170 -Arwen,Aragorn,31170 -Faramir,Imrahil,31170 -Faramir,Aragorn,31170 -Imrahil,Aragorn,31170 -Éowyn,Meriadoc,31172 -Éowyn,Éomer,31172 -Éowyn,Merry,31172 -Meriadoc,Éomer,31172 -Meriadoc,Merry,31172 -Éomer,Merry,31172 -Éowyn,Merry,31174 -Éowyn,Merry,31178 -Gimli,Legolas,31180 -Treebeard,Gandalf,31188 -Treebeard,Gandalf,31192 -Treebeard,Aragorn,31197 -Treebeard,Gandalf,31202 
-Treebeard,Merry,31202 -Gandalf,Merry,31202 -Galadriel,Celeborn,31245 -Gimli,Legolas,31247 -Treebeard,Galadriel,31255 -Treebeard,Celeborn,31255 -Galadriel,Celeborn,31255 -Galadriel,Celeborn,31259 -Pippin,Merry,31261 -Pippin,Aragorn,31268 -Pippin,Aragorn,31270 -Celeborn,Galadriel,31274 -Celeborn,Aragorn,31274 -Galadriel,Aragorn,31274 -Gandalf,Saruman,31282 -Saruman,Galadriel,31295 -Saruman,Gandalf,31313 -Saruman,Wormtongue,31313 -Gandalf,Wormtongue,31313 -Saruman,Merry,31330 -Saruman,Wormtongue,31330 -Merry,Wormtongue,31330 -Galadriel,Celeborn,31349 -Gandalf,Elrond,31350 -Frodo,Galadriel,31356 -Sam,Elrond,31357 -Sam,Frodo,31389 -Sam,Elrond,31389 -Frodo,Elrond,31389 -Pippin,Merry,31401 -Pippin,Bilbo,31402 -Frodo,Bilbo,31406 -Sam,Aragorn,31411 -Sam,Frodo,31423 -Gandalf,Bilbo,31436 -Gandalf,Elrond,31436 -Bilbo,Elrond,31436 -Frodo,Elrond,31437 -Frodo,Gandalf,31445 -Pippin,Sam,31474 -Pippin,Sam,31475 -Gandalf,Butterbur,31524 -Gandalf,Barliman,31581 -Butterbur,Merry,31614 -Sam,Bill,31626 -Sam,Bill,31629 -Sam,Bill,31651 -Frodo,Barliman,31652 -Pippin,Gandalf,31656 -Pippin,Lotho,31656 -Gandalf,Lotho,31656 -Merry,Gandalf,31658 -Gandalf,Shadowfax,31684 -Frodo,Lotho,31707 -Pippin,Merry,31716 -Pippin,Merry,31717 -Merry,Bill,31723 -Sam,Bill,31731 -Robin,Sam,31816 -Sam,Frodo,31834 -Frodo,Merry,31844 -Pippin,Sam,31845 -Pippin,Merry,31845 -Sam,Merry,31845 -Sam,Frodo,31863 -Sam,Merry,31875 -Sam,Bill,31880 -Pippin,Frodo,31930 -Pippin,Merry,31930 -Pippin,Sam,31930 -Frodo,Merry,31930 -Frodo,Sam,31930 -Merry,Sam,31930 -Frodo,Lotho,31940 -Pippin,Frodo,31943 -Frodo,Lotho,31950 -Pippin,Lotho,31957 -Sam,Frodo,32044 -Tom,Frodo,32058 -Tom,Sam,32058 -Frodo,Sam,32058 -Frodo,Merry,32075 -Peregrin,Lotho,32080 -Frodo,Merry,32095 -Sam,Frodo,32234 -Sam,Frodo,32238 -Sam,Frodo,32239 -Pippin,Merry,32283 -Meriadoc,Peregrin,32293 -Pippin,Sam,32295 -Pippin,Merry,32295 -Sam,Merry,32295 -Frodo,Merry,32296 -Pippin,Frodo,32301 -Pippin,Merry,32301 -Pippin,Sam,32301 -Frodo,Merry,32301 -Frodo,Sam,32301 
-Merry,Sam,32301 -Sam,Frodo,32331 -Merry,Lotho,32348 -Merry,Saruman,32355 -Gandalf,Saruman,32372 -Saruman,Wormtongue,32396 -Saruman,Wormtongue,32399 -Frodo,Saruman,32400 -Sam,Frodo,32404 -Frodo,Saruman,32409 -Frodo,Wormtongue,32422 -Saruman,Wormtongue,32432 -Saruman,Wormtongue,32443 -Frodo,Wormtongue,32444 -Pippin,Fredegar,32459 -Frodo,Lotho,32469 -Pippin,Merry,32473 -Sam,Frodo,32499 -Sam,Frodo,32520 -Sam,Frodo,32523 -Pippin,Merry,32524 -Sam,Frodo,32525 -Sam,Frodo,32527 -Sam,Frodo,32538 -Pippin,Merry,32541 -Sam,Frodo,32544 -Sam,Frodo,32547 -Meriadoc,Peregrin,32548 -Meriadoc,Sam,32548 -Peregrin,Sam,32548 -Sam,Frodo,32552 -Sam,Frodo,32557 -Sam,Frodo,32563 -Sam,Frodo,32565 -Sam,Frodo,32568 -Sam,Frodo,32569 -Sam,Bilbo,32570 -Sam,Frodo,32573 -Sam,Frodo,32579 -Sam,Bilbo,32579 -Frodo,Bilbo,32579 -Sam,Frodo,32584 -Frodo,Bilbo,32586 -Frodo,Bilbo,32595 -Sam,Frodo,32597 -Sam,Frodo,32598 -Sam,Frodo,32599 -Sam,Bill,32599 -Frodo,Bill,32599 -Sam,Frodo,32603 -Sam,Frodo,32613 -Elrond,Sam,32614 -Elrond,Galadriel,32614 -Sam,Galadriel,32614 -Elrond,Galadriel,32619 -Sam,Frodo,32631 -Pippin,Merry,32645 -Pippin,Goldilocks,32645 -Merry,Goldilocks,32645 -Galadriel,Elrond,32650 -Sam,Frodo,32651 -Sam,Bilbo,32651 -Frodo,Bilbo,32651 -Frodo,Gandalf,32656 -Pippin,Merry,32659 -Sam,Gandalf,32663 -Pippin,Frodo,32666 -Pippin,Merry,32666 -Pippin,Galadriel,32666 -Pippin,Sam,32666 -Frodo,Merry,32666 -Frodo,Galadriel,32666 -Frodo,Sam,32666 -Merry,Galadriel,32666 -Merry,Sam,32666 -Galadriel,Sam,32666 -Pippin,Merry,32671 -Pippin,Merry,32674 diff --git a/docs/source/getting_started/intro_tutorials/lotr.ipynb b/docs/source/getting_started/intro_tutorials/lotr.ipynb deleted file mode 100644 index c1c6dd0bac..0000000000 --- a/docs/source/getting_started/intro_tutorials/lotr.ipynb +++ /dev/null @@ -1,384 +0,0 @@ -{ - "cells": [ - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "# Example: Lord of the rings \n", - "\n", - "Now that we know Raphtory is installed and running, let's look at the 
different ways to get some real data into a graph. \n", - "\n", - "For this first set of tutorials we are going to be building graphs from a Lord of the Rings dataset, looking at when characters interact throughout the trilogy 🧝🏻‍♀️🧙🏻‍♂️💍.\n", - " \n", - "

\n", - " \"Intro\n", - "

\n", - "\n", - "As with the quick start install guide, this and all following python pages are built as iPython notebooks. If you want to follow along on your own machine, click the `open on github` link in the top right of this page.\n", - "\n", - "## Let's have a look at the example data\n", - "\n", - "The data we are going to use is two `csv` files which will be pulled from our Github data repository. These are the structure of the graph (`lotr.csv`) and some metadata about the characters (`lotr_properties.csv`)\n", - "\n", - "For the structure file each line contains two characters that appeared in the same sentence, along with the sentence number, which we will use as a `timestamp`. The first line of the file is `Gandalf,Elrond,33` which tells us that Gandalf and Elrond appears together in sentence 33.\n", - "\n", - "For the properties file each line gives a characters name, their race and gender. For example `Gimli,dwarf,male`.\n", - "\n", - "\n", - "### Downloading the csv from Github 💾\n", - "\n", - "The following `curl` command will download the csv files and save them in the `tmp` directory on your computer. 
This will be deleted when you restart your computer, but it's only a couple of KB in any case.\n", - "\n" - ] - }, - { - "cell_type": "code", - "execution_count": 1, - "metadata": { - "tags": [] - }, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "****Downloading Data****\n", - " % Total % Received % Xferd Average Speed Time Time Time Current\n", - " Dload Upload Total Spent Left Speed\n", - "100 52206 100 52206 0 0 154k 0 --:--:-- --:--:-- --:--:-- 160k\n", - " % Total % Received % Xferd Average Speed Time Time Time Current\n", - " Dload Upload Total Spent Left Speed\n", - "100 686 100 686 0 0 2906 0 --:--:-- --:--:-- --:--:-- 2995\n", - " % Total % Received % Xferd Average Speed Time Time Time Current\n", - " Dload Upload Total Spent Left Speed\n", - "100 69632 100 69632 0 0 287k 0 --:--:-- --:--:-- --:--:-- 296k\n", - "****LOTR GRAPH STRUCTURE****\n", - "Gandalf,Elrond,33\n", - "Frodo,Bilbo,114\n", - "Blanco,Marcho,146\n", - "****LOTR GRAPH PROPERTIES****\n", - "Aragorn,men,male\n", - "Gandalf,ainur,male\n", - "Goldberry,ainur,female\n" - ] - } - ], - "source": [ - "print(\"****Downloading Data****\")\n", - "!curl -o /tmp/lotr.csv https://raw.githubusercontent.com/Raphtory/Data/main/lotr.csv\n", - "!curl -o /tmp/lotr_properties.csv https://raw.githubusercontent.com/Raphtory/Data/main/lotr_properties.csv\n", - "!curl -o /tmp/lotr.db https://raw.githubusercontent.com/Raphtory/Data/main/lotr.db\n", - "print(\"****LOTR GRAPH STRUCTURE****\")\n", - "!head -n 3 /tmp/lotr.csv\n", - "print(\"****LOTR GRAPH PROPERTIES****\")\n", - "!head -n 3 /tmp/lotr_properties.csv" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "## Setting up our imports and Raphtory\n", - "Now that we have our data we can sort out our imports and create the Raphtory `Graph` which we will use to build our graphs.\n", - "\n", - "The imports are for parsing CSV files, accessing pandas dataframes, and bringing in all the Raphtory classes we will 
use in the tutorial.\n", - "\n", - "The filenames are pointing at the data we just downloaded. If you change the download location above, make sure to change them here as well." - ] - }, - { - "cell_type": "code", - "execution_count": 2, - "metadata": { - "tags": [] - }, - "outputs": [], - "source": [ - "import csv\n", - "import pandas as pd\n", - "from raphtory import Graph\n", - "\n", - "structure_file = \"/tmp/lotr.csv\"\n", - "properties_file = \"/tmp/lotr_properties.csv\"\n", - "graph = Graph(1)\n" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "## Adding data directly into the Graph\n", - "\n", - "The simplest way to add data into a graph is to directly call the `add_vertex` and `add_edge` functions, which we saw in the quick start guide. These have required arguments defining the time the addition occurred and an identifier for the entity being updated. These functions, however, have several optional arguments allowing us to add `properties` and within this, `types`, on top of the base structure. \n", - "\n", - "\n", - "| Function | Required Arguments | Optional Arguments |\n", - "|--------------|-------------------------------|----------------------------------------------|\n", - "| `add_vertex` | `timestamp`,`vertex_id` | `properties` |\n", - "| `add_edge` | `timestamp`,`src_id`,`dst_id` | `properties` |\n", - "\n", - "\n", - "Lets take a look at this with our example data. In the below code we are opening The Lord of The Rings structural data via the csv reader and looping through each line. \n", - "\n", - "To insert the data we:\n", - "\n", - "* Extract the two characters names, referring to them as the `source_node` and `destination_node`.\n", - "* Extract the sentence number, referring to is as `timestamp`. 
This is then cast to an `int` as `epoch` timestamps in Raphtory must be a number.\n", - "* Call `add_vertex` for both nodes, setting their type to `Character`.\n", - "* Create an edge between them via `add_edge` and label this a `Co-occurence`." - ] - }, - { - "cell_type": "code", - "execution_count": 3, - "metadata": { - "tags": [] - }, - "outputs": [], - "source": [ - "with open(structure_file, 'r') as csvfile:\n", - " datareader = csv.reader(csvfile)\n", - " for row in datareader:\n", - "\n", - " source_node = row[0]\n", - " destination_node = row[1]\n", - " timestamp = int(row[2])\n", - " \n", - " graph.add_vertex(timestamp, source_node, {\"vertex_type\": \"Character\"})\n", - " graph.add_vertex(timestamp, destination_node, {\"vertex_type\": \"Character\"}) \n", - " graph.add_edge(timestamp, source_node, destination_node, {\"edge_type\": \"Character_Co-occurence\"})" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "## Let's see if the data has ingested\n", - "\n", - "To do this, much like the quick start, we can run a query on our graph. As Raphtory allows us to explore the network's history, lets add a bit of this in as well. \n", - "\n", - "Below we check the data contained in the graph by running the `earliest_time()`, `latest_time()`, and `len` the vertices and edges. 
" - ] - }, - { - "cell_type": "code", - "execution_count": 17, - "metadata": { - "tags": [] - }, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Earliest time: 33\n", - "Latest time: 32674\n", - "Number of vertices: 139\n", - "Number of edges: 701\n" - ] - } - ], - "source": [ - "print(\"Earliest time: %i\" % graph.earliest_time())\n", - "print(\"Latest time: %i\" % graph.latest_time())\n", - "\n", - "print(\"Number of vertices: %i\" % len(graph.vertices()))\n", - "print(\"Number of edges: %i\" % len(graph.edges()))" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "We can also access a specific vertex, such as `Gandalf`, and see his degree at different points in time using the `at()` function. \n", - "\n", - "In the first call, we get the entire graph at time 1000, and then check the degree of gandalf. \n", - "\n", - "In the second call, we get the vertex gandalf, get their instance at time 10,000 and the degree. " - ] - }, - { - "cell_type": "code", - "execution_count": 18, - "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Gandalf's degree at 1000: 4\n", - "Gandalf's degree at 10,000: 26\n" - ] - } - ], - "source": [ - "print(\"Gandalf's degree at 1000: %i\" % graph.at(1000).vertex(\"Gandalf\").degree())\n", - "\n", - "print(\"Gandalf's degree at 10,000: %i\" % graph.vertex(\"Gandalf\").at(10000).degree())" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "## Updating graphs, merging datasets and adding properties\n", - "\n", - "One cool thing about Raphtory is that we can freely insert new information at any point in time and it will be automatically inserted in chronological order. This makes it really easy to merge datasets or ingest out of order data. \n", - "\n", - "A property on a vertex or edge can be either static or non-static. 
\n", - "\n", - "* Static properties, do not change and are fixed throughout the life of the graph, e.g. the `name` property. \n", - "* Non-static properties can change over time, e.g. `balance` of a bank account. \n", - "\n", - "All property objects require the user to specify a name and value.\n", - "\n", - "To explore this and to add some properties to our graph, lets load our second dataset!\n", - "\n", - "Below we are opening our property file the same way as the structure file. This data does not have a time element, so we can add the properties as static properties. This means they will be available at evert point in time and the values will stay the same. \n", - "\n", - "Now it's worthwhile noting that we aren't calling a function called `update_vertex` or something similar, even though we know the vertex exists. This is because everything is considered an addition into the history and Raphtory sorts all the ordering internally!" - ] - }, - { - "cell_type": "code", - "execution_count": 23, - "metadata": { - "tags": [] - }, - "outputs": [], - "source": [ - "with open(properties_file, 'r') as csvfile:\n", - " datareader = csv.reader(csvfile)\n", - " for row in datareader:\n", - " graph.add_vertex_properties(row[0], {\"race\": row[1],\"gender\": row[2]})\n" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "## Using our properties as part of a query\n", - "To quickly see if our new properties are included in the graph we can write a new query! Lets have a look at the dwarves who have the most interactions.\n", - "\n", - "To start we can create a function which for each vertex and check the size of exploded edges. This takes each edge and measures how many times it was updated. E.g. if Gimli and Balin met four times, in the graph they have one edge between them. But if we explode this edge, we can see each time they met. 
\n", - "\n", - "We can iterate through each vertex and filter by the **race** property and remove anyone who isn't a **dwarf**.\n", - "\n", - "Finally, we can sort the data into a dataframe to see **Gimli** has by far the most!" - ] - }, - { - "cell_type": "code", - "execution_count": 51, - "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
timestampnameinteractions
331247Gimli185
131129Glóin31
210938Balin14
09605Thorin5
\n", - "
" - ], - "text/plain": [ - " timestamp name interactions\n", - "3 31247 Gimli 185\n", - "1 31129 Glóin 31\n", - "2 10938 Balin 14\n", - "0 9605 Thorin 5" - ] - }, - "execution_count": 51, - "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "result = []\n", - "# This returns an iterator, so we should store the value to avoid a deadlock\n", - "vertices = list(graph.vertices())\n", - "\n", - "for vertex in vertices:\n", - " if vertex.property(\"race\") == \"dwarf\":\n", - " interactions = sum([len(e.explode()) for e in vertex.edges()])\n", - " latest = vertex.latest_time()\n", - " result.append({\"timestamp\": latest, \"name\": vertex.name(), \"interactions\": interactions })\n", - "\n", - "pd.DataFrame(result).sort_values(by=\"interactions\",ascending=False) " - ] - } - ], - "metadata": { - "kernelspec": { - "display_name": "Python 3 (ipykernel)", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.10.9" - }, - "vscode": { - "interpreter": { - "hash": "a9a34730827747ae273d5a5e0748f342e2039a3997e32d9a086d01739bd0f055" - } - } - }, - "nbformat": 4, - "nbformat_minor": 4 -} diff --git a/docs/source/getting_started/overview.rst b/docs/source/getting_started/overview.rst deleted file mode 100644 index e3b3757952..0000000000 --- a/docs/source/getting_started/overview.rst +++ /dev/null @@ -1,48 +0,0 @@ -.. _overview: - -{{ header }} - -**************** -Package overview -**************** - -Raphtory is an in-memory graph tool written in Rust with friendly Python APIs on top. -It is blazingly fast, scales to hundreds of millions of edges -on your laptop, and can be dropped into your existing pipelines. 
- -It supports time traveling, multilayer modelling, and advanced analytics beyond simple querying like -community evolution, dynamic scoring, and mining temporal motifs. - -Successful contributions will be reward with swizzling swag! - -Getting support ---------------- - -The first stop for raphtory issues and ideas is the `GitHub Issue Tracker -`__. If you have a general question, -raphtory community experts can answer through `Slack -`__. - -Bounty Board ------------- - -We offer bounties for the following contributions to the project, please see below to -win some cool swag! `Our Github bounty board `__ - -Community ---------- - -Raphtory is actively supported today by a community of software engineering experts and world-class researchers around -the world. Thanks to `pometry `__ and `all of our contributors `__. - -If you're interested in contributing, please visit the :ref:`contributing guide `. - -Development team ------------------ - -The list of the Core Team members and more detailed information can be found on the `pometry website `__. - -License -------- - -.. 
literalinclude:: ../../../LICENSE diff --git a/docs/source/images/index_api.svg b/docs/source/images/index_api.svg deleted file mode 100644 index c9eee89983..0000000000 --- a/docs/source/images/index_api.svg +++ /dev/null @@ -1,24 +0,0 @@ - - - - - - - image/svg+xml - - - - - - - - - - - - - - - - - \ No newline at end of file diff --git a/docs/source/images/index_contribute.svg b/docs/source/images/index_contribute.svg deleted file mode 100644 index 91b4140ec5..0000000000 --- a/docs/source/images/index_contribute.svg +++ /dev/null @@ -1,19 +0,0 @@ - - - - - - - image/svg+xml - - - - - - - - - - - - \ No newline at end of file diff --git a/docs/source/images/index_getting_started.svg b/docs/source/images/index_getting_started.svg deleted file mode 100644 index 3756254230..0000000000 --- a/docs/source/images/index_getting_started.svg +++ /dev/null @@ -1,16 +0,0 @@ - - - - - - - image/svg+xml - - - - - - - - - \ No newline at end of file diff --git a/docs/source/images/index_user_guide.svg b/docs/source/images/index_user_guide.svg deleted file mode 100644 index 4eee142cdf..0000000000 --- a/docs/source/images/index_user_guide.svg +++ /dev/null @@ -1,16 +0,0 @@ - - - - - - - image/svg+xml - - - - - - - - - \ No newline at end of file diff --git a/docs/source/index.rst b/docs/source/index.rst index 76856225c0..1f33acfc47 100644 --- a/docs/source/index.rst +++ b/docs/source/index.rst @@ -1,112 +1,91 @@ -:notoc: +.. _api_menu: -.. Raphtory documentation master file, created by +{{ header }} -.. module:: Raphtory +**************** +Raphtory +**************** -**************************************** -Raphtory documentation -**************************************** +.. automodule:: raphtory + :autosummary: + :members: + :undoc-members: + :show-inheritance: + :private-members: + :inherited-members: -**Date**: |today| **Version**: |version| +Algorithms +------------------- -**Useful links**: -`Source Repository `__ | -`Issues & Ideas `__ | -`Slack Support `__ +.. 
automodule:: raphtory.algorithms + :autosummary: + :members: + :undoc-members: + :show-inheritance: + :private-members: + :inherited-members: -:mod:`Raphtory` is an in-memory graph tool written in Rust with friendly Python APIs on top. -It is blazingly fast, scales to hundreds of millions of edges on your laptop, and can be -dropped into your existing pipelines with a simple `pip install raphtory`. +Visualisation +------------------- -.. grid:: 1 2 2 2 - :gutter: 4 - :padding: 2 2 0 0 - :class-container: sd-text-center +.. automodule:: raphtory.export + :autosummary: + :members: + :undoc-members: + :show-inheritance: + :private-members: + :inherited-members: - .. grid-item-card:: Getting started - :img-top: images/index_getting_started.svg - :class-card: intro-card - :shadow: md - New to *Raphtory*? Check out the getting started guides. They contain an - introduction to *Raphtory'* main concepts and links to additional tutorials. +Null Models +-------------------------- - +++ +.. automodule:: raphtory.nullmodels + :autosummary: + :members: + :undoc-members: + :show-inheritance: + :private-members: + :inherited-members: - .. button-ref:: getting_started - :ref-type: ref - :click-parent: - :color: secondary - :expand: +Graph Generation +-------------------------- + +.. automodule:: raphtory.graph_gen + :autosummary: + :members: + :undoc-members: + :show-inheritance: + :private-members: + :inherited-members: + +GraphQL Server +-------------------------- + +.. automodule:: raphtory.graphql + :autosummary: + :members: + :undoc-members: + :show-inheritance: + :inherited-members: - To the getting started guides - .. grid-item-card:: User guide - :img-top: images/index_user_guide.svg - :class-card: intro-card - :shadow: md - The user guide provides in-depth information on the - key concepts of Raphtory with useful background information and explanation. - +++ - .. 
button-ref:: user_guide - :ref-type: ref - :click-parent: - :color: secondary - :expand: - To the user guide - .. grid-item-card:: API reference - :img-top: images/index_api.svg - :class-card: intro-card - :shadow: md - The reference guide contains a detailed description of - the Raphtory API. The reference describes how the methods work and which parameters can - be used. It assumes that you have an understanding of the key concepts. - +++ - .. button-ref:: api - :ref-type: ref - :click-parent: - :color: secondary - :expand: - To the reference guide - .. grid-item-card:: Developer guide - :img-top: images/index_contribute.svg - :class-card: intro-card - :shadow: md - Saw a typo in the documentation? Want to improve - existing functionalities? The contributing guidelines will guide - you through the process of improving Raphtory. - +++ - .. button-ref:: development - :ref-type: ref - :click-parent: - :color: secondary - :expand: - To the development guide -.. toctree:: - :maxdepth: 3 - :hidden: - :titlesonly: - getting_started/index - development/index - api/index - userguide/index diff --git a/docs/source/userguide/graphql.rst b/docs/source/userguide/graphql.rst deleted file mode 100644 index 7f37f323d9..0000000000 --- a/docs/source/userguide/graphql.rst +++ /dev/null @@ -1,5 +0,0 @@ -{{ header }} - -******************** -GraphQL -******************** diff --git a/docs/source/userguide/index.rst b/docs/source/userguide/index.rst deleted file mode 100644 index c2ff591b2c..0000000000 --- a/docs/source/userguide/index.rst +++ /dev/null @@ -1,18 +0,0 @@ -{{ header }} - -.. _user_guide: - -========== -User Guide -========== - -This guide explains each component of raphtory. - -.. 
toctree:: - :maxdepth: 2 - - raphtory - rust - js - graphql - io \ No newline at end of file diff --git a/docs/source/userguide/io.rst b/docs/source/userguide/io.rst deleted file mode 100644 index 873ab6a0f4..0000000000 --- a/docs/source/userguide/io.rst +++ /dev/null @@ -1,5 +0,0 @@ -{{ header }} - -******************** -IO -******************** \ No newline at end of file diff --git a/docs/source/userguide/js.rst b/docs/source/userguide/js.rst deleted file mode 100644 index 655c049d97..0000000000 --- a/docs/source/userguide/js.rst +++ /dev/null @@ -1,5 +0,0 @@ -{{ header }} - -******************** -JS -******************** \ No newline at end of file diff --git a/docs/source/userguide/raphtory.rst b/docs/source/userguide/raphtory.rst deleted file mode 100644 index da063304f4..0000000000 --- a/docs/source/userguide/raphtory.rst +++ /dev/null @@ -1,5 +0,0 @@ -{{ header }} - -******************** -Raphtory -******************** \ No newline at end of file diff --git a/docs/source/userguide/rust.rst b/docs/source/userguide/rust.rst deleted file mode 100644 index 5f2b2dbc24..0000000000 --- a/docs/source/userguide/rust.rst +++ /dev/null @@ -1,5 +0,0 @@ -{{ header }} - -******************** -Rust -******************** \ No newline at end of file diff --git a/examples/custom-algorithm/src/main.rs b/examples/custom-algorithm/src/main.rs index 2d4590edf7..97c250f6f8 100644 --- a/examples/custom-algorithm/src/main.rs +++ b/examples/custom-algorithm/src/main.rs @@ -2,7 +2,7 @@ use async_graphql::dynamic::{FieldValue, ResolverContext, TypeRef}; use async_graphql::FieldResult; use dynamic_graphql::internal::TypeName; use dynamic_graphql::SimpleObject; -use raphtory::db::view_api::GraphViewOps; +use raphtory::db::view::GraphViewOps; use raphtory_graphql::{Algorithm, RaphtoryServer}; #[derive(SimpleObject)] @@ -29,7 +29,7 @@ impl Algorithm for DummyAlgorithm { ) -> FieldResult>> { let mandatory_arg = ctx.args.try_get("mandatoryArg")?.u64()?; let optional_arg = 
ctx.args.get("optionalArg").map(|v| v.u64()).transpose()?; - let num_vertices = graph.num_vertices(); + let num_vertices = graph.count_vertices(); let output = Self { number_of_nodes: num_vertices, message: format!("mandatory arg: '{mandatory_arg}', optional arg: '{optional_arg:?}'"), diff --git a/examples/custom_python_extension/Cargo.toml b/examples/custom_python_extension/Cargo.toml new file mode 100644 index 0000000000..e78c07ab21 --- /dev/null +++ b/examples/custom_python_extension/Cargo.toml @@ -0,0 +1,17 @@ +[package] +name = "custom_python_extension" +version = "0.1.1" +edition = "2021" + +# See more keys and their definitions at https://doc.rust-lang.org/cargo/reference/manifest.html + +[dependencies] +raphtory = {path = "../../raphtory", features = ["python"]} +pyo3 = "0.19.2" + +[lib] +crate-type = ["cdylib"] + + +[build-dependencies] +pyo3-build-config = "0.19.2" diff --git a/examples/custom_python_extension/build.rs b/examples/custom_python_extension/build.rs new file mode 100644 index 0000000000..dace4a9ba9 --- /dev/null +++ b/examples/custom_python_extension/build.rs @@ -0,0 +1,3 @@ +fn main() { + pyo3_build_config::add_extension_module_link_args(); +} diff --git a/examples/custom_python_extension/pyproject.toml b/examples/custom_python_extension/pyproject.toml new file mode 100644 index 0000000000..ccc82af269 --- /dev/null +++ b/examples/custom_python_extension/pyproject.toml @@ -0,0 +1,31 @@ +[build-system] +requires = ["maturin>=0.13,<0.14"] +build-backend = "maturin" + +[project] +name = "custom_python_extension" +requires-python = ">=3.8" +classifiers = [ + "Programming Language :: Rust", + "Programming Language :: Python :: Implementation :: CPython", + "Programming Language :: Python :: Implementation :: PyPy", +] +dependencies = [ + "raphtory" +] + + +[project.urls] +homepage = "https://github.com/pometry/raphtory" +documentation = "https://docs.raphtory.com/" +repository = "https://github.com/pometry/raphtory" +twitter = 
"https://twitter.com/raphtory/" +slack = "https://join.slack.com/t/raphtory/shared_invite/zt-xbebws9j-VgPIFRleJFJBwmpf81tvxA" +youtube = "https://www.youtube.com/@pometry8546/videos" + +[project.optional-dependencies] +export = ["pyvis >= 0.3.2", "networkx >= 2.6.3", "matplotlib >= 3.4.3", "seaborn >= 0.11.2"] + +[tool.maturin] +features = ["pyo3/extension-module"] +python-source = "python" diff --git a/examples/custom_python_extension/python/custom_python_extension/__init__.py b/examples/custom_python_extension/python/custom_python_extension/__init__.py new file mode 100644 index 0000000000..def2f54143 --- /dev/null +++ b/examples/custom_python_extension/python/custom_python_extension/__init__.py @@ -0,0 +1 @@ +from .custom_python_extension import * diff --git a/examples/custom_python_extension/src/lib.rs b/examples/custom_python_extension/src/lib.rs new file mode 100644 index 0000000000..32544ca621 --- /dev/null +++ b/examples/custom_python_extension/src/lib.rs @@ -0,0 +1,17 @@ +use pyo3::prelude::*; +use raphtory::{db::api::view::internal::DynamicGraph, prelude::GraphViewOps}; + +fn custom_algorithm(graph: &G) -> usize { + graph.count_vertices() +} + +#[pyfunction(name = "custom_algorithm")] +fn py_custom_algorithm(graph: DynamicGraph) -> usize { + custom_algorithm(&graph) +} + +#[pymodule] +fn custom_python_extension(_py: Python<'_>, m: &PyModule) -> PyResult<()> { + m.add_function(wrap_pyfunction!(py_custom_algorithm, m)?)?; + Ok(()) +} diff --git a/examples/custom_python_extension/test/test_custom_algorithm.py b/examples/custom_python_extension/test/test_custom_algorithm.py new file mode 100644 index 0000000000..3b6f0d846c --- /dev/null +++ b/examples/custom_python_extension/test/test_custom_algorithm.py @@ -0,0 +1,16 @@ +from raphtory import Graph +from custom_python_extension import custom_algorithm +from pytest import raises + + +def test_custom_algorithm(): + g = Graph() + for v in range(10): + g.add_vertex(0, v) + assert custom_algorithm(g) == 10 + + 
+def test_error_for_wrong_type(): + """ calling with the wrong type should still raise a type error (unless it defines a bincode method)""" + with raises(TypeError): + custom_algorithm(1) diff --git a/examples/py/companies_house/companies_house_example.ipynb b/examples/py/companies_house/companies_house_example.ipynb index 314770a02e..742538842f 100644 --- a/examples/py/companies_house/companies_house_example.ipynb +++ b/examples/py/companies_house/companies_house_example.ipynb @@ -25,7 +25,7 @@ "import os, json\n", "import matplotlib.pyplot as plt\n", "from raphtory import Graph\n", - "from raphtory import vis\n", + "from raphtory import export\n", "from datetime import datetime, timedelta" ] }, @@ -617,7 +617,7 @@ "metadata": {}, "outputs": [], "source": [ - "vis.to_pyvis(graph=g2, edge_color='#F6E1D3',shape=\"image\") " + "export.to_pyvis(graph=g2, edge_color='#F6E1D3',shape=\"image\") " ] }, { diff --git a/examples/py/companies_house/companies_house_visualisation.ipynb b/examples/py/companies_house/companies_house_visualisation.ipynb index 13003cde53..dc736f8243 100644 --- a/examples/py/companies_house/companies_house_visualisation.ipynb +++ b/examples/py/companies_house/companies_house_visualisation.ipynb @@ -26,7 +26,7 @@ }, { "cell_type": "code", - "execution_count": 2, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -56,30 +56,11 @@ }, { "cell_type": "code", - "execution_count": 3, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Warning: When cdn_resources is 'local' jupyter notebook has issues displaying graphics on chrome/safari. Use cdn_resources='in_line' or cdn_resources='remote' if you have issues viewing graphics in a notebook.\n", - "nx.html\n" - ] - }, - { - "data": { - "image/png": "", - "text/plain": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ - "from raphtory import vis\n", + "from raphtory import export\n", "from raphtory import Graph\n", "import requests\n", "from contextlib import closing\n", @@ -105,8 +86,8 @@ " g.add_edge(1, src, company, properties={\"title\": title, \"weight\": share})\n", " g.add_edge(1, dst, company, properties={\"title\": title, \"weight\": share})\n", "\n", - "vis.to_networkx(graph=g, k=0.8, node_size=250, node_color=\"red\")\n", - "vis.to_pyvis(graph=g, edge_color='#F6E1D3', edge_weight=\"weight\", shape=\"image\", edge_label=\"title\", node_image=\"image\") " + "export.to_networkx(graph=g)\n", + "export.to_pyvis(graph=g, edge_color='#F6E1D3', edge_weight=\"weight\", shape=\"image\", edge_label=\"title\", node_image=\"image\") " ] } ], @@ -126,7 +107,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.10.9" + "version": "3.11.3" } }, "nbformat": 4, diff --git a/examples/py/math_overflow/degree-trajectories-top5.png b/examples/py/math_overflow/degree-trajectories-top5.png new file mode 100644 index 0000000000..b9e26a1b9d Binary files /dev/null and b/examples/py/math_overflow/degree-trajectories-top5.png differ diff --git a/examples/py/math_overflow/mo_investigate.ipynb b/examples/py/math_overflow/mo_investigate.ipynb new file mode 100644 index 0000000000..141cd7ee9c --- /dev/null +++ b/examples/py/math_overflow/mo_investigate.ipynb @@ -0,0 +1,969 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 1, + "metadata": {}, + "outputs": [], + "source": [ + "import pandas as pd\n", + "import raphtory as rp\n", + "import datetime as dt\n", + "import networkx as nx\n", + "\n", + "import seaborn as sns\n", + "sns.set(font_scale=1.2)\n", + "import matplotlib.pyplot as plt\n", + "\n", + "from plotting_utils import *" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Reading in a 
graph of interactions on Stack Exchange" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
srcdsttime
0141254192988
1341254194656
2121254202612
32511254232804
414161254263166
............
50654521349885801457260401
5065462003111141457261526
5065475142811141457261724
50654856259562591457261848
50654956353563531457262355
\n", + "

506550 rows × 3 columns

\n", + "
" + ], + "text/plain": [ + " src dst time\n", + "0 1 4 1254192988\n", + "1 3 4 1254194656\n", + "2 1 2 1254202612\n", + "3 25 1 1254232804\n", + "4 14 16 1254263166\n", + "... ... ... ...\n", + "506545 21349 88580 1457260401\n", + "506546 20031 1114 1457261526\n", + "506547 51428 1114 1457261724\n", + "506548 56259 56259 1457261848\n", + "506549 56353 56353 1457262355\n", + "\n", + "[506550 rows x 3 columns]" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "file = \"/Users/naomiarnold/CODE/Raphtory/raphtory-research/stackexchange/sx-mathoverflow.txt\"\n", + "sx_df = pd.read_csv(file, names = [\"src\", \"dst\", \"time\"],sep=\" \")\n", + "display(sx_df)" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": {}, + "outputs": [], + "source": [ + "def load_pandas(data:pd.DataFrame):\n", + " g = rp.Graph()\n", + " for (_, src_id, dst_id, time) in data.itertuples():\n", + " g.add_vertex(timestamp = time, id = src_id)\n", + " g.add_vertex(timestamp = time, id = dst_id)\n", + "\n", + " # Remove self loops\n", + " if src_id != dst_id:\n", + " g.add_edge(timestamp = time, src = src_id, dst = dst_id)\n", + " return g" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": {}, + "outputs": [], + "source": [ + "g = load_pandas(sx_df)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "g.add_edge" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": {}, + "outputs": [], + "source": [ + "g = nx.Graph()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "g.add_edge" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Working with the aggregate graph object\n", + "\n", + "Take metrics you might expect in something like networkx applied to the full aggregate graph. 
Get degree of all nodes for example" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "[(11142, 968), (6094, 914), (290, 910), (297, 724), (1946, 721), (2841, 551), (18060, 539), (1459, 536), (1409, 506), (1149, 477)]\n" + ] + } + ], + "source": [ + "degrees = sorted([(v.id(), v.in_degree()) for v in g.vertices()], key = lambda x: x[1], reverse=True)\n", + "print(degrees[:10])" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Handy functionality for tracking vertex properties over time in different window sizes\n", + "Get the top 5 all time leaders by degree and track their connectivity over time" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "iVBORw0KGgoAAAANSUhEUgAAAj8AAAG5CAYAAABhrVVvAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjcuMSwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/bCgiHAAAACXBIWXMAAA9hAAAPYQGoP6dpAAEAAElEQVR4nOydd5gUVfb3v7eqOk1kGJLEIQiIElRkFTNm111X/emru7jqiqsiZkUUVAy4rqKoiDlgxoABFcNiDogiSTJDTsMwOXWq8P5R6Vbonp6enumemfvh4ZnuirduV/jWOeeeQxRFUcBgMBgMBoPRQeDS3QAGg8FgMBiM1oSJHwaDwWAwGB0KJn4YDAaDwWB0KJj4YTAYDAaD0aFg4ofBYDAYDEaHgokfBoPBYDAYHQomfhgMBoPBYHQomPhhMBgMBoPRoWDih8FgMBgMRocio8TPs88+i4svvjjm/GnTpmHcuHGWabIs44knnsCxxx6LUaNG4YorrsDOnTtbuqkMBoPBYDDaKBkjft544w089thjMecvWrQI7777rmP6U089hTfffBP33Xcf5s2bB1mWMWHCBEQikRZsLYPBYDAYjLZK2sXPvn37cNVVV2HmzJkoKipyXaa0tBR33nknxowZY5keiUTw0ksv4brrrsMJJ5yAoUOHYtasWSgpKcGXX37ZCq1nMBgMBoPR1ki7+FmzZg08Hg8WLFiAkSNHOuYrioIpU6bg7LPPdoif9evXo76+HkcddZQxLS8vD8OGDcNvv/3W4m1nMBgMBoPR9hDS3YBx48Y54nho5s6di/379+OZZ57Bs88+a5lXUlICADjggAMs07t162bMSwZFUSDLmV3snuNIxrcxHbB+cYf1izusX9xh/eIO6xd3MqVfOI6AEJLQsmkXP/FYv349nnzySbzxxhvwer2O+cFgEAAc83w+H6qrq5u1b55Pu1GsUXg+sR+5o8H6xR3WL+6wfnGH9Ys7rF/caWv9krHiJxwO45ZbbsHVV1+NoUOHui7j9/sBqLE/+md93UAgkPS+ZVlBTU1D0uu3NDzPIS8vgJqaICRJTndzMgbWL+6wfnGH9Ys7rF/cYf3iTib1S15eIGHDRcaK
n5UrV2LTpk148sknMWfOHABANBqFKIo49NBD8fzzzxvurtLSUvTt29dYt7S0FEOGDGnW/kUx809uSZLbRDtbG9Yv7rB+cYf1izusX9xh/eJOW+uXjBU/I0aMcIzYeu211/Dll1/itddeQ/fu3cFxHHJycrBkyRJD/NTU1GDt2rUYP358OprNYDAYDAYjw8lY8eP3+9GvXz/LtPz8fAiCYJk+fvx4zJw5E507d0avXr3w8MMPo0ePHjj11FNbu8kMBoPBYDDaABkrfhLluuuugyiKmDZtGkKhEI444gi8+OKL8Hg86W4ag8FgMNKMLMuQJDEF2yEIhXhEImFIUvpHNmUKrdkvPC+A41IzGIkoisJ+RRuSJKOioj7dzYiJIHAoKMhGZWV9m/KxtjSsX9xh/eIO6xd32ku/KIqCmpoKBIN1Kdsmx3GQ5bbbJy1Fa/ZLIJCDvLzOrkPaO3fObvsBzwwGg8FgJIsufHJyCuD1+hLO/xIPnifM6uNCa/SLoiiIRMKoq6sEAOTnFzZre0z8MBgMBqNdIcuSIXxycvJStl1B4Nq0NaylaK1+8Xp9AIC6ukrk5hY0ywWW+Zn8GAwGg8FoApIkATAfloz2g/6bNjeOi4kfBoPBYLRLUuHqYmQWqfpNmfhhMBgMBoPRoWDih8FgMBiMNsBrr72MSZP+3aR1gsEg5s9/p4VaFJuFCz/GMceMbvX9JgoTPwwGg8FgZDjvv/8unn/+6Sav99Zbr+Gtt15rgRa1bdhorwwiKNbjq5L3cEThOHQP9El3cxgMBoORZsrK9uOhhx7A8uVL0adP38ZXsMFS+bnDLD8ZxAc7nsOCnS/h7pWXpLspDAaDwcgA1q9fB49HwNy5b2HYsEMc80OhEB588D789a+nYdy4sbjssr/ju+++BgC8+OKzePnl51FSshfHHDMae/fucay/cOHH+H//72/G3xNPPAr/+td4rFq1wlgmHA7h+eefxvnnn41x48bi0kv/jm+//cqyne+++wb//Of/w7hxYzFx4gSUlOy1zI9Go3jqqSfwt7+dgVNOORb//vel+PXXX1LQQ8nBLD8ZxNa6dQAAWZHS3BIGg8FohygKEG3GEGmZA5qTz8YjAE0crXTMMcfhmGOOizn/+eefxubNm/Dww48jNzcXH3/8Ie6663bMm/cBLrroYgSDQXz99f/w/POvoFOnAtdt7NtXgg8/nI8777wPWVlZeOSRBzFjxnTMm/cBCCGYPn0qNmxYj1tuuR29e/fB//73Oe68cwpmzHgYxx13AlatWolp0ybjssuuwMknn4aVK5dj1qyHLfuYMWM6tm/firvuug9du3bDTz99j8mTb8ADD8zE2LHHNKlPUgETPxlEQMhJdxMYDAajfaIoyHrtQ/C7S9LWBLF3DwTH/63JAigee/bsQlZWNnr27IXc3FxMmHAVRo06DLm5ecjKykIgEADHcSgs7BK7XaKIW2+9HQceOAQAcOGF/8Dtt9+C8vJy1NXV4ocfvsN//zvLECmXX34lios34bXXXsJxx52Ad9+dh+HDR+Jf/1KDsfv27YctWzbj3XffAgDs2rUTixZ9gZdffoPax3gUF2/Cm2++ysRPR8dDvOluAoPBYLRblHaY9ucf/7gEt912I84662QMG3YIxow5Eqeccjpycpr2Mt2vX3/jc3a2uq4oRrF5czEAYMSIUZblDz30MDzzzBwAwObNxTjiiD9Z5h9yyAhD/GzcuAEAMHHiBMsyoigiJye3Se1MFUz8ZBAsHxeDwWC0EISoVpdmuL2aXcYhCbdXYxxyyAi8//6n+O23JVi69Fd89tknmDv3BTzyyGyMHj0m4e14vc6XbzVY2j1gWpZlCIIqIQghkGXrcvo8dTtqn82Z8zyysrIty6WqSntTYQHPGQRhPweDwWC0HIQAXk/6/rfAG+6LLz6LVatW4JhjjscNN9yKt956H7169ca3336tHXLz9jlw4IEAYAmABoCVK1egqEi1Fh144GCs
Xr3SMn/9+rXG5/79BwIAysvL0Lt3H+P/p58uwMKFHzerfcnCnrYZBTP9MBgMBiNx9uzZhYcf/g9+//03lJTsxbfffo2SkhIMHz4CABAIZKG2tgY7dmyHKDbd6lVU1B9jxx6LRx55ED///CN27NiOl19+Hj/++B0uumg8AODvf78YmzZtxJNPPoYdO7bjyy8/w/vvm4kVBwwYiLFjj8XDD/8HP/74PXbv3oU33ngFr78+F7169U5NRzQRJn4yCI75vRgMBoPRBG666TYcfvgY3HvvnbjoonPxwgtP4+qrr8Vpp50JADjhhHEoLOyCSy+9CBs2rE9qH/fc8wCOO+5EPPjgfbj00ovw008/4P77H8KJJ54MABg8eAhmznwCy5YtxaWXXoR5897AP//5L8s27r33PzjhhHF4+OEHcPHFF+Czzz7FlCl34owzzmpeByQJUVgGJAeSJKOior7V9/vMhruwrOI7AMCzR34b01wpCBwKCrJRWVnfPP9zO4P1izusX9xh/eJOe+iXaDSC8vK9KCw8AB5P6gaSNDvmp53Smv0S77ft3DkbPJ+YTYdZfjIIWuxILNcPg8FgMBgtAhM/GQShYn6icjiNLWEwGAwGo/3CxE8GEZZCxud6sSaNLWEwGAwGo/3CxE8GUS9WG5/rqM8MBoPBYDBSBxM/GURIClKfG9LYEgaDwWAw2i9M/GQQohI1PkdYzA+DwWAwGC0CEz8ZhKSYCagicijOkgwGg8FgMJKFiZ8MIipHqM/M8sNgMBgMRkvAxE8GQVt+6JFfDAaDwWAwUgcTPxmEKJsxP7QQYjAYDAaDkTqY+Mkg6IBnluGZwWAwGDU11Xj44Qdwzjln4tRTj8fVV1+OlStXNGube/fuwTHHjMayZUtT08gEWbjwYxxzzOhW3WcsmPjJEGRFtlh7ZCZ+GAwGo8Nz9913YPXqVZg+fQZeeOFVHHjgYNx00zXYsWNbupvWpmHiJ0Owu7mY+GEwGIyOza5dO/Hbb0tw881TMHLkoejbtx9uvHEyunTpii+//DzdzWvTCOluAEOFjvcBmPhhMBiMjk5+fic8/PBjGDp0mDGNEAJCCGpr1RJIM2ZMN5b9/PNPEQw24PDDj8DkyVPRpUtXAMCWLcV47LGZWLt2NQoLu+Diiy+Nu9+FCz/GK6+8iEsuuRyvvPIiSkv3oX//gbjhhlswYsQoAEA4HMKrr76ML7/8HOXl+9G3bxEuvfRynHDCScZ2vvvuG7z44jPYtWsnhg4dhtGjx1j2E41G8fzzT+PLLz9DfX0d+vcfiAkTrsKYMUc2s+cah1l+MgQ63gdgMT8MBoORahRFgSQG0/ZfUZQmtTc3NxdHHXUMvF6vMe3bb7/Crl078ac/jTWmLVr0BWpqqjFnzvOYOfMJbNiwDs899xQAoK6uDtdfPxHZ2Tl47rlXcMstUzB37ouN7nvfvhJ8+OF83HnnfXjxxdcRCAQwY8Z04ximT5+Kzz77BDfeeCtef/1tHHvs8bjzzin4/vtvAQB//LES06ZNxgknnIS5c9/CGWechddff8WyjxkzpuO3337BXXfdh5deegPjxp2MyZNvwM8//9ikfkoGZvnJEByWHzDxw2AwGKlCURQUf3ctGipWp60NWYWHYNBxs0EISWr9P/5YiQceuBfHH38ixo49xpienZ2DyZOnQhAE9OtXhJNOOhWLF/8EQBVGoVAQU6dOR05ODgYMGIjrrrsZd9xxS9x9iaKIW2+9HQceOAQAcOGF/8Dtt9+C8vJy1NXV4ocfvsN//zsLY8ceA0HgcPnlV6K4eBNee+0lHHfcCXjvvbcxfPhI/Otf/wYA9O3bD1u2bMa7774FQHXpLVr0BV5++Q1qH+NRXLwJb775quX4WgImfjIEZvlhMBiMFiY5zZER/PDDt7jnnmkYPnwk7rrrfsu8Xr16QxDMx3l2dg5EUY0j3bKlGH369EVOTo4xf/jwEQnts1+//pZtAoAoRrF5czEAGC4wnUMP
PQzPPDPH2K/dfXXIISMM8bNx4wYAwMSJEyzLiKKInJzchNrXHJj4yRDs4ofF/DAYDEbqIIRg0HGzITcjgawgcBBFOen1Od6flNVn/vy38fjjj+DEE0/CtGn3wuPxWObbvwMw3FOEEMiy1d3G84k9+ml3m3W77u47WZYNEea2X1qgKYraj3PmPI+srGzLchzX8hE5LOYnQ7C7vRbtfTdNLWEwGIz2CSEEvBBI2/9khM8HH7yHWbMexrnnXoDp0x9wFTrxOPDAwdi5czuqqqqMaRs2rG1yO2gGDjwQALBq1QrL9JUrV6CoqL+x39WrV1rmr19v7rd//4EAgPLyMvTu3cf4/+mnC7Bw4cfNal8iMPGTIUg2yw+DwWAwOjY7dmzH44/PxHHHnYiLL74UFRXlKC8vQ3l5Gerq6hLaxkknnYbOnQsxffod2LRpI5Yv/x2PP/5Is9pVVNQfY8cei0ceeRA///wjduzYjpdffh4//vgdLrpoPAA1fmfTpo148snHsGPHdnz55Wd4//13jG0MGDAQY8cei4cf/g9+/PF77N69C2+88Qpef30uevXq3az2JQJze2UIUZmJHwaDwWCYfPvtVxBFEd9//w2+//4by7wzzjgLU6dOb3QbgUAAjz/+NGbNeggTJ16O3Nw8TJhwFR544J5mte2eex7As8/OwYMP3oe6uloMGDAI99//EI4//kQAwIEHDsHMmU/gqaeewPvvv4OiogH45z//haefnm1s4957/4PnnpuDhx9+ALW1NejZszemTLkTZ5xxVrPalghEaerYuxbk2WefxY8//ojXXnvNmPb1119jzpw52LJlCwoKCnDaaafh+uuvh9/vBwCEw2E8+OCD+PzzzxEKhTBu3DhMnToVnTt3TrodkiSjoqK+2cfTFNZXL8Oja2+0THvuqO9clxUEDgUF2aisrG+W/7m9wfrFHdYv7rB+cac99Es0GkF5+V4UFh4Aj8cZt5IszY35aa+0Zr/E+207d84Gzyfm0MoYt9cbb7yBxx57zDJt6dKlmDRpEk455RR88MEHuPvuu7Fw4ULcc4+pWKdPn44ff/wRs2fPxiuvvIItW7bguuuua+XWN5+oHEl3ExgMBoPB6BCkXfzs27cPV111FWbOnImioiLLvHnz5uFPf/oTrrrqKhQVFeH444/HjTfeiI8//hiRSAT79u3Dhx9+iGnTpmH06NEYMWIEHn30Ufz2229Yvnx5eg4oSfTyFj4uAADIFTqlsTUMBoPBYLRf0i5+1qxZA4/HgwULFmDkyJGWef/6179w2223WaZxHIdoNIq6ujr8/vvvAIAjjzRzCfTv3x/du3fHb7/91vKNTyGiZvnx81nqd1utLwaDwWAwGKkh7QHP48aNw7hx41znDRs2zPI9Go1i7ty5OOSQQ9C5c2fs27cPBQUF8Pl8luW6deuGkpKSFmtzS1AdrQAA+PgAEHXm/WEwGAwGg5Ea0i5+EkUURUyePBmbNm3CG2+8AQAIBoOuSZh8Ph/C4XCz9icIrWsU21K3BgDAEx4AICtizDboAV2JBnZ1FFi/uMP6xR3WL+60h36R5dSnctZT9BACZM4wofSTrn7hedKs53SbED91dXW44YYb8Ouvv+LJJ5/EiBFqam6/349IxBkoHA6HEQgEkt4fxxEUFGQ3vmAK8XnVn6Jv/gDsDW6HpEjI7xQAR2L/uHl5yR9je4b1izusX9xh/eJOW+6XUIhHWRnX7AekG21ZFLYkrdUvskzAcRzy87OMUd/JkPHip7S0FFdccQV2796NF198EUcccYQxr0ePHqiqqkIkErFYgEpLS9G9e/ek9ynLCmpqGprV7qZS0aC6vQZlj8QSqPkcyiqq4eGcli2e55CXF0BNTRCSxIZd6rB+cYf1izusX9xpD/0SiYQhyzIkSUnZEGxC1L6RJJlZfihau18kSYEsy6iubkAwaC0DlZcXSFiEZbT4qa6uxiWXXIK6ujq88cYbGDJkiGX+4YcfDlmW
8fvvv+Ooo44CAGzduhX79u2ziKRkaO1cDiFRFVsBLs+YFo5GQOLUYJEkmeWccIH1izusX9xh/eJOW+4XSUr9U1h/sDPhYyVd/dJcYZvR9rv//Oc/2LlzJx5++GF07twZ+/fvN/5LkoTu3bvjz3/+M6ZNm4YlS5Zg1apVuOmmmzBmzBiMGjUq3c1vEnoVdx9nmvHs9b4YDAaDwWA0n4y1/EiShIULFyIajeKSSy5xzP/qq6/Qu3dv3HfffXjggQcwadIkAMBxxx2HadOmtXZzm42e58fDeUHAQYHMhrszGAwGg9ECZJT4efDBB43PPM9j1apVja6TlZWF+++/H/fff39LNq3F0cUPTwQIREBUibBipwwGg9HBqayswJNPzsKSJYsRDocxatRhmDTpRvTrV9Sk7Sxc+DEeeOAe/Pjj0pZpaAxmzJiOvXv34Mknn2vV/TZGRru9OhK0+OE5DwBAlJnlh8FgMDoyt99+ixb+8Tief/5V+Hw+XH/91QiFQuluWpuGiZ8MQY/50S0/6jQmfhgMBqOjUlNTgx49DsCUKdNw0EEHo6ioPy65ZALKyvZj69bN6W5emyaj3F4dGUmz8vAcD4Golh/m9mIwGIzUoSgKInLyFhOJcBCbMfzfy/lBSOIJGPPy8jB9+gzje2VlJd55501069YdRUUDAAAvvvgsli//HYWFhVi8+GecccafceONk/Hdd9/gxRefwa5dOzF06DCMHj0m7r5mzJgOAMjP74TPP/8UwWADDj/8CEyePBVdunQFAOzbV4Jnn52DpUt/RUNDPUaMGIWJE6/H0KHqSGxFUfDKKy/io4/eR21tDcaNOwWRiDXh8P79pYYbj+N4DB8+ApMm3Yg+ffom3C+pgImfDMHq9lJ/Fub2YjAYjNSgKAoeWjMJm2tXp60NA3OHY/LBs5skgHT++98Z+PjjD+D1evHgg49aEvmuWLEM559/EV5++Q3Isow//liJadMm47LLrsDJJ5+GlSuXY9ashxvdx6JFX+CUU07HnDnPo6KiHNOn34HnnnsKd9xxNxoa6nH11ZejZ89eePDBR+DxePHSS89h0qQr8Npr89C1aw+8/vpcvPnma7j11tsxZMhQfPTR+1i48GOMGnUYALUqw7XXXokhQ4Zi9uznwPMc5s17A//+96V49dV56Nq1W5P7JVmY2ytD0MUPR3jwmtuL1fdiMBiMVJL6shetxQUXXIQXXngNJ598Gm6//WZs2LDeMv/yy69Er1690adPX7z33tsYPnwk/vWvf6Nv3374y1/+hrPPPrfRfWRn52Dy5Kno168Ihx56OE466VT88cdKAMAXX3yG6uoq3HfffzFs2CE48MDBmD79fvh8frz33jtQFAXvvfc2zj//Qpxyyuno27cI1157Ew48cLCx/a+++gJ1dbW48877cOCBgzFgwCBMmXIncnJysGDBB6ntsEZglp8MwRrzo7u9mOWHwWAwUgEhBJMPnt0st5cgcM1KrNdUtxdN//6qm2vKlDuxdu1qzJ//Nu64424AQEFBZ+Tk5BjLbtlSjDFjjrSsf8ghI/Duu2/F3UevXr0hCKYsyM7OgSiqz6HNm4vRp08/FBQUGPN9Pj+GDTsYmzcXo7q6GuXlZTjoIGtB8oMPHoFt27YAADZs2ICamhqcccaJlmUikQi2b9+WSDekDCZ+MgR3txez/DAYDEaqIITAxydfs0zgOfBK62W9rqqqwtKlS3DCCScZooTjOBQVDUBZ2X5jOZ/PZ1mPEAJZtqZcpkVNLDwej2OaYqRudk/hLMsyBEEwCpzG26+iyOjbtx8efPBRx3aaU48zGZjbK0Ow5vnRhrozyw+DwWB0WCoqyjB9+lT8/vtvxjRRFLFx43oUFfWPud6BBw7G6tUrLdPWr1/brLYMHHggdu7cjsrKCmNaOBzG+vXr0L//AOTnd0K3bt0NN5nOhg3mfvv3H4iSkr3IyclF79590Lt3H/TocQCeeWY2VqxY3qz2NRUmfjIA
WZGgaKqaJzwb6s5gMBgMDBgwCEceORazZj2MFSuWYcuWYtx//92ora3FBRf8I+Z6F144Hps2bcSTTz6GHTu248svP8P777/TrLaccsrpyM/vhDvvnIJ169aguHgT7r13GoLBIM455zwAwPjxl2L+/HfwyScfYseO7Xj++aexdu0aYxunnXYm8vLyMW3aZKxZsxrbt2/D/fffjV9++RkDBw5qVvuaChM/GYAe7wNYkxyyoe4MBoPRsZk+/QGMHj0Gd999B6644hLU1FRjzpzn0aNHj5jrHHjgEMyc+QSWLVuKSy+9CPPmvYF//vNfzWpHTk4OZs9+Frm5ebj++omYOHECwuEwnn76RfTs2QsAcO6552PixGvxyisv4dJL/44tWzbjrLPOtmzjySefQ35+Pm6+eRImTPgnysr2Y9asOXEtWS0BURRWo9aOJMmoqKhvtf2FpAZc9+sZAIDZY77AsxvvwuqqJbh04O0Y2+10x/KCwKGgIBuVlfVttupyS8D6xR3WL+6wfnGnPfRLNBpBefleFBYeAI/Hm7LtNjfgub3Smv0S77ft3DkbPJ+YTYdZfjIAu+WHI7w2nbm9GAwGg8FINUz8ZAC0yOEJD2L8LMwox2AwGAxGqmHiJwPQS1twhAchBJw2ZlBm4ofBYDAYjJTDxE8GQA9zB2BYfpRWzCfBYDAYDEZHgYmfDKA8vA8AJX40y4/CLD8MBoPBYKQcJn4ygMpIKQAgJKkjzJjlh8FgMBiMloOJnwxA1kZ7HZQ/GgDAgVl+GAwGg8FoKZj4yQD0mB8vp9ZnIUT9WWRm+WEwGAwGI+Uw8ZMB6OJHz+9DmOWHwWAwGIwWg4mfDEBPcmgGPLOYHwaDwWBY2bFjO0455VgsXPixMU1RFHz22SdGwdGFCz/GMceMTlcTLcyYMR2TJv073c1whYmfDMAUP8zyw2AwGAwnoiji3nvvRDAYtExfsWIZZsyYjlAolKaWtU2Y+MkA7Hl+ON3yA2b5YTAYDAbw4ovPIjs72zGdledMDiHdDWC4JTnUMjyzk5rBYDA6PCtWLMNHH72Pl19+A+edd5YxfdmypbjuuqsAAOef/1fcccfdxryFCz/G3LkvoKxsP/r3H4ibbroNBx98iOv2Z8yYDgDIz++Ezz//FMFgAw4//AhMnjwVXbp0BQDs21eCZ5+dg6VLf0VDQz1GjBiFiROvx6BBBwJQRdgrr7yIjz56H7W1NRg37hREImHLfvbvL8WTT87CkiWLwXE8hg8fgUmTbkSfPn1T1leJwiw/GYBe3sIR88MsPwwGg5EyFEVBSBLT9j8ZK01tbS3uu+8u3HDDrejevYdl3vDhIzFjxkMAgOeffwUnnXSKMW/Bgg8wffoMvPDCq/B6Pbjrrilx97No0ReoqanGnDnPY+bMJ7Bhwzo899xTAICGhnpcffXlKC3dhwcffARPP/0SfD4/Jk26AiUlewEAr78+F2+++RomTrwOL730OnJzc/HVV/8zth8MBnHttVcCAGbPfg5PPvks8vM74d//vhT795c2uV+aC7P8ZABGzA9ntfwwc2YLIMsIvLsQUo+uiBz/p3S3hsFgtBKKomDyqh+xrqYybW0YltcZ/x1xtJHFPxFmzvwPDjlkBE499XTHPI/Hg9zcPABAp04F8Pn8xrwpU+5EUVF/AMCFF16MqVNvRWVlBQoKOrvuJzs7B5MnT4UgCOjXrwgnnXQqFi/+CQDwxRefobq6Ci+++DoKCgoAANOn348LLvgb3n//HVx77Q147723cf75F+KUU9R2XnvtTVi2bKmx/a+++gJ1dbW48877IAiC0cbly3/HggUf4PLLr0y4T1IBEz8ZQERWA9i8nBcAleGZWX5SDr9tF4QtOyFs2cnED4PRwdBfLNsKn3/+KVatWoFXXpnX5HVpV1Jubi4AIBwOx1ocvXr1NkQJoIohUVS9Eps3F6NPn36G8AEAn8+PYcMOxubNm1FdXYXy8jIcdNAwyzYPPngEtm3b
AgDYsGEDampqcMYZJ1qWiUQi2L59W5OPr7kw8ZMB1Ik1AIAcIR8AoL8UMMtPauFK9oMro976RAkQ+PQ1iMFgtBqEEPx3xNEIy1LS2xAEDqKY/Eupj+ObZPX59NMFqKgox3nn/dkyfebM/+Crr/6HRx55Iua6PO+8t8V7png8njjLu68nyzIEwTwmWbYuR4spRZHRt28/PPjgo47tBAKBmO1qKZj4yQDqotUAgGxd/GiWH5lZflJHKIzsl9+zTCKhEJQc5+gJBoPRPiGEwM8n/9gTeA5iK+Zfu+uu+xzWmgsvPAeXX34lTj31DABokphKloEDDzRyCelus3A4jPXr1+H00/+M/PxO6NatO/74YyWOO+4EY70NG9aC1/q7f/+B+PzzT5GTk4tOnToBUIfvT59+B0488RRLvFJrwAKeM4B63fLj0S0/+s/CLD+pgoRczL0y618Gg5G5dO3aDb1797H8B4CCgs7o2rUbACAQyAIAbNq0EQ0NDS3SjlNOOR35+Z1w551TsG7dGhQXb8K9905DMBjE2WefCwAYP/5SzJ//Dj755EPs2LEdzz//NNauXWNs47TTzkReXj6mTZuMNWtWY/v2bbj//rvxyy8/Y+DAQS3S7ngw8ZMB1Imq5SdHUAPXOJeA56VlX+O/qyehItz6UfHtAe9vq5wTmVuRwWC0cQYOHISjjjoad999Oz766P0W2UdOTg5mz34Wubl5uP76iZg4cQLC4TCefvpF9OzZCwBw7rnnY+LEa/HKKy/h0kv/ji1bNuOss862bOPJJ59Dfn4+br55EiZM+CfKyvZj1qw5RmB2a0IUFljiQJJkVFTUt9r+rl1yOsJyEPePegPdAr3x3ran8eXeeTi154X4v35XAwD+vfh4AMCYwpNw1bDpKCjIRmVlfbP8z+0NQeBi9kvuf552LF83cTyU/NzWal7aiNcvHRnWL+60h36JRiMoL9+LwsID4PF4U7bd5sb8tFdas1/i/badO2eD5xOz6TDLT5qJyhGEtdFe2YbbK/ZQ95AcdExjMBgMBoOROEz8pJl6sRaAGuQc4LONz4D7UHcf53dMYzSCNlzTATN6MhgMRoeEiZ80I8oRAICH8xo1veJZfsxgaEaikEg03U1gMBgMRgbBnqRpxl7XCwA47WdZVbnYuQKzVjQdJn4YDAaDQcHET5oxxY+ZkCokqcMVsz15juUVNvy9yTDLD4PBYDBomPhJM26Wn6H5h1mWod1fTPokQSzxwzqTwWAwOiQZJX6effZZXHzxxZZp69atw/jx4zFq1CiMGzcOr776qmW+LMt44okncOyxx2LUqFG44oorsHPnztZsdrPQxQ9HWX70z4qWSVRfBmD1vpKBRGMEPDP1w2AwGB2SjBE/b7zxBh577DHLtMrKSlx22WXo27cv5s+fj2uuuQYzZ87E/PnzjWWeeuopvPnmm7jvvvswb948yLKMCRMmIBKJtPIRJIdR0Z2O+dHEjz5PVEzLBUvL1HRI1Ow/cVC/NLaEwWAwGJlA2sXPvn37cNVVV2HmzJkoKiqyzHvnnXfg8Xhw7733YuDAgTjvvPNw6aWX4rnnngOgVoN96aWXcN111+GEE07A0KFDMWvWLJSUlODLL79Mw9E0HVF2CXjWRnTJioR11b/jodWTjHks5icJNLeXWNQbwfPPhOLVCvixrmQwGIwOSdrFz5o1a+DxeLBgwQKMHDnSMm/p0qUYM2aMpTLskUceiW3btqGsrAzr169HfX09jjrqKGN+Xl4ehg0bht9++63VjqE5uAU8c1Sen1lrb8Kuhs2O5RmJowc8G6KnFQoBMhgMBiNzSbv4GTduHGbPno0+ffo45pWUlKBHjx6Wad26qcXc9u7di5KSEgDAAQcc4FhGn5fpRGW14CbPOd1eskv14P2h3a3TsPaE7vbyeGwzmOmHwWBkNvv3l+KYY0Y7/i9c+DEANRRCr7gOAAsXfoxjjhmdziYbzJgxHZMm/TvdzXBFaHyR9BEK
heD1Wmt3+Hw+AEA4HEYwqJZ6cFumurq6WfsWhNbRhRtqlwFQLT/6Pj2apUuG5Fh+b3C7Ubsk0RomHYVY/cJrGZ6J32P5XQWeg9JKv3M6YeeLO6xf3GkP/SLLqbfu6gZjQlo33Vpx8SZ4vT68885HFqN1Tk4OAGDFimWYMWM63n13Qes1iiJd/cLzpFnP6YwWP36/3xG4HA6rlpKsrCz4/Wqph0gkYnzWlwkEAknvl+MICgqyk16/Kfj9qjXC7/EZ+8yHtm/iPJM4wiM3Vz3WvLzkj7E9Y++XKAdIAHy5WcgpyEaII8ZyXCv9zpkAO1/cYf3iTlvul1CIR1kZ1+wHpButLQq3bduMvn37okePbq7zOe1+xvMcBIEzvrfWC7yOW78QQkBIan8DWSbgOA75+VmW535TyWjx06NHD5SWllqm6d+7d+8OUXujLy0tRd++fS3LDBkyJOn9yrKCmpqGpNdvCmW1ZQCAEZ2ORmWlWkm+vlYVfKLktPzIioQHFt+MqWMfRU1NEJLEhr7r8DyHvLyAtV9kGYFv1fivkAzUVdbDrwAEQE11AxSPL30NbiVc+4XB+iUG7aFfIpEwZFmGJCkpqzZOiNo3kiS3qoVj06ZN6NevyPU4li1biuuuuwoAcO65Z+GOO+425i1Y8BHmzn0BZWX70b//QNx00204+OBDXPcxY8Z0AEB+fid8/vmnCAYbcPjhR2Dy5Kno0qUrAGDfvhI8++wcLF36Kxoa6jFixChMnHg9DjzwQPA8B1GUMHfui/joo/dRW1uDceNOQTgcgqKYv8H+/aV48slZWLJkMTiOx/DhIzBp0o3o06eva7vckCQFsiyjuroBwaD1GZmXF0hYnGa0+DniiCMwb948SJIEnlfjYH755Rf0798fhYWFyM3NRU5ODpYsWWKIn5qaGqxduxbjx49v1r5TdcE0RlBURZaPZBn7VDSTbazg5qVl36rzJbnV2tmWoPtFWFdsTvd4LP0lSjKUDtR/7Hxxh/WLO225XyTJXZ0oioKw850yYQRFgSgmr3x8vFm7MVE2by5Gp06dcM01V2DHju3o3bsPLrnkchx55FgMHz4SM2Y8hKlTJ+P551/BgAED8dVX/wMALFjwAaZPnwG/34+HH34Ad901BfPnfxJzP4sWfYFTTjkdc+Y8j4qKckyffgeee+4p3HHH3WhoqMfVV1+Onj174cEHH4HH48VLLz2HSZOuwNy5b6F371547bW5ePPN13DrrbdjyJCh+Oij97Fw4ccYNUpN2hsMBnHttVdiyJChmD37OfA8h3nz3sC//30pXn11Hrp2dbdsxaK5wjajxc95552HF154AVOnTsWECROwatUqzJ07F/fccw8ANdZn/PjxmDlzJjp37oxevXrh4YcfRo8ePXDqqaemufWJoSctJFTsuT7UvSZakZY2tSdI2HSbKn6rlYeAhTwzGB0FRVFwx68i1lel76of2onggTFCwgJIFEXs2LENHNcf1157E7KysrFo0Re49dbrMWvWHIwePQa5uWoZpE6dCuDzmW6gKVPuRFFRfwDAhRdejKlTb0VlZQUKCjq77is7OweTJ0+FIAjo168IJ510KhYv/gkA8MUXn6G6ugovvvg6CgoKAADTp9+PCy74G95//x1ce+0NeO+9t3H++RfilFNOBwBce+1NWLZsqbH9r776AnV1tbjzzvuMEdxTptyJ5ct/x4IFH+Dyy69sSlc2m4wWP4WFhXjhhRcwY8YMnHPOOejatSsmT56Mc845x1jmuuuugyiKmDZtGkKhEI444gi8+OKL8DhG9mQmuvmUvhi49A/Ca5coWbYYBqZ8GAxGBiMIAj799CvwPGcIm6FDD8LWrVvw1luvY/ToMTHXpV1Jubm5AMyYWTd69eptSSuTnZ1jhJZs3lyMPn36GcIHAHw+P4YNOxibN29GdXUVysvLcNBBwyzbPPjgEdi2bQsAYMOGDaipqcEZZ5xoWSYSiWD79m3xuqFFyCjx8+CD
DzqmjRgxAm+//XbMdXiex6233opbb721JZvWYpiWH0r8UDl/YuE2DJ7RCD51VKBC6N5mMBgdAUJUq0uz3F4C1yxXSzJur6ysLMe0AQMGYsmSn+Oup4eK0MSrEOBmMDCXd19PlmUIAm8ckyxbl6PFlKLI6Nu3Hx588FHHdpozQClZmIkhzegZmy2WnwTET1RuG+U7MgnFY9f6zPTDYHQkCCHwC+n731Ths2XLZpx66vEW9xEArFu3Bv37DzCOqaUZOPBA7Ny53cglBKhWpPXr16GoaADy8zuhW7fu+OOPlZb1NmxYa3zu338gSkr2IicnF71790Hv3n3Qo8cBeOaZ2VixYnmLH4MdJn7SjKmsafHT+M8SlZj4aSpyQX66m8BgMBgJU1TUH/369cOjjz6ElSuXY/v2bZg9+1GsXbsal1xyOQAgEFAtQ5s2bURDQ8uMUj7llNORn98Jd945BevWrUFx8Sbce+80BINBnH32uQCA8eMvxfz57+CTTz7Ejh3b8fzzT2Pt2jXGNk477Uzk5eVj2rTJWLNmNbZv34b7778bv/zyMwYOHNQi7Y4HEz9pRrf80HE+xOVnuXGY1VTILD8JIqsmaqlnd8PtZcAMPwwGI4PhOA7//e8sDBt2MO66awouu+wfWLt2NWbNmoMBA1TBMHDgIBx11NG4++7b8dFH77dIO3JycjB79rPIzc3D9ddPxMSJExAOh/H00y+iZ89eAIBzzz0fEydei1deeQmXXvp3bNmyGWeddbZlG08++Rzy8/Nx882TMGHCP1FWth+zZs0xArNbE6KwMuEOJElGRUV9q+zr0bU3YX3177h80DT8qespAIDK8H7ctuz/LMs9eNi7mLLsfOP7syd/Ak84v80ORW0JBIFDQUE2KivrjX7x/LYK/kU/IXrQQIT+po4AzH78ZXANIdRPuABy18J0NrlVcOsXBuuXWLSHfolGIygv34vCwgPg8XgbXyFBmhvz015pzX6J99t27pydcJ4fZvlJN4oe80NZflzcXhzhMWnof4zvzPKTIMZwOnaqMxgMBkOFPRHSjOw22stlLBJHOIwoGIs8j5qjgcX8JAbR3F6wvA1o/ctsngwGg9EhYeInQ6Aj9t0sPzzUEWACUYcjRuVo6zSsraOl51c4SlCyce4MBoPRoWHiJ80oitPy45aFRh/+7uFUH2dUjp2sqqMQrtsFMVwdfyHd8sOxU53BYDAYKhmV5LAjYuT5QeMxPwAgcJTlpwM/zyMN+7D+S7V+28hzv429oJ50i3NxezEYDAajQ9KBH5+ZgSl+TNwsPzyxu706dsxPQ+UG43PcAYvxLD9soCOD0a5hg5nbH6n6TZn4STOKy2gvtySHDrdXBw945gUz5bsshWIuR9zEDzP8MBjtGr20QyTCwgPaG/pvyvPNc1wxt1eaUeDM8Owe86M+vAUj5qdjix/CmSVA5GgdeCFGbRjZJeCZqR8Go13DcTwCgRzU1VUCALxeX0rKQMgygSQxa5Kd1ugXRVEQiYRRV1eJQCAHXDPjOJn4STNGhmeS2MOZub1UFFk0PsvUZwfM7cVgdEjy8tS0ILoASgUcx0GWWZJDO63ZL4FAjvHbNgcmftKMYlRnp2t7xRY/zO2lIlND/ZV4QtAt4JkZfhiMdg8hBPn5hcjNLYAkxXlBShCeJ8jPz0J1dQOz/lC0Zr/wvNBsi48OEz8ZgnWoe+wf18MsPwAAhRY/UpycR2yoO4PRoeE4DhzX/BIXgsDB7/cjGJRYiQuKttov7ImQZtwyPMfzTVuGundggpUbjc9KHLcXcY350VdMebMYDAaD0QZg4ifduNX2ivOz8MzyAwAQIzXGZzmu28tttBfzezEYDEZHhomfNJNonh8dfdSXGSvUMYnU7zY+xxvq7p7kUIeZfhgMBqMjwsRPmjHEj6Wqe+PiR+7AD24xXIW6/cuM79uXTI+9sGthUwaDwWB0ZNgTIc0YSQ7jWHsuLLrO+Ky7xGRFatmGZTDBqmLL
d1lsiLmsa5JDnY6rHxkMBqNDw8RPmjHdXu7ihwOPcQecZ3433F4d+MntkgE7JnrAM21NMz534D5kMBiMDgwTP2lGgTPPjwVi/8osP03K1MrcXgwGg8GwwZ4IaUY34MRMbGgzTugPfoVZLQyyCg6KPTNewDPrQgaDweiQMPGTZhqz/MiwWng4qDWtOrLlR7Zlt1bi9AWRWGFTBoPBYFhh4ift6LW9EvspdMuP3IFjfuzlLOIlOTQLm7Kh7gwGg8FQYeInzTRVxHAs5se0/BDVCqbEy3at50Nyq+rOtA+DwWB0SJj4STv6aK9ELT/aaK8O/OTWLT+8J1v7Hkf8GG4vvqWbxWAwGIw2AhM/aSbWUPcuvgNclzeSHHbgDM+65YcXVPEjxxM/RsAzC/RhMBgMhgoTP2nGSHJoezZ39nV3Xd4c6t5xxY9u6eE8WZbvbrgmOWS1vRgMBqNDw8RPmtFjdzhidcvETHpouL06sPjRLT+eHPV7XMtP7IBn0oFdhwwGg9GRYeInzUiKOlKJJ4JlOokx+ksXRc2x/ISlEF7d/BD+qPwl6W2kE72KOy+olh9ZDMYe8dXBy1uQmjp4PvoK8q6SdDeFwWAwMgYmftJMTPHTmOWnGeJn4e7X8GPpp5i9/rakt5FOFElze2niBwAqtn/mvnAHj/nxL1gEYdV6RB59Nd1NYTAYjIyBiZ80I2luL7v44WL8NKmI+dndsDnpdTMB3eXH8T5jWrh+j/vCbuUtDB3U/k0//L6ydDeBwWAwMg4mftJMLMtPjiffdXljtFczYn4axLqk180kCO81v8QQg8QobGqe6kpHSvEsddzYMAaDwYiF0PgijJbEFD/WgOf/63c1KiP7cVz3v1qmp8Ly0+ZHiilOy4/gK3BftoPH/EDquMkwGQwGIxZM/KQRWZGMPD92y0++txC3HPy4Yx29AGpzYn6aVBU9E9GzYhMOnfudiYrtCxsPeHZ1e7V/OtChMhgMRsIwt1ca0a0+gFP8xIIQvbBpc6w3bfuRSCeGJFrmZkWJJX46dsAzg8FgMJww8ZNGJKo+lz3PTyw4Tbjsqd9uJEhsKm1eBhjCjwCaaHS1/CgKiN5HFrcXMeZ3GPzexpdhMBiMDkKbED+iKOLxxx/HiSeeiEMPPRT/+Mc/sGLFCmP+unXrMH78eIwaNQrjxo3Dq6+2jWG9tPhJ3PKj/mQ7a7fg4x1zk9pvrGH0bQ5CQDhN/LgVepVN65glyWE7OfwmITAPN4PBYOi0CfHz9NNP491338V9992HDz/8EP3798eECRNQWlqKyspKXHbZZejbty/mz5+Pa665BjNnzsT8+fPT3exGsbq9ErX8mD/ZR0mKn7b+9NfjnQjhDPEDOb74cQ147kjwHfz4GQwGg6JNvA4uWrQIZ511Fo455hgAwJQpU/Duu+9ixYoV2Lp1KzweD+69914IgoCBAwdi+/bteO6553DeeeelueXxkTRXDUf4hIOQ6eUSFUylwV34dPerOLrbnzE4b2TbD3g2hmkRIwbKNeZHptxaHVH8UCO9CM+q2jMYDIZOm3giFBYW4ptvvsGuXbsgSRLefvtteL1eDB06FEuXLsWYMWMgUGb9I488Etu2bUNZWWYneIuV4yceHMyHWECrat4Y721/Gov3f4HnNk5vUvsyFmO0FyV+3GJ+6Bw3bgHP7Tzmh9u73/ziaRPvOQwGg9EqtIk74tSpU3H99dfjpJNOAs/z4DgOs2fPRt++fVFSUoLBgwdblu/WrRsAYO/evejSpUs6mpwQsbI7x8Nq+UlsvS11awEANdEKdRtt3O0FmAHP+mgvWSt2SkPoEXG0tavNW74Sg7AcPwwGg+FKmxA/xcXFyM3NxZw5c9C9e3e8++67uOWWW/D6668jFArB67WOZPH51OR34XA46X0KQisYxTj14SQQIeH9Cbz5k3GET3A908IhCBw4ygXUKseZYnTtwvMcCOcBAFTu+Bz80dOM6eqC6h+F4yB4eGp9oi1H
QNrg8SeKxdglSWa/MACY5wnrFyusX9xh/eJOW+2XZomfzZs346effkJpaSkuvvhi7Ny5E0OHDkVOTk6q2oe9e/fi5ptvxty5czF69GgAwPDhw1FcXIzZs2fD7/cjErG+9euiJysry7G9ROA4goKCxFxKzaGKU0Wbh/ckvL/cYMD47OGFxNYjpvgpKMiGl3IRtsZxppq9XlXIBAJ++LK6YDeAQF4v5OWpfaP/lRUREQCE5yzHGeY5KABycvzg2+DxJ4qU5UVU+6xIstEvDCusX9xh/eIO6xd32lq/JCV+ZFnGXXfdhfnz50NRFBBCcMYZZ+Cpp57Cjh078Prrr6NHjx4paeDKlSsRjUYxfPhwy/SRI0fi+++/R8+ePVFaWmqZp3/v3r17UvuUZQU1NQ3JNbgJVNbWAlBLVlRW1ie0TkN91PyikITWk6hRT5WV9RBF63c3/rf7PfCEx7ie5yTUrtYkHFbFbjAUha+gCAAQDdejpiaIvLwAamqCkCQZpLIOfgAKsfaTT5LBAairDUFOsN/bIlx1A4wCILJs9AtDhec5y/nCUGH94g7rF3cyqV/y8gIJW6CSEj9PPfUUPv74Y9x///044YQTcPTRRwMAbr31VlxzzTWYNWsW/vvf/yazaQe6iNqwYQNGjBhhTN+4cSOKioowcuRIzJs3D5IkgddGtPzyyy/o378/CgsLk94vLRBaiqioChkOfML7o8NYEl2PLoUhirIlztdt/epIOd7aopbWOKrLGfBwmZUgT9ZGcSkyoBA/AECKNhgXniTJEEUZXEQLguY4y3HqRyNJMqRW+J3ThSBSMT+SbPQLwwrrF3dYv7jD+sWdttYvSTnp5s+fj+uuuw7nnXceOnXqZEw/6KCDcN111+Gnn35KVfswYsQIHH744bjtttvwyy+/YNu2bXjsscewePFi/Pvf/8Z5552Huro6TJ06FcXFxXj//fcxd+5cXHnllSlrQ0uR1Ggvqjp5olmhZVsFTzrg2S1LdHW03Fw3E4ug6m0iHDghS5sUcY74iqoPfyXWSKf2PdjLOtqNvakyGAyGQVKWn7KyMhx00EGu87p3746amppmNYqG4zg8/fTTeOyxx3D77bejuroagwcPxty5czFy5EgAwAsvvIAZM2bgnHPOQdeuXTF58mScc07muWvsJDXaC7T4SUy7OoqgUoGwCmQQWEVUg1hnmZ95mKqF85hxXZIYBJBvfCeaZc0xzLuDjPayJHl0SwLJYDAYHZSkxE+/fv3w3XffYezYsY55v/76K/r169fshtHk5+fj7rvvxt133+06f8SIEXj77bdTus/WQNbET6IiBrBabRK1/CiUWBBl0bINWZEd26HLbshuZSPSjWatIoQDx3lAOA8UOQo5aovTiqqWIMXjibWhFmxkBiAzyw+DwWC4kZTb65JLLsGrr76Ke++9Fz///DMIIdi+fTteeuklvPTSS/j73/+e6na2S8xHrylGKiMhPLv5D+yor3Vdh1BCKdEMz7TlJyqHLfuTXMQNbRd5c8ssBMXMCgo2xJxmweEEdZSBJFrFD9HED4SOmd2YMPHDYDAYriRl+Tn//PNRUVGBp59+Gm+99RYURcFNN90Ej8eDCRMm4KKLLkp1O9spmgWDmjJ700r8WrEPn+/djg+OOcuxhmypBJ+YdpVgrhOVwzbLj5tlx5z/a/lX6JszGKf2vDChfbUKdFV3ALyQDSlSAylaZ10uorq9Ylp+2rnhx1LeQ1G0chcdxOXHYDAYcUg6z8+VV16Jf/zjH1i+fDmqqqqQl5eHkSNHWgKgGfFRFKsFAwBWVqklOaIxAo1FxRzq7iGNj8ISZdEicCJy2BLyIicQ07OpZlVmiR/D8qMl1/LmAQ17IUassWYkGFKXDvitqxvH387Vj2z7bYMhwN+2cnEwGAxGS9CslIxZWVno2rUr8vPzcfjhh6eqTR0GxbD8qE/j3ytLEW4kMDUqmwkdE4n5ichB2/pWt5e75ccqClZW/oRd
9Zsb3VdroYtG/SgEnxrkLIarLcuRoJrsUgn40CGxiR/SEEpTQxgMBiOzSNry89FHH+GRRx7B/v37QQjBu+++i9mzZ8Pj8eCRRx5xlJxgxEYXPy9sXt3osqIcbXQZmrBkfeBF5IhleLub+HGzh2yv34De2QObtO+WQ2+hqt0Fbwzxo9e2cgx11+tetFDzMgW75SfqUvyVwWAwOiBJWX4WLlyI2267DUceeSQeffRRyNpN9pRTTsF3332Hp556KqWNbK8otqevl2vckhNVTMuPfX03IrJV/JSHS/BH1WLju6xIEGUR87c/g493ztWEkXO7ddFqx7S0YXMX8t48AMDuVU+jqmQVvWArNyyzILL1+FmhUwaDwVBJyvLzzDPP4MILL8T06dMhUTfU8847DxUVFXjnnXdwww03pKqN7Rir20vgGteifbMOpNZu/OEetrm9nt14l+W7DBmbalfiiz1vAQBGdT7GNfFhvZi63E3NRR+9ZgRuU4HfSz+6DIdf8L1tjQ4a5Gu3/IhM/DAYDAaQpOVn69atOOWUU1znjRw5Evv27WtWozoK9oDnRMRM/9yDcHT3M6zrxyEiWSvb2/chKZIlqWFNtMK1HTXRipj7CEsKaiKtaWWxBjzndBkZdzEHesR3Av3XprGLH2b5YTAYDABJip/CwkJs3uweALt58+Zm1dTqSOiPXt2CYX8WxxI3wwuOtG0hNmE5fpCrrEgW11gs99bP+z93nR6RFFz9QxT/+jaKLTWtlEvG7vby5MRfvIMafpzih+X6YTAYDCBJ8XPmmWfiiSeewOeff45IRI1BIYRg9erVeOqpp3D66aentJHtF+uoJXsNrliPKl0sJVJ3KyIF486XFUkbAaYSkoOulp9sIc91/fIQUBkGJAXYVts6lhSz5IbaD4SPlcG5Y0Pso72Y5YfBYDAAJBnzc8MNN2Djxo244YYbwGlxKhdffDEaGhowevRoXH/99SltZHtFoWw/ACDZHlayIrtmcW6KIaMxy4+oRBGhxE9ECsHNohRrlFmYCqpttYK+huFHEz8kVhJDa/8adBBLkPDHBst3UlYJDElTYxgMBiODSEr8eL1evPDCC/jpp5/wyy+/oKqqCrm5uRgzZgyOP/5446HEaASjRpUeuGvtN0lR4PZY10tcJBbwHF/8SLKkCR6ViBx2dbfR+YUs26eMCa0nfvSdqv3ANWb5sZ+OWv/ZLSPtCkkCZ8vrQyozJ2idwWAw0klS4ufyyy/HhAkTcPTRR+Poo49OdZs6DPbaXnbRIcUMyNUDpJvv9nJYfuSQq6SSIUFSREcF+gglfqKtFD+sKGq+GsIJ2t+mub30pId6Buj2CAmFXSaylxIGI1OQxCA43s+MBWkiqZifZcuWsR8sBSi2mJ+QLSYjlvjhiHuAtBuNWn4U0RLzE8vtBbhbf8KU/moty48sqS44jlMTaTZd/KjlLtq1+HE7NpElOWQwMoFQ7Q6sXnAGdvx2f7qb0mFJSvwce+yxWLBgAaLRpmUbZtix5vkJydaHkxQzoDlxy48kx3/gSYpoGe0lKtGY7jQ38VMfbf2YH0WLP9ItP55A1xgLuh9HRxA/btmcCcvwzGBkBGXF7wIAqnZ9leaWdFyScnv5fD4sWLAAn332GQYOHIisrCzLfEIIXnnllZQ0sD1jD3i2W37kGJYdXSxVhsvw7rY5OKLLOBTlHOS6rIzGa4V9t2+B8X1p+bcYlj/asgxPBEiKCNFF/NRQ+jcaq8EpxhA/WqwPIRwGHD0TW366BTmFg50r2KyUhvhpz7WuqGHtis8LEo4A7GWFwWAwACRp+SkpKcGhhx6KQw45BIFAAIqiWP7L7TmQNJVQAc+KojiKmsay/Ogux8pIKf639x08veEu1+XUbcQXP5trrfXE6sVqh93Ho7mX3Cw/DdTzVGytmB/D8kO5u4zEhY2fe0ahU7e4mHYCHcwtDe6vTmOWHwaDwQCQpOXntddeS3U7OiS0VnCL75FjuG2IbfhS
ZaQ09j4aEQNuSQ3tbi9BG0pO1xXTES1FUuPuKmW4iR9jBBzdZzHao/Bq+gDSnpP+UccmDR+sDntn4ofByAjae3L5tkDSVd0ZzUehYn5o8cOBQIYSM+CZNMFg15jl56f9C11bppPn6WzkGnKz/NCCR2qlC1qW9dFedKBzPMuPLThfr6HWni2UmgtV6tHVrGrPAp4ZDAYDQJLiZ+jQoTFHexFCkJWVhb59++KSSy7B2Wef3awGtm/cxY+X4xCSpdjipwkD7fQs0KMLT8TS8m8SbJW537/3vxHv73gGgHuiQ1r8tJblR8/zQ+gEkEbuI1rQxGgQ3/7Fj+H24jgoHi02ill+GAwGA0CSMT9TpkyBx+PBgAEDcM011+Duu+/GNddcgyFD1PSxZ599Nnr37o3bb78dCxe6WRYYgLWwKV2qIqTF/uwN1cdYM3H1owc89wwU4bmjvsOpB1zY+DqauBicNwqHFR4HgWgxPy5ur7SIH5ixUjrErVgpFU++oXo53tjyCIpr/jAsP+263IMmfhSeMy0/TPwwGAwGgCQtP6tWrcLYsWPx9NNPWx5AkyZNwvXXX4/a2lo88cQTeOihh/Dyyy/jzDPPTFmD2yME7jE/9639FZ8c+1eX5RPXrLKblaQR7K6yeAHPUhrEjxnHRItAzjbPyrMb70adWI1Vlb9gZv5MdWK7jvnRfkMmfhiMDIQF/aSbpCw/33zzDS666CJX19f//d//YdGiRQDUfEDFxcXNa2E7hh7qrhc1TeQHaUp6Sd2ipMftJFISQ9IzKGt70teVXeKH0hHzY6/qbvlsEZHm5zpRDeyujJRCNirJthHxI0rq/6YgUW4vQcuELUks0pLBYDCQpPgJBAIoKSlxnbdnzx54tBgDWZaNzwwnbgHPHGn8JyEJLKOjCxZzu40//AxrkSZ+OE38uAVP0/Kh1d1e1OlLGrH80FxR+k/1QxsQP9zeUuQ+/BxyH34OpKYu4fXomB/D8gMw6w+DkQFUbPsk3U3o8CQlfk4++WQ8+uijhoVH5+uvv8asWbNw0kknIRKJ4L333sNBB7kn32MAbgHPfALRzG6V3mMha/KEa8Ty083fy/hsiBxiFT+NWX5az+0V2/JjCXhW4FyOoi0Mdfd9vdj47Fm+JvEVJT3mh7eIH8JGfDEYDEZyMT+33XYbtm3bhkmTJsHj8aBTp06orKyEJEkYO3YspkyZgkWLFuGrr77CCy+8kOo2txsUKiC3XlRHUtkTHbphLy4KALsbtqBX1gDHdMPyo1tGYmzzz70vwcvFDwAA/qhcrDdLXddF/Ly0XsSvpTL65ZrCovWkhDUztvpR0/FNceu0AcsPaMuppwmXK235IQQQBHWoO7P8MBgMRnLiJzs7G6+++ioWL16MX375BZWVlejRowfGjBmD0aPV0gijRo3Cl19+iR49eqS0we0L0/LzxvYNCa+lByDT3LPyMjx31HeO6XrMjy5gBuQMg1s1GVpQra5aon3SYn6giR9t5NiuOgUfb1e3uy9oig2p9bIcas2j3V56sdcEhrpDs4i1AcuPnBMwPit+X+Ir0gHPgCqcRBFEFFmoJYPB6PA0K8nhUUcdhUMOOQSlpaXo06cPeN50x/Ts2bPZjWvv0AHPq6r3G9NvHDwKszauwAH+bNf13Cw/sZBsMT+jC0+EqESxu2ELvtwzj9qm05UWK+anLur++GwtKWHGSlHEs/wQAj+fhZDUYEySiAK+DQx1V/LzzM984u5OQg91BwCvAATBLD8MRgbgzeqBSIN73CyjdUgq5gcAlixZgvPPPx9jxozBX/7yF2zatAk333wzHnzwwVS2r11DBzzTdNdEDxcj/MfN8hN7H7rbSyvpQAiO6noaBuUOtyzHJSB+dLdXOIbKab0kh3rMD2X5IW6WHxN7sLbEyZb6VxkLJdCalJeIGu0FAMTLEh0yGJkCJ2Q1vhCjRUlK/CxevBiXX345/H4/brnlFiMAdejQoXj11Vfx8ssvp7SR7RXF
KGwKHFl4gDFdD3qOleFZ4JKx/FjFzcGdxlimuQZRE+s8Q/zEeAa32lB3t5gf41R2CXiGM1hbJErbiPmhXXNNGe6uH5tuLdJjh5j4YTDSDzUII5ERqozUk5T4eeyxx3DSSSfhtddewyWXXGI8xK+66ipMmDAB7777bkob2X4xh2zrgueSooMgaBaNmOKHJG75MWN+rD+1h/PiocPnx11XHz5ud3vtbXBv15qK1lE/+s1Ct/aUBHfgy/0fI0IUa2FTCrv4kUjbiPnh9+4zPpMmiJ9otBLbuqxEjbxNneDVcv2w0V4MAHVlq7C/eH7M64XRijDxkxaSEj/r1q3DeeedBwCORIdHH300du/e3fyWdQDomJ+o9qYuEI6y/LhfFE1xe8kxLD8AkC3kGp8DfI5jfqwkhzvq3G+YkVa7hvX9q6fv/auuwCel7+LXHECRRcdyMlEcQ/wlorm9MvzmT+qC5pcmCJddwS+xq3A9NtS/pG6HZXlmUGz+/jrsWTUbNXt/TndTOii05SfzYw/bI0kFPOfm5mL//v2u8/bu3Yvc3FzXeQwrtPNG1ISOh+PANeL28vNOf3Fnb3fXZWNZfgA1cPqmYbNQFt7riAECTMus3fLjiSOZJVkBHytYKVUYMT/qn4gcAgDs8gFSbQNkKQqANzpYdgnFljhtmiybrqFMhO7LJsT8BKVSAFTeI724KbP8MChCtduQj6PT3YyYKLII0gQ3f1tEkSUgg29B7ZWkLD8nnXQSZs2ahT/++MOYRghBSUkJnnnmGZxwwgmpal/7xoj5MS0/Ho4z3F5izKruTnFREdkHUXY+2PQHPx/j6hqafxiO6fZn120ihuXH7i3K8ZjvMdtqW8OSYlp+ZBfrmBiptnyvRq3xWbdmiURXRpltcqYDlJvi9rJbtJQKtU+83/ySknYx2gkZ7HKp3LkIf3z8Z9TsXdz4wm0MyyAXZvlJC0mJn5tvvhmFhYW44IILDKFz00034fTTTwchBDfddFMq29huod1euuWHdnu5PdjjURutcExLprCpTqzRXqJN32QJphwpDTV5N02CjlEghKBerDG+58paIkcprC8NANhNzCGleZ7OAIAQryaVzPi4n2jU/Nykofk28VNSBgDggi38AzHaFJkcbLvjt/uhSGFsXXx7upuSeghze6WbpMRPfn4+3n33Xdxzzz044ogjMHbsWAwZMgS33nor3n//fXTu3DnV7WynmEPdV1WVA1AtP7r4EeOMHR/U6WDHtC/3vO0IYNQFS1NKYpho4gdWt5ddL/h5goMLdMHW0pYfeufEMoRdL1hq74OfsBQAMDTvMOR48gEAtR5VIGX6cHcSMcUPv3NvwuvVK3uMz4rdItjABFBHxnI+ZLD4addQ96hMFqDtmaSdqV6vFxdccAEuuOCCVLanQ0E/ok3LDwHfyGgvABjV9UgUV1lrPX1V8h4G5Y3A4YXHG9OchU0TR383Mdxe0C0/1nb5eYAn+v6avJumQe+bcEYFegAIGS9TivFHhoIlZDkAINfTyXAD1nragOVHUSwByqQ+GGdhk0i9VSTJUkR909T6zv/5twide3rq2sloU8iGZZRZHdKFtQYh+w3SQcLi58MPP2zShv/2t781sSkdD4WK+eGJWtx0UE4n0+0Fdei2WzzO3wb9E+9tetExfXfDFqv40S4ykoSRT9+v6fZSt2XP50OLn5bO9UOP2iKEQKZqoYU4XfSYGaAjnDn/rN6X4L3tzwAAIh4q4DlTEUVLJqNErVTRUJnluyJH4LnkbETnfggAELax0ZgdGSlab3xm4idNUP3OfoP0kLD4mTJliuW7mVFXcUwDmPhJDP1hbVZ1p91egGr9EVzET7YnsRF1qXB7NRbwHJGBbI/e3iR20wTKit+ztI+2/AQ5BQCxvFVFeHN+90BfeHm1PlaY1244GVziwp6NmYQjIPUNULLjZ4cVw9aAb1mKgOSbqQwUr8e+CqODEKzahI1fX2F8r9j2KXoecmUaW9Qx
oV1dzO2VHhI2B3z11VfG/yeffBJ+vx833XQTFi1ahFWrVuG7777DXXfdhYKCAjzzzDMpb+iHH36IM888E8OHD8ef//xnfPbZZ8a8Xbt24corr8Rhhx2GY445Bo899hikDH6o6ehWDIV6v+cJZ7i9gPiur6O7nY5u/l7wcn5qfauejTfUvTFi1fayC5x9DYpp+Wnh63jv6mepBlrFj/FJb5+iIKxZfjzEC45wRl+FBc0ilsmWHy3eh67pxe0rb3Q1+2g3WYqoVd11hPY9dJgRm/qKtZbvgjc/TS1JgCTuWW0G+r4uZ/6zqj2S8NnVq1cv4/9TTz2FiRMn4oorrkDv3r3h9XrRvXt3XHTRRbjyyivx8MMPp7SRH330EaZOnYp//OMf+PTTT3HWWWfhpptuwvLlyxGNRnH55ZcDAObNm4fp06fjrbfewpw5c1LahpbFFD+C5gLTiZXoEAAuHzIV9416wzIqzJHJOE6Sw0RpbLQXIa0Y82Pds0X8KEQXlLTlR22zl1dFj1dLEBkxLD+ZK350y4/i9UDspxYK5kvL4q0CAGgot8aCKXIE8FC/fwrTMHF7SuFZtibjk0W2VUhDEJ4lK0AaEov3agy7i8UulDMJf25RupvQIkjRBoTrdhrfK3Z8kcbWdFySegXcvHkzhg0b5jpvwIAB2LVrV7MaRaMoCh5//HH885//xD/+8Q8AwNVXX42lS5fi119/xe7du7Fnzx688847yM/Px+DBg1FeXo6HHnoIV111FbzexLMhtzaG5UcxNSjnED/xHyqEEIhKxPiuJ/wz96FZfpLIoqW7MXmb5UeU7cvp9ciUVqzvBRDCQbK9NSmA5UEc4VQB4eF8lr9hQVuvDVh+4PUYQ2O5EvfkojShqi2W77IUBaGsPYprTqfkyH5FLZEi52ZBOrB/yrbLUPF/tAjCtl0QN21DcPzfmr9B28g/KVIHRZGSSoXR4rRTy0/Z5vcs30s3vI5OvcchkD8gTS3qmCR1dhUVFeHjjz92nff2229j8ODBzWoUzdatW7F792785S9/sUx/8cUXceWVV2Lp0qU4+OCDkZ9vmm+PPPJI1NXVYd26dSlrR0ugx0sp1EVO5/kBGhc/duziJ155i8awu71ERX0Y10SsbeJgJiJuTfFjt/wAqvihg6L12B6vJnp0t6A+LD6zLT+a28sjQO7eJfH1bL+Bavmh33NSn4GbL3XmmDLIZIGZ4Qjb1BdJoQlpDuLhSHsAGVKkLiXbTjWknYqfhsqNjmm0JYjROiRl+bnmmmtw/fXXY9u2bTjxxBNRUFCAsrIyfPnllyguLsbzzz+fsgZu3boVANDQ0IDLL78ca9euRe/evXH11Vdj3LhxKCkpQY8ePSzrdOvWDYBaamPkyJFJ7VcQWv7C47Rd0Nk+vR4eHCHgCFFz5vDOtvA8Z/nbL2cIttdtAABElYhleV38eAShycfEEQJB4BBRVJP74v2f49yiidjTELAsJ3AEgq6ttHVaA0HgAc76YJUBcJzaBkJMy4+P90MQOAha/IyWDxECUSC3UnubCqdZtYjXA3QrVKdFxUb7V6GGMqsTIjB/IIAocmp+I0rU6H1uh1+9CZ6Pv0J03FGQ/pTctdhS2K+jTCcVvxkhzviScM16+A84yvieKf3CUWUteD79YihV/cLzLgMOpIZWu2+mmkw5X5pKUuLn1FNPxZw5c/DUU0/hscceg6Io4DgOhx56KObOnYvRo0enrIF1depbyW233YZJkybhlltuwRdffIGJEyfi5ZdfRigUQl5enmUdn09zbYTDju0lAscRFBRkN6/hCRAoV11yguaa40BQ2FkdlSMQgoiiICfPj4Is97bk5akiZNJhd+LW78cDAIggWdquaGaAgvwcFOTFP6a/D52IN9c/ZXz3+jwoKMjGvo3bjGnFoX0AigAAN4zOwgurgrj72Fx8XBwGEIbX70VBgVUctRQFnXMQkK2nsEKA7CwP8gqyEfEKhuUny5uFgoJsZO1T
26ZoWiAnywu+FX7rZJC8PKIAhCw/fAU56mdZQnaj7Y1YvvkE0RLkzClKSs5vJRiGfoX5vTw8LtsMf/8rFFGC98sf4T99bLP32RLo11EmQttxU/GbVXidDygPqXXddrr7RfCYIiE/zwte8KWxNSbN7Rev3xmKEQjwrfLMaUnSfb40laSHfYwbNw7jxo1DOBxGdXU1OnXq1CLxNR7tArj88stxzjnnAAAOOuggrF27Fi+//DL8fj8iEevNXhc9WVnxhwTHQpYV1NQ0NKPVidEQVNsZ0cqh8xxBZaWag0Md8SWjoqoB/rDVTcHzHPLyAqipCUKSZBSiH/456Ba8WjwTmyvX4701r+H4Hn+BwHkgaWbuutowKqV6xOPkrhchIHfCixsfAABEIxIqK+tRHTSDIqtq1TpZuR7gpO4yTjzZC45EIGrBuXUNEVRWtoybw565uaoqiOpaq8leAVBfH4Ik1MMTFo08P5ziQWVlPaIhLW5Jc43VVdVDrozfL6mkvmIdglVbUNj/zBj11Ez4yjp4AUQJh2BUhg+A1BA2zpFYiFH1kemRshDlG1C2ZzW69j/RXKCyptFtJERNHfTbXaR4J+pctukPhQ27Zkr2mULs11EmQj9OUtF/QZfA6braOsu2M6VfJMqHvm31Z+jc75TW2W+0AfuLP0Cg0yBwvBfBqs3oOuhvEDzelPRLJOyswdjQEMm46yNRMuV8AVQBlqgFqtljXj0eD2655Rbce++9KCoqau7mHHTvrlYrt8cRDRo0CN9++y3GjBmDjRutPtTS0lLLuskg2qN6WwBRG46vKFpgMYixXz3uJxwVIXrc2yJJsrG8APWtaE/DNryxeRbqIrX4c++LjdFiikQSOiZOMd+2FEXthwE5B2NTzSoAQIMWhyIQs49kKOA0YRIR5Rbru+o9P1i+i6KCiBi1TFMASJIEUZQhyApCWp4fD/FBFGUjuFzSEiLKUalVfmud9YvUnCq8rytyu8e3kJKQKuplQYDEqaYqJRJttL2S5vbitMu7vmKjQ2iJNQ1Alt+xblMgQdOySsqrXNuleL1GZurW7OemQF9HmUwq2ihJUec00f2cSne/KFRI6tYl9yGnxzHg+Ja3/uzf/An2/PGsZRrn64wu/cYBaH6/EM55DLKcuddHoqT7fGkqzXbSKYqCX3/9FfX1LaNaDz74YGRnZ2PlypWW6Rs3bkTfvn1xxBFHYO3atYZ7DAB++eUXZGdnY+jQoS3SplShF+X08qqri+fMnyPAqw+uoOR8S3CDzvUDAMWaWGlqwLPAmeJHDw4+q/clxrSIrD6QOduZ49dkdKgFU1YEq4ot3wlxBjzLBJbRXvWC2t5sQXWNGgkb01zVPVS7tdFlLAHPWsAyiTofXnYULTA9R1LFP9FiJ6Sh5mgSIiZ2XsVtX4TaRow3PiUVcQBsGH3KoAOec7oeCgCQ5UisxdOLbVi+LKZmuH9jRIPOdBKR+hKXJZODE1zcQykcgclIjIyPUPL7/ZgwYQLmzJmDTz75BDt27MDTTz+Nn376CZdddhlOPvlkdO3aFTfccAPWr1+PRYsW4dFHH8W//vWvjB7mDpjiJ6CLHyrwuenix/o2IUPGD/s+NkZ/JRosKBBa/KhCwccHcHjhCQCADdV/AHCeOAEt0U+w+c/UhGkQ6/Dsxrst06yjvRSjgGmOoI4G1JM9ynopjAx1dwAw6nqVkTX447fLURPYbyl0GgtZe8BlKWqQtP7Akwb2pRdqdvNoIUaCQXeRwjdvCLVnxVrkPPIChD82NGs7DBU9z0+3IRfDl9NbneYYAZZ+avb+jPryPyzTZHsgfwuhyI1fY83avvYbEI4OfGbip7VpE6leJ06ciEAggFmzZmHfvn0YOHAgZs+ejT/96U8AgBdeeAH33HMPLrjgAuTn5+Pvf/87Jk6cmOZWN05EUoUJT/Rh2MmLH4GzjyBQ8NqWmca3RMtbuFl+ACAsqW9dgtFW63qBVrD80AnaAp0GY1nFd45l
ZHVBbQWgQbP8ZAmqwDQSNhpD3Vsvu6o1wVzjNzvd7bUlpOYF2XDALxi99a/q8cV4U1QfZLq1T/2tZO1mLg0bBHz6rbpgKo6bEmJEklUhKdjOM7qdcdodC9+XP4JIEvxffI+64UOa01oGAEXSLLe8B7KW8LOlH/bJsHftS45pshRyWTL1tLQY1LcvePPNOnysxEWr02zxQwjBEUccgezslo1Uv+yyy3DZZZe5zuvXrx9eesl5sWQ6etFR3bctWNxe6kMkUfFjd2ttqrG+NXEJGvkESvDQgunQzsdiddUSrK1eDuCfRl4fo73aaj+WyLi5hUY0RxpU07MMBXuGnoq6iNM8rYZPmRYIPebHx6umZj3Z4+LsdZjAHwSuFd1eski/uTYuAjyrbdYOhaDavw/Fn41Hv2P/A39uX8c6MvUg00W1oieC9PsgB/zggiEQSUZznUkOF5woOsQPTyVl5Pbsg9zLmpai0X1oIo1ERXDllZALC5JrbBsnFe5DMVyNiu0LAQAcHwDh1FCFTBQ/YrjKMc16/QDh+j2o3PEl/LlF6NT7hJTt260/UimI9G3xPlP8sOKmrU+zryiO4/Daa6+1SLBze8csS6H+DJyb5SfB2Ay7uKGzPqvbTszy4+FMVyFt+bG3lbe9wfuo3duTIKYKXfyszQLe3D4bC3a6vB0ClPvFDHj2cZr4odx/zw/5rVVjfqwxC/H3SxqCDhcXrwhY3fcbhEK7seF//3RdT3+zB2jxQ21HT3aYYssP0HgckX/ht83aXfZz85q1fpuDdiOmoB5b6cY3jM8c7zPcLpkofjjeS31W4xntlp+SNc9j37q52P7rdNc4nWRxi4FKpdVJ0eIUA/kDqYlM/LQ2SV9RP/30E7755hsEg0HItgcIIQQPPPBAsxvX3lEMy49eRsIpfhoStvzE17GJFjbN4s1q8bT4CRrD5Hlte9b16Hpf4Ra6jj2+zgCAskAWAPdUBGrMj3k+hm2WH9qataxwT6vG/MiSKX5ksZGbadh5A+blxgWsHhdBFGKMKrG8tWrWRZIC8eOIPxJt27TFACVTn0rqVgi+tPFiru0S6txMheUnXLfH+Ex4j1HSIh1VxfW0FbHSPehBwZ16j0OwejPCtdsdriExbKbgECM18AQSz4Iev3HO/pClsCPVRvKbV6+TQKchqNzxpTpNkaEoSqPpL9JOEq7rTCUp8fPSSy/hoYcegs/nQ+fOnR0/WMb/gBmCbk0x3F7EbbRXYg+pxiw7iVp+cjxmmRC6YKpe2kIXP/aYH7qgaUuNzZE1q0angmFA/VLXZaoEqgEK5fbSRsPRgd8emWtVy48kJi5+iPbgkwPmKD5Ojn+51pevQfF316jLKjz4+hCQa75pAoCiu6XsQiUJfF/9bG2zKFp/e7v4CYabfvPsyKUxaLdiMwPHATXOR0eRJbN2VitbHUK1OwzL5cDjHkdOF6ufXJFFhKo3AwC6DroAO5c9pE63tZO2WCkpHLHmJnLKit9FWfG7KBp1GQoHu4dfJL4D9XoknIBOfU5G1c5FUGQRm7+/DpyQhf5jH8zIZ6j3p9/hXbICwXNPg1TUO93NaTZJiZ/XX38df/nLXzBjxoyMH1GVyRjiQlETGtJurxxBvVHVi4mZpBu1/CRY2FQfeQbQ1h7g2G5nYcHOl4w8OXbLz5+6cZitBdq2lDFFNz0XeApjLhPkANqlZI/5oS0/vMIZIqM1oN1etBXIFV30Um/8vBL/ct2xdIbxmcgc+Mp6VfzILg/RFBw3sT8koraHqG0fRFGAUBgIJJ5fSK9s3xGxHHsKHoYyleMnp9vhqNr5FQAqJqyV2Lv6OeNz6Ya3HOInGjTjxHx5fSkLlV38mP0jS6kcrh/72ti24uVmix+93YTwxrGF63YZo9sUOQLSCvmMmorv+18BAN7FyxFsB+InKVtqWVkZ/u///o8Jn2ZiumfUG5tA3eDyPGrf1oiJXdSNiZtELT/0G0eIEj/53kIUZQ9FLLdXtodA
0KZtrmmhDM+aS4e3jWzrnTUIh3U+HgAgEeubm+728tsCngHAK/Npi/lp1O2lCYeSHDOBZ2OWHylq/l6cwoPTziuL24tPndvLjj3mR1i/2fis6O62YBNjJ1KQj6gtIokN2Ln6cewu0ILe5ebbU3XB3fuwyfBlH2BYQVvf7WUeixSpds7Vc5PxfvBCFqAl+IRNpDVUmoWrU2n5aem8UuZQd8EQPxXbPqHmZ7i1sxVHyLYkSYmfYcOGYdOmTaluS4dDt/zIRsyP+XPkCqr4qY0mKH5SFPMDmNafAwL9LNO9vB+x3F6AGffzyKqWuTj0m7dkGyklcB74tKDIqGW0l1vAsyl+BJlv1QvZEvPTiOWHyBLqvVXYkv+TMU1oRPzQwpVTeBDNSkeLHyVVlh+3BwQlVEhDEIFPvjYXz8nSpjdN/HRUy8/eP55Becn/sLXbCtT4y1IyFFoX34JXq4Vo3BNa92HL6/sHQHjnC7RhGdHmuVl+oiFrHJiSQstPS4sP4/g4gfoNKDIw75KFFATfZwJJHcUdd9yBG264AVlZWRg5ciQCAWfGyp49eza7ce0d+1B33s3yk7D4iW3ZuXrI/U0SP9cf9BBWVy3BuAPOs0wXiMdoq93y0xqIYTUppGyLf+DAGUkeRVuGZ93y4+VdxI/SujE/TbX8hLzWumXSwQcDu7fEXIVQAeqcwhniR3Z1ezVT9FH9Jmf5wTWErFaaoHVYspIVAGrqmmb5URQj0aNlWgbGQ6Saql2mcAx56pAjpsDyo51/nKDFv3HpCXj2BroZn3nBWX/RdAtpWc1dxU+FZZ2UZqluafGjW36I4Jp8NuOHvbeTjOtJiZ+LLroIsizjjjvuiBmYtW7dOtfpDBO99ITbaK+mu73cxQ1PBBza+dgmtWtA7sEYkHuwY7qaADG25aclkcQGiGH1hidzNvFDOKO8x2+5wN81y4+oSIhy6o3M7zLU3SNzILa33ppIBR744yr0yxmCq4fcF7tBsoys1z6AnJ+H0N8SK7hojfmJLQK4PfuQ9eYCBHOs02Wf9bgVRTIeDID1LVqBAs6w/FA301SJH3okUn4e0BACoWJ+iCxjY49fsT9vO4pKR6J7oI86vSniR5YdcUXc/grI3WLHfLUX6GzGvCKApMTyo/a9UV5BFxUuMT8rv7gFDbWlGHjs40Z5lFRBn/uyW04dKiBY/esUP3LUWk5JcalZlixKC1vCTMsP72r58S78GvI557ZoG4S1m+D76mcEzz2tybm32ssghKTO6vvuuy8jo9HbGnpsSlQ7l3zUQz1PSI3lJ9FYn4T2AQ5Q3GN+WppQjVkLS7bdjAk4dNMerpwCKNrFGSbmDdEt4Nkj87Cb/NdU/4qKyD5UVOyDrMgxLWZcyX7we0rB7ylNXPxQN/p4lh9ho3vdL3s+FkUWQSgrGF0zKOStR/TwUUDF59ZRMamK+aFGiyk+TXTRlh9ZRmm+ehx7Om9AN9+Z6n5dhvDHwm1Z39eLEbzwrCQa3Lbw5/VHsEqN9yIKl9KYH067Foj+wmSvoSWFsX/bNwDU6y7Q6cBm75vG4oZ1TShoxsRoH/SGGctIojXVRWotPy0c80NZtrILh6N8y4eW+XzxlhZ3RAY+WqT+/fhr1F/19yat2xLxgukgKfFz7rktq0o7CrrbKyipSkK39tCfw7KEkCTCzzcW75GaMm1RWcHXu2UMzifon2fdpip4dReddb3qPT8CGGN8lxXFMnotWWRFwpKy/+GAqBrk7M3uCcl2s+YIhyO7nIo3tjwCmQBhJYgcAGGiBUiDN8p2EMpCJsicw8RN3/dEOQpvzFEX1LHJsrPSq+vB0DfvODE/WhtEznpDd4ofCXScO20t4GQe0kGDgZ/sAc+pifmhszsrXq1vbeJHR+SiRnLFphRU1a1Eis9rCKGmiKe2DKGSjcpESsnbtn7O8ZpIjhXwrLuXAXfLTHOhLThu4ifSsBcAIEVVt69+zdIvQPYA51TG/Oj3hN6H3Qpfdk9s
/uFGY5Yvu1ustRLfPGXZKuhzEnb8ZrUwK0RO/J6SDjK5HmITSFj8DB06NGFrDyEEa9euTbpRHQX9JhCU1KcdLX4CvACBEIiKglox2qj4iVW7Kyo3rRjgN7tlPLNWQp4XeOVEezAigeIy2itUsxXbfpkGZH9J7RfwpcDo9FPpZ3hty8MAgGtAwPFeKucQtLZw8PF+CAqBSBQ0iA0oBBCGupwXdNZqq+WHEHuCTvNzVInAixjih+4AKbEbFf2QaXSoO4DagC2o0yF+rN/lqPk2zCs84NWSHCqpH+3lXbzc/KIHQNK5g6gbpEwkKPoyTQhgNsRPwG+IHjnHGSPSHqFHQcmc1GzLj6JIxmhJw0KoW5pt4keK1lLtqEXKofbnVjZi5+//1fatirDa0t8AAKUb38QBh/xbXc8mdlJp+dELI3OcB5zH6ntORTyOw7Jln0+UhO8pyUAqzHNLSTTtBP1W2NEsP9dccw1zdaUYvbpSUDuXdFcXoArIXMGLymgYtdEIuvqcQeU0idbuaoyttWqbalzuJQQEbkPdQ7XbHcuKKRI/G2tW2BohQLQ99PXh6wI4iJAQ0Up7yEQ9Fp7qG9oN6HEJeKYTO0bj3VDpG5MkmWUj4kGLn8YCnuEc2m5/UNi/y5QrgJMFEK/f2K9+wzWSHDbz7U3YbP7mikfdJj0yi1D9qnCyaflpyugtLYO04vVA7pwPrqIacmGnZrS67SDS4icFlh/6fOMclp/YyQNbopioYhE/zmsskXIb9rw+LWH5AeHA2Sy/SgoscLoI1WP0+v1pOrYvmW7Oh5z4PSUJ6EzrUs8ELVkW8dPBLD/XXnttS7ajQ6LfBH6vUi8G2vKjf6+MhlEddVpvHl/1O37auxsPjzgWWYI6aiCs9EKVdCbyuG8Q4IqTapOnUQ3lHO3l9vaWgsEpDn7IU7AqaxOw35pmQb+J85orShdH9jxKgH2ou9PtJVJWEjGe+KGOn0hSQlmt6YeMFKmGLIUdN1fAFA4KsW7V7oKwZG5WZMuDilN4EI+57UiwAgCVM6W5GZ7pE8Cw/FDtsZVlUTzOZRrDEEoeD6KD+sH38zKQcObVoUo1iiJZLC4y0ZI7NGOk2/7i97RPnOlSi1Hegg6A3r7kbuSc9TEEby5SBv0SYBf0jcTbyGIInOB3iKZ9619F96EXp6Z5FvFjt4ykIPBcu071bfuye1n3T+SE7ylNgdTWI+v1DyF3NrP4J2xRpH4XvqIqs91yCdK2W9/G0Ud7ebT7WVe/1aRvZnl2PjDeLF6P7fW1+Lp0p7oNzosK6WxIyEOlfHbSbaLFT9R2YRBCoCj6aC/zJqzfLM8IzzGmSS0gflZlu0/XY4sEXfwo1v7iYlRQ97jk+ZEogRFV4ogfuelvQvY37HDtzhjb1ren70NLVmh/27Wk97eKgkElo8F5zPOprkITw7rlp5lZfcVBReYXQY/nod1etoeafl41xWSuW348AqAlVCWR9h/zowof8/ySOa3PmmF1aKjQwxBkw4JPYpS3sIuhyu2fJb1fNyzuX9uoLdrd16nPyY51dSuz3fLDuQyZb0YLAaixRi1h+dFj8/Rt291fhtsrxXh/XgauqgbCFuq+k+h9wHY/5yqqUtaudMHETxpRoEBWBES1E+ug3ALLfL2+1+LyvTG38cP+3QAAL+eHgviuMZ1ttTJ+2ed+cdHi5/0ttngYuAc86xaIP4kfGdNa0zJK9OH3WtuimhCQFat4AACJEkaCzFncMwBQHi4xPse1/CTjA3cMV46hECWr5Ue/OdbtX2bbHCUwqPb8adPfkNVjJAjhkF04AgBQX7VNXUyP+dGESvWen1Cz79fE2k9B6lQXW+SIEVS9sNiWHwlawHITRLEeVK14PUZQtWf1xnaTZyQW9grlsh6X1ozj1sVx39F3GNNiFTZ1xLWkeKg7bT0Rw5WWnD205afv6KlaQ2n/uTpfjwPKKjzEMj0lGJYfYuREMtvXvBtbuG6X4Z7WLT90fi5A+71b
Iq7GRbglXDTYnnKipCzGgm0HJn7SiKzIiChmjZSALajZq7kovtu/G3UxhryvqanAlrrqJiUxvPFnEf9dIWJjlUv1Yuocn7dZwrpKehn3mB/67cGrqBd2S7i9YlEbrQRAW350K4gWuEiJH5m6sXsU3qHSttaZ+anixvxQHZVo8LDzIROjk4yCt3rla/fgKcuQYermzyk8FI82AksrZlm1VwtQpkZ7RRpKse2Xqdj602SITQxs5fdpNz9CqJFctOXHaonSxU+THuCU28sYTg81R0l7pq5sueW7THTLT/PFj6VmlCF+7IkkrecpL8QwuSbbFtv29cKlKqarWrdQ5fU4kl4ZshRGXenvAIBI3W5jeuraZ1p+6FF36rzmiZJdK2YZnw1rld3yA7llhpO7uEwTtuDY+tf33ZIUNCi9MPGTRmRIUGDWqbIHlMvUA62BepOWbSfi9oYa2Llu6EMQiAdXDr7HMp1+4G6rdd4w7KJlTwP1kAcQa6i7Dge1na1p+fFoNyjD8qOJH9nlbVCy3+htZl86Jiiu+KFv4Ak+lJw3Tvf1iMPy43FdLpblB4AhSLyB7gAA3qNZBakkh/poGsA6wicRFE39Sgd0NUtmROPE/OjH2oSHFDECngUoAfOhze/e16S2tjlsfWSKn+QvKjOxnnku6W4XRbRl47anknApQdEsbNuvLfmF3rn6l7oX9jlssjkbssXlpQ+HT21iQtPy4xjk00zLj6SlEejU+0Twmlva/nKjEKX5MXluuMToKP4kRnsB7SLLOhM/aURRFGPo+Ij8Lo75UbqEAHXyVUasIzDW11Q61j0gqwhPHbkIozofj6m/RvH4H+rN73+7rBfvtloZV38fwfd71ItNtF3bOR7zJCcxhrrTF0KIqHV7rv0pit31rWP+6aElOBS009l0V+lvcJTby24tsam0etEUBG7ix//R/xB48yOruyzRh5L9xhlLCOgBz9pNONaQ2LqyFfTGjE8ExBha7svtq+1KnW8mOZSto26amCFXH4Yud+lsjkoRRUBREHh3IfyffW1bQd9RE8QPbfmhhuTqLrD2ij2w3Yz5Sf560oeCc7T40UZ9Sba0C/aMz6nO9eNm8fzjo9MhSxHjnLTk4/Llw5vdU1/ZIp4M4ZBKV6hu+XEtPdE88aNf0537nWlMc8b8yC3z9uiWmTbRfrMv1xLirJVh4ieNqMOqnXW9dGjxE6E+76i31XxSFMcNRdD8yFtqFKytVPDtHhmSomB5GSWoAMz+Q0JJEJj1h6Rty9qGbPq6JMSIXLVeR+5vAWsqWsf8c2rPiwDQMT/aUHcX8TM0/3DjswI4Yn7qombApSPgWZTgWVsMYfsecOVV5vQkLT8x31Z1k7ct5sfO3tXPUBujtqWYVhPzBq61URcOkYhlnUSGF9Poo64Un9cQWkSUQIIhCMXbLW44de9Nt/wgagY8y4VmPJySk1o3TKbhyN+kWX6aU+LCUkxTQxc/jrQLjtFfKR5h53IcshTSYtqclh/1u5mQ0a0cRypjfozrtAXEDx1PpOMmfloti3LCL262wS/tINcPEz9pRHV7aTlqXEySUephGaGHSdsuwJpoBFF9msKDE7siIqumalqk1EeBX0rNk3hXnWJxc62tlB2WH/qcp/P8WAOe3S+EfcHYgdqJUBOpwJKy/8Vdxs9noatffSsUtLdAex4gWvwEhGyc0Ws8AM28TOejURSL5cexHaoulULfnJO1/MRye4l6zTf9DbTxgFN6SwQE4sC+xjd637oFhQRDjWbajb0zxRRoPO861H1f/jbrOqTp4kcXcPB6AJ8X4qB+ibexDWNY4bSuSmnMDxXDwhvix2b5sbmGU1k3S92+ejy9D70Z+T3NuoOcEKDEgS27vD7iUY6gYvun1Az9/E695cf1pU6RGx2O775JCZU7/mdkqbbU5CP2mB8FpLIaqYbb7xLcnOC9y15jrz0kOmTiJ43Qlh/BxfJzYI75tktbgSTbiVgnRrG5Tr1Y+Mhw
8JHD8cwa9SZHW09/KrGe6J/ukOGlzoCpv4oO8eN8XKsXqsXyE0P8fLHnPdfpifLQmsZzS3k4MxZE0ISZHvBsigdiW4eKYZBo61rIkj3anh2bhEzxQ7/5JPpG7hCJsW6iuvgxhkYlcLO1t0E/Zu2v3hem+AlbC0U2RfzIsunF4nljtJfupopyYWzvusravKQsP+r29OBtI+i5Hdx446ELFV57gTFGezXjuPU4GWvMjyl+6Ae63bohNzFLfKNQAseXW2RM5oUs85q1Cw9NDFXu+B9K1r5kTM7qPMy1zc1qnu5u1vYp+ApsCzR9XzV7F2PH0hnmBErcuVl+Agu/bfI+GkPYtts5MYk8PwDaRaJDJn7SiKLW3gYACC4m1vH9hhifreLHeuKFZQm12mgwTlIr9C4rU28eEWrR3/Y7T1jBtttII5YfRVGTndGxQPRD1OP5jlq7eSmeS0O7Gl0mTMUr6H0YNR7kevyA9UZqvEXaYn7s+YHsZTQsFzzt807Y7ZXgUHfNgmIIFtt6netUS1dBH7qgqtX24/isx/zoQkUSk3d70f3Ac46YH4l3KVaZjOWHcntZ2t4O4g3ioQtRQVaFih7zQ0LJixA9uJ2nkhWaw7hlS9JAu0hPdYkLhYqp6TLwHNvMGJYfTcQHqzZYpvccfo2+YiobqO8UANDvT/egoN8Z9AJN3qQ9Cz4dT8TxXvQ5/Hbju0xaT1jY3f4xscc7y3JqrW1pgImfNKIOu44d85MleDAwJx8AEKGLYtpOuqgsIeziB99cI+PO38wH+vIy58m6vso6LWwL+rHHAIWiaqBeHhVzSvvgBW4fZG4/AKAhcr6riVhRFGz9+XZsWzI9pgl5d8MWy/eG8Hkor30dUfEgy/SIbFpjeJvlxy3mh/5uj/mRbTf917c8gh/2fUI1nNoG9QDOenMB+F0JuPgSHOpubFuP+bGNBulUr47gqtz5PzOQmdoWAaGCNm1uAX1klijb3F5NKDtBWyAE3oj54csqkf3ka/EfDU25X1IBz+oOzJFq7ZmqXV8BAHitvInMa79lMDnxI4shQ9wI3nxjOp3DxuL6stf6okYFpoLaferoLkVR4PF3huBXB3so6kR1Icf9UAvUp6y2HO8Hr9feSumDWLf8qOdbTpcR6DVikjE3meHujnQVNnHXud9pKNBeaqqzSpu8/aRJMuYHsIYBtEWY+EkjiiLHjfkBAK82PeLi9tIFU0SWXcWPm9hpjLDdM0N9JoSAQM3jU+h3t/z4lTpwcldtemfIcLZLDFeipmQxqnd/G3OI9epKax6J+vBVkJXuqA9fBgAYmDscADDhwDuNZTya7zwaJ+ZHPw7AGfNjrxYPwCiqqh0QdRBWseB/73PX46Cxx1bENJ/bLD+di/5szCrwj7T8JpH6PfrGLH/scQtGcDUtIBqpsRQLYyg+oD6kBCp+QZbV0So2lCQS9ZlJDgVn29sxukARJM3tJejip/FiuG5I1HlnFDWF+kDW8/7Q56Y9oFgfTp5q6vcvV9th7FgxXU72R5ORldo812QpbNYnS+FQd9PSStew4VzmJ45d/BAXq7jEpSF7eRPdXgr1nOL2V8Rauk3AxE8aUS0Tsd1egPngLg+bNydRu/j0pIhRWcb+sPPGKCYRIBm2x/xQm5AUAQrU3BQHFdARz+bNkidWMbOz3lljjDb5imHnMH0AqBPdA/4kWXXrHdf9LDwx5jOM6WKmwNcrtuvuKzNZmf0t0rT80A9Su+XHAW1dsble9Ad1PKr3fG/foOtyolSH/bk7DHeHJ9AVh/z1Mxzy14UYUHCJ5WiMh5ZN7BgBikYJA+0PVdWdvomHqrfGbTu/ZQe4Mu1mp/eZwLvm+zACdBUCL8nXdq9Y25UIEavlpyO4vaRoHcJ1avkB3b0pc1rfNST7pq3/zpwj/k3P9VO583+o3v0DKnd9bZRf0Kna/W2S+3ViKW2h78dokxLT8qOLIdkyLF9p2YBnOi6Hvj83UfzIYghVu+ypH5zX
TbeaIgBAWe4uyFkJ5t9JlFhWZkkCqWrEsheNwrNqvfqZ4yDpxYVTUOojnTDxk0YURYKixHZ7AcDaGvWB8+yW1cY0PeePXxM/EVnC2mqnCo8mcW6G7cleaWOHpAcXK8iiYvT0N8UoFFTaBiY9suYGxz7oN8u60uWu7aBHXVnWhV9rlwI/b63n4wh41mN+Y7i9ANOKATRN/NitD3QGYjfqy1c7psVye63t9Bk29FxsmL8J4cALAfBCFghvfWM038p1oRer6XbLj2wRrSXrXnJZS4UrLUfW258i+/m31Qm61Uvblj3vjm7l8YkB08Wox/w0QZCbMT8dx+21fYmZlNQragHJuvhJ1s3gMrxaR3dplax9CduW3Ikdv96LkvVvOtYP1zUef5dQU6gEhb5cffSemY7ByPNjfxnU2i7Zradm6H1So7Bc22i0ITWWnz1/PI2GynWWaW45hMzfW0RETq2rkS/eHnNeztNvxF3Xu3g5fD+o5URAYLqh23jQMxM/aUSGDD0oOJblxw3d7RXQHgYRRYafd5pR7SO3dPrkEPSKkSolZAvyoTchK1psB5GNYqKA6fYKcYAM6xtLWHZapCyxJjHM1Y5MzMYKWhyEy3p6biPD8uNS1V39pn6XE3B7WdazKkFre/v0jLtuXdlKl6nux17vtQ5J1UtUAHBkadUDlR2mekeiNmvMD5GkGPlSnHC2+j964K3i1zIEd+5kma8HbHIKDxglW5IPeIbu9nIroNrO0GtWAWbAs8JpD+MkxY/iOBfiY7pSTaKhBGtANQJtVeo2RM3PZU2AGWOYudZ2u+vYekypsv7o20mN5afCrTCsS8mafKmP8VlU6lJqzbIUM20innWU9Z4QdZADmhAsnaEw8ZNG1AzPmuXHLftmDHS3l99we0lYXF7iWE63/NhLUfxzMI+x3d1/+hKbVrG+qOvZna0nfekG9U2xhvMgolhzsUhKLuxYAgZjBNrKMW8werIz542B126Yv4bXoz5aYyxjr+pueaOzWH4aCfql9snvsZZY8KzfDMR5OMnRBpftxd+dDiG0+LEei9mX9pgfY21tOc1nr4mfrV1XYtsSM14KiOPeoPtLUZD96gfqx4BV6AY9tVhW9BnW9lbde0ThAMFjbY7td1NkEcXf34DNP9zkDLqO2Ia6azfd9pBdNhE4LeA5LFcgJNQn7/aKk7QvURyJEJOktnSp8ZnXaltZRl82kufHETdnubZTJBZcrU/JW34I5xQ6bkKU+LMRiKj3S4mTLOVimgO/aRu8y5yW50ThKqgQBELMcjbM8sNIFnq0lyfGjal/dp5jmmn50d1e7iehnsAwYHNF9QiQmG42O5b8H/qIC9tNhtPqRu3yqPE4kmC+KdTIY1022nh+mVguKL0NbhajUM0O4/O66qUxb4WWm20TLD+WmJ+Is93CztgjvmSJfnjYgpBj7MNYmrb8EA5das03RFMwWOObxMH9teWJZb5uRdndeb1jP9uXTHdvPHWq0FYgeui11KMrirv/jgZfDSRObZNMJEBve4ycRaHa7agvW4G6/cuMWBcAQFQ03iwNt5rQ/t1eNPpoLwDY0WW16zmXCDFz58Asf+JGduHBxmd7HFCy7PjtPpepTtdVrDw/jpQMFotMqtxezrgjQggVP9fE88/t3u42LRIFJ6vnuEykhOIIEyHrPRfLk51EhRYhpvW5jV+HTPykERnmaC8+hvi5qK+a62dYXmdjmiRbxY8bPqHBrK1luyf0ynbm97GTo22atvzowsNu+dEfwEEtWRcR1mnLy5BhjctRl298iHVsIaLFmbjMiVLtWlu91JGszESPQ9FcWdrNTh+Z1snTBX/vfyMA4MDcEVTDY4/2AuK7JejjJHqhSLebtcvbFF2PSeEIvFIAWUo3bRPW4G4AiA4ZACVH73drhmfwPGRvYvmXSEMQnmVrEPhokTmROiHEIQOMz+HjxkDiraNVivaPNGKU9AewPdFafdkf5vaoIdV6XyocB2jxVEYZ
jTZ+000UXjGv74rsvQjKZcZ3KVqHqt3fJiZKDGuK83fvPeqmmKv5cnohq0BNLaGkSPy4YgQtA2ZRUfeYH5rC/n+xWHFTlujQuPfYcw2ZJTaagmOYO1zuSYoCriGouoqhxv0YAf+tQKIuVYXjDLcXC3hmJI36wIqd4Rmgh7o7y1s44nwsQkXG1hp1Qq4tFpcQErMqu06BNpTdcnprFyYh1oe2nv4+QvTsz1XqcuBAlIjDRZVIfhnaKiLJhdQc2bENo81ZvY3PP5Z+inX+nVo7rBhD3fUO0x6muquNIzzyPJ21vVk61dyGi/iJ5/ai31hNMeMiftxEFeeM+REULfBbtrm9QKBk08OZbccKIJqVmNXP++0v8H9hHaFGIqbAkfNyjM9KwOeo5+WRfNRDzPw9uX3mQ3zPH08Zn/WK1wAlfgJ+88HXwdxegmT+7qIQxkqvGZS+7Ze7sH3JdOxZNafR7bgG8GqQOBXbIw2lEPzaddCS4seg8dFeNP78QWgJt1eszPBIWvy4WX6s925Oc6Prlh8phZafREg4nozjDLcXYW4vRrKotb30mJ9YeX60oGaXPD9+h+WHyoEB2RA94w8UMDBPvZCvPEizNMX55bMFoIsWzkFbfmS9qCn1IFNFiPo9rD2kCTEvJIFUOd07tPiJEWejC5Hjuv8VsmKKH0KC2nznje6M4VMt39f7dPETO8khAONhqrvaOMJTNz5a/FCfKTOxWKSKrng3A4u53jCfO5d3C+a1pL/XrR+KXutItGyLKDBHY6hTHG2PehLLJ8LVOeOU6JtkdMRQ47N8QDfIOQHLsnnBQuOhpVCCmd9TqjVJsZXYMNtliB96yG8HGO1F45UCMeepRUCBiu2N55eKFUcDABwXW/yE63YbQ+GtbtvkKeh7OgAgp9toairl9oqRld0uhvz5A1FY9GdHPFpKiBl3FPu6bSp2YaXHc3GKfr3IRmHf1iBhlyrH3F6MZmIG9MYf7eXh9JINzgzPHsJZYoWuHXSo8VkU81CqxQZ+tX8DZh7lwQeneXF6X31/1v3QQ9f/30DeiKu13E6I0/JDFz0s9mkPZphviYoScLiwErH86P1TlDMUvQLmQxaKNsLIJV4mJ6sn8qnNxYp1sA+/1t0oejt5wpsPbUu1dPOzLnSiBw2EXJCvNTr2TdHyYCexXXfulh/zAaXnugkRNT9StSNImViHnhtCy9xbjXcfYhGqNeOm3FxwepyP1L2LWSEeAAiBHDDrrPGSoPahvn/6J4hG4VuwCNs+uMwihHf8dp9hJRS0obl0ULXSAUZ72elGDrd837p4Koq/M2ve2etCuRFz+DjiW34ANYsykDrLj96GnC4jHdMUhbb8uLuqdXoechUIJ1gsQvESHfq++AGBtz9J0FUTY3RckpYfp+0ZcLjU9Os+oLqrFSIbtfKMVikKti25B9t/vc9hTW82scSPfT/M7cVoLvrDXWnE7eVxyfAsGu4ZYon78cV4i1tSsQchyXoh2QeXNVCzA4J5YlhifjRrA0eLH8qiEeH00WAioMXPKIrfMXIrkWriMiVEorJp0VLgg6IAh3U+zrEO4Tyopp4FHkUXYzGSHOp9rj1M9VIZHs5nrBHL7WVuinoTipPDho5z8gS66hOdmxMlGAmKNPS3b3VlbQQQp7qIakoWq5uiszV7zE4w36nN+VEu9lv8zt8fNL+4vNmR+qBjH+aOqWSX2jBtve0SNVqIhMIg61ejBtscm9CrXkNzr1neSDuY5QcA6mANoq/Z+xPqy804Kbd4EgfGueFi+YkjfmQpRGWATo3lR7/23UVb7KHuTiHC6zPojcfcr3fZaghbdoLf4RzG72yje3+ROBbbeJj5jKht2Y9fEzrGixGRHdYYMVyB6t3foGrXVykpORLVB0UAsV1s9j6l7nfM7cVICv1h1FjAs1e7GMojIWzRKrfrLh+eEOR5zJuXN6YJW0GtaD25g3Fi6XxU4t4lpTJWlctYX2UGZxM6Hkesp9Y0JQOg
V1b3O0ZuVe38ymxZLMuPJp448CCgzf88Zo7+FAW+bo517DcUvQp7zPIWHMHarK7YVqMeT11U7d8cIY+60SlAQwjCxq3ugbaEM5VknJuinpm296G3gNPdk255diIRw/StI/g6GZ/dRIckNmDfurnmsXrcLD9UWzhrO4ef/YXxWQypFiUEw66j10it+nsrWU6XDC3A9JFKgk+1iklR82YtrN8CiZi/u8UFolsptDpW0ZFULbcOkOHZjkX4upCQ5QexrClWq6JjPVk06n+lKuDZED+EajeVpTlmTiK7m8gYPk6Ln8YfxgkVh41VX0wXJk0e6u5xTNMtasZ37boCp+cxUxBu2IvafWbeJzFcZXyu3PklosEyxIOUV0LYsMV1nhzwI3TOqWa25liWH9u1pliGurft65CJnzQh294uhBh5frxULNCNK76HrCiG5UfgONRETXdKIOZbnGxZDgCyndejAUcFRP++X8HdS0XcvkREVFIvWEKNqqrc8SUA/QZLJ9TTEw1axU+4difKNr9vfG/M7UUIhwJPH8s8gbhnaCSEwE/dlyTdrRXD7RUmObhu6F9xw9oAFEVBvaiW5sgSci3D4bPmfYzA/M/hXeKSqJAjhviJl/RLz/Mj+DqB26dm4+a3ObPmctt3m+Uh9GkCNWLO53wY7vz9YSN9vshHbAJJz/NDWYZs7gH6AatbpQLz3YfHkjpN/ATcHsqmwgr61L7kvWqqBhFmfha+vNIo3cELOdYHob4fOuBZ33o7uek2BV6IHfcDNC6OAJiC0jXmJ/aNQJFFIyYoVW4v/Xq35r6hy1vEykbtboWhj8kecG/OoKaHG493i+UmNF+Imnj+uSxvt7jx29VRkHrNL4XIWL3lDmz56VYjQSothPasmoP1iy6Ju9usNxcg8P4XrvOkfr0AjoPcRQ1ot7vYzAVtZXwUhbJ0M8sPIwlMy4/u9ooV82PeJCRFQYMkWgqbBil3Viy3F4iMmqj15nVMDw5n9jX3+adu5s2GI0C2PSgIQFgLwKTdXpL+UA90g6LdxLJlAp9u+VF8kKjipmFb9tjGAp55wmNQjjVXkL34Ks3/1ZgjkORGxE+QM9MHiIqZVdrDec2kapDBa6OT+N3ORJIKR8xif3HcXvowbt6bZ5iLSYlL9WYx4ggRoIMjZe1NbVDJEQDUN8jq3d9YV7DF4mgtNdtMideBxz2ubsejCsq8A9S+jpWzyHhzFpwPTbcReHohTTHf+qYra5Yf9eFN95v2m0X1BIeUMNKOK9l8N20Bb7aaKbybMkqd0EhiwmwqdiYmccpbxIv5UeSoYflJVcCzIX6IU6BrS2h/7cLD3QqTkNuLcs8kNs7RPTM8XEZOJobzmBwWOz1rsleLaaSuUT0dhD3BoxytR0wUxXXAQviEIxEZeRDCJx6pTmjkmnK4thTFjPlhbi9GMhiWHyW++PHaRoHVRMMW8TMkr8CYF1sUKKix+XQDAsEVB5kXIF0KgyNArssL4e+lJwJQ3V41JUuw4asJRvxBp76nQb9ZDOC7Igy1XYpUhJpIhbENKVJt2Wbjbi8Oi0uscQ2XfxdFWHK/AXUlARykXfOxxI9xE6MmRyRrgDRxCRR2hVBBvXHehPTj1t1AAIz4HRrPz79avvOeHOsChEAq7IS8YBf1q8vDyxrzY83wDMCwuhzQ9a9G4Gn+Acfoa8c8BgDgd2kC0DZcUJFFRBucgdRGwKwcsYwOk7Q22MVP1S5NyOl9Se1HD+QmoTD8H5uu0/aEbskplNX8Xo09rSt3fIFgtbtrQydmpXRY3V7+vKKY7UmF5UeM1KJm74/ahqlz1PB60bW9GrP88C7TY5y71HWpxIitjIYqsPGbq1C+9ZOYQdfGPpto+VHiiE9151Gz/ESOnuGZHh2qrudaJiMWMSxcYv/eCJ95AoJ8JVZ+MA5LIvdid8GG2CPL7Jaf6lpzqDuz/LQeW7duxaGHHor33zfdJuvWrcP48eMxatQojBs3Dq+++moaW5g4
ihHwrMf8uF8Y9lw+DaIISdatIpxtXqy9iWiQ4r8t14nAAZp3ZVgnglxv7LsuTyRs/fk2hKqL0VCxRp0o+KDfqTnaFB09EvvDprVHdIifWAHP+k2Qhxx0BilurnG/0XG813heSMT9psNDz6Vh9m1Yspq76cG3cRF4M+Ynxs1AUWRI2lsa78k1h6nb8w3IssPl5WZNgc9nxNRILm9/ipcSRC6WH732Fv32TRKMZ9Drm+mjznRqS3+3fO9drsbq0A9P+nj14ySc1yIwSzdqRTX1WAPq/KdHsXlWbwSCrZF7pnUxLCP6z55AJvadyx5qbKPatlzED7V9wdfZEl/W97CbQfjUWX7oQG2r0DLd5UqMUhyRBqslkhgjTxNIckhflzH6s2TtiwhWrseu5TMbdXs1NebHUYLGhrBus/lFi+Eszd/mWK6xkXmWZWOIH/0a2vn7w8Z5sbXbitjW1Hhurzbufm4z4icajeKWW25BQ4NpyqusrMRll12Gvn37Yv78+bjmmmswc+ZMzJ8/P40tTQyzMKce89O42wsAoopssfzQ1EasF9chPdYhGvgfQBSIjaj0uqiCx4/24PVxHuR6CfLiXGc+3uWhw5vixy7K1lSY9b1C1Vst82r2/oyoHmRLYebc4RCSnRaSSIzrjuO9xj0mxKsPkiisFzbP6SOmTFdMOIblR4FiSeZnRwn4zZuBi5VIlsKo2LYQeqN4On7HfjMUJRfx4/zdFIE3Sx+4iCNLbhx7hmcAim5VU6hzyxbPIPVQY3+CZ41zbF9d2fob0w/HXhVD0K9suLoY/fCkzmXd+sRxPvdBdFowuEUg2qrHJ13lPIMxxI/heWlc/CiNCJPEC5sqGHrqmxj5t09x3D8Xoeugsw3xGqwqjrlWbelSBKs2NdpO/Rzx5fRBdudh5gwq4BmubjGgU68TLN9dY4ZiWGkbs1AoimJaHNUp1u2aO9WWb6LFw7DyJxCQ7VH7OyKYv6kcrYckNiBS54wRjEksYaINhrBb4GNZfvi9Lq55NtS9dZk9ezZycqwPoXfeeQcejwf33nsvBg4ciPPOOw+XXnopnnvuuTS1MnFMy4+W5DDBWlsRWUJUD3i2ix/b+bu8ervxChlt5MLrlU3g4QiyPeo2cz2x2+MqfgSfORTedlrN3zwMm6q1EVX7l6uL+7tocxVs/Opfjs3p4pAnPCJwBnWGYx6OYtyy9mapQbfbpe2WJTxaodByDKG2ZyZY4whncRfFizGhxQ9xifkp37IAu5bPNL4T3ufqigIAEo1afP0AkF043LlTQbDUfXK0yW+KHyNfkZvlh0qK6Xir1fKOKLnZkHNdAsxtlh/afZnl7QsCAqlXd+PhqUhhiwvLiPnhvHB9I9b9sLTl0ya4SNBe5LLto8fAadowppuGhvfkNbLR+IVN9dFIvpw+4D1ZELy58AZUt7X++4mhMtfcMsHqLdjy4y3Y+PW/Y7qwjWaI6n3Dm90r1hJGSgjHyE37kH76u9FHMW4KdGyKyzHU7lsCWWygFmks4Lmplh91eW9Ob/cFfOabpi5+aOrLV2P/xrddV3V7cQRcYnX0tugucXt/ulmKJAmBBS7uZT0+icX8tDy//fYb3n77bTz44IOW6UuXLsWYMWMgCOaFcuSRR2Lbtm0oK4s/DDDdmJaf+EkO7URkGfXasPVsW9Bpjc3yQ7+4xLL8PDZWwOl9OFw5zHqz8cZpjodzih+Os1p++shLLfNLGtS26YG1gTwzx4QYjm35IeAM8XNk1HR3RmLE/BDCN3pS89rNXoZ5s45IZgoBov0DtHiJeOJH4KHEcXuF6621rFQzfYybdVQ0LCKAmg2318hrYUcReNf4DQNamBheL7O/RC0DN89RVijbjd24sfE8Gv7+VzOoW9+czR1L5x3JOukSRIcPQeiM4y15YmgrjkRZfmjxk9NNS+onOd1edtrjkPdE3V6B/AONz1lUAVLXbRqWH/dt9R/7H3Tudya6DRnvmJddeIjx2c31FQ3q
lgEFkqPiuhV9fU6wP+DNQOKYeYDsQ92p+6XpWo0xkkuOL370bNnmMjFidJpp+elx0GUoHHAOBh1vLUlCX0vE53zR8AS6Ihrc77rpaCjGc87F8hM59GDAr/aVQ9hFXfrOZQRYw/izzXtBGxc/jSeJSDM1NTWYPHkypk2bhgMOOMAyr6SkBIMHD7ZM69ZNzf+yd+9edOnSBckiNFb5s5lwxsNbPfF9Ap/QPmWiGMPWC3x+y/VZF+fFSyKK6/YHFnC4psC5vD/OUHgP57xQOC8lfngeB8hrsJMz87cEZaLuX7u5+fP6orbUHLppb5tuhfEIAiJQ34yOiC6A3Ov/8GupjD8qgBP7WNfheQ4FPUcDOzfDDr19n3bzFQlVOwkEhNNcUxxvWNVIZZXFbP7YgHxUejhM31AJAoAXeENseFZvBPF6EP3zCcbyctRqXqbbUa/sQgH1nSgyarzq8t6sHhhw5B2O4wAA4pZgkN6Hhzcq1/L6jVVRwGvio4bboe5DyDbaoy9H9PNE0cUqD9KtM6JnnQgv9RbIeQTLsciiKn66DPgrhH59IfbrCw6AZ6c62kuRw+AoUaZbfnjeC4XKCM4RDgIHcJpLi/cJ4GJcF7wigzTjOtX7g49X66WVsVt+iEsKjL6H34yuA8/GzhVPonTjO+BI/PsVz+nix/0eU9BzDAp6jjGXp/rFl1UAwnmgyFFE67fBZxNaHOWm5YkY/x6mqPcNXvBbltNFGc8RQ/VxnPX84mwimChhc772IN+3/mUMOPIux265ejMuLrDwWwQPG2YRNrzgt62hZRkXrG3QX4h2LX8cB536UuzjdKBuzxvIR9fRNzrbpw3MkHt1B8fVOOZDiRoDY+wQJeja58J6p5tSHnuosWyoxhYkL0ac27HVcAzeeQ0IAG5/uTZbhiBwGXkdJULGi5/p06fj0EMPxV/+8hfHvFAoBK/XGpzi0/KghMPJB0NyHEFBgXsumVQRbdCSh2lv8AX5WTH3eU7/Qfhgq3oyewIehDQB0TU/B1ccPBLX/fQ1TutThPpaHkbhT1jf0ngv36Rj6ixFAbi/Sfm9TpWVk58PXfx4eACKNRBXFrwoKAgYFeFz8jqBfpext01/McnLzUIEal95EUStpO3DJ7gez15OcB0gQy9bIKruU4mY544n4IdfcyX5/V5kV1YBABR6pAiAD3qq627aVYfB9VFkZXkBKWrYkIRla5B9wakgWnwKB+t5WFCQjSivvQFziqVdcl0NygT17Tka3B/z94pm+xHP5tGpcw6IJjTEak18QEZeXgBixPxdCnJ7IVfbx37NVebzcSgoyEZIu2HndcoGV5ANKT/LEjmVlRuAQLVvP69ZI3M7Wdot1aqj2wiiCOT4jX6SOPWT35+DEBWMLwgE+WLEOPPye3cFodwCkRGDIa/aCADI8XvAp+A6zcuLn0unVdGubfUsVixWbZ2c3FwUFGSjTEs06fNyca9tuU7tP15wv2ZiofeLPiiBl0pQUDDGsky43Pycmysg4OYi1ajUDD7+QMDSDkE7V3NyfIgE1c9en8+yTHWW1VrUo88Q8B61ffqQ78odi1Bwxn8d+xU3BkHfsfLFMLhuZr3AqtxcxzoA0KkgB16/2Qa99EtDVTE65fttcUex0cVnbq77PV4KeBEFwPs86DP0JOxdO9e6Pi+B592tLFk+2XWbocUrHNPyC7JB9GUJZ3Hf8Ypk3At0FEjG3YsbOcTYj5gTgAjAy3PIodbJqOsoATJa/Hz44YdYunQpPv74Y9f5fr8fkYj1Aa2LnqysLLdVEkKWFdTUOHMkpJLKoP4QUi+ghrowKol73oZ/9zsYq8vKsKm2ClW1DQhr5v5oMIohuQV46+jTke/x4eaf1L44/8Aw3tz1nWUbO6trUFkZJy+EjWBdHJOm5Oyb8noRIWUAAEDwdUO+8rNlfm1DBJWVMkRRbaOoWG849rZFNddedY1oRPH0LDoZRxUSrCsHGoJRxzo8z4HjBPsLC/7a91LL
ssF69diCcg9j2uq9QXg86rkTCUsIB9V20rEyEqWqKrwcUA801IdBGiKgDWVVeyuAvBzIUhTlO639UFlZj27VRfi803J851mFf+/bgxyvKhC4ijqIvLrfLgP+EvP38shK3Au3qrrBiI+pr1e3V1O6BpUVFRAp87YUyTb2EdYiyEPBMCor6+EXJRAANXVhKJX14EIifFp/7MvfAkXagE6Vg4xthTRLTTiiWNrdoHlCasvWI+iXjH6KanFjipIFUTRlcCQSQU1lHfxQ3QFVDVGggZJdfzkJ3q07UC1vRaC8DKjsGacn4sPzHPLyAqipCULKEBO+rOXtUjQXtujSrmBI7eNwWF0mGAzGvbZra9XrVZad15kb9n7JP+AoVO9djH3bfkOg20nWbVebls2qiiqExHz75sx2N2jXV0SytEPSrOB1dUFEg2pbRcna1iCVkr7oT9NQUycDcB6L2/EJO0st12dNVQMUj2ntqSp1WooBoLoqCMHnbgIv2bkB/jxn2Qo3RC1+rr4+As6lfXxNA7wARFmBJPRD536noWK7mZwwEgqC08QPJwQs+X6qqyrB55nb5HaVQMnOgt2WBQDVNUEoWiA5IbzFfSdGI46+I+W1xnbqzxqHem0+HxbhBRANRVBfWZ9R11FeXiBhC1RGi5/58+ejvLwcJ5xwgmX63XffjYULF6JHjx4oLbVGo+vfu3fv3qx9i2LL/ohRPaAUerBs/H129QawCVUIRUVENWsEBwJRlJHLeSFLijHa64AAHCbLlZX7m3RMXJz8Njycvv+5e2ogQh0hRAgPj83iERFliKJsxDRw3s6W+fa26UVGgxHz7coreMBr7YpI7v1FXCw/ROEtyxKtVliDbLpMX90g4tKD9FEZgGxUIze3E6VM5cvyfTiyMqxe7LnZlpurXNsAOSsLe9fMtbTDm90ToihjdV4dFhUAQBjXLTkLzx2lClU+FDFEAe/tHPP34rU3zmy+D+qlnY75oqQYcQ6RcK0xffPP96LXqFuM74qoGPuQtQOVJEn9nSQZBICkALIog9d6tSJ7D4p7LAXWLMXQnofAl9tHW087nxViabdC9NungqgSNfpJF3kclw2ZChRXZAlSVBvpleV37YOS7huwm/8FeTsr0P/gJ137qClIktzi13ui6FYWIikACLyBAwBbSJwCQf2NtBcnWYrGbb+kvSwpIE06Tr1fOEG1dpZvW4juB/0LnoAZThCNmveCaCQEIc72Ze2cVBTrtau/3EiiDNEowyNYl6EuRMLnxjwOt+neYuuAB0lSIOvnvRRG+bbP3bclKdYEaBRrPr8YI8/91nWeHT2IW5Jj9L9+vhMOoig7AsIlMWKEKnG8VfxEw3XGNklFFQIvxx7pLEoKFH1ZTrCkGZFlydE2LqzOl7MDajfI5v0RABTJuk4mXUeJkNHiZ+bMmQiFrA/aU089Fddddx3++te/4qOPPsK8efMgSZIRs/DLL7+gf//+KCwsdNtkxiAbjov4SQ51jAKnimxUePfY1qnRXuoHu5ies/g4QTwuuCR4puY5XYq/VZvWIJ7w8CrW3y2qj17RxI/HbxU/dvQ8P6I2HNujhODxZuuhLIjGyKbsJn44Wz8JWsAzT6ohKmaNsKie2wycYdLWLT+K1wORyqbtlfXgaCB60CBE9u6H97dV6jTNCkInJeN4P/ocPgVQFKzOMwWJpe1REaIufnyx36D1HDuDfP8PKxtmOhegRFo0ZPolqnb/gJ4jbzKXo/rQTOCm3Rz10Yh6cKN2fVXkmAHcDVUbDfFjjiiyugICnczAXLqel5Hnh3hABzwrimzeZGOkfyjh1BGDNQ2rXee3VdRgXy3WSuvOHv3/DtnHo3zrR8ZyemJCPShYcasRZ9muProvsRGlDqjrJ9KwzyJ+FKrgqSw3UjrCeKFyz7iuQIlR/gLW4OMER8Ya2M8jKhhYDFUgFoLX3R3WVEzrsXu7ie18t9f9UuQIZG1VTgiAfq+UqFFqfJmpkqXCTuDL
q6zbsaTscCYpdaBXmre7XtlQ95ane/fu6Nevn+U/ABQWFqJ79+4477zzUFdXh6lTp6K4uBjvv/8+5s6diyuvvDLNLW8cfQSGkeQwRm0vHa92M4jIsqW2l05UVhDUruk8L8GIfGuwt722V2OIlLaYd7IHp/amTpWotcyDpfI5AALZYfl5f/cW1NfvM0Z28R6rQNv+632WobSKIkNRgBfXqa4pL4IQvPmG+BFjGKYUWXSp4e4ufhRYb7Cf7fpEXZ4QM5mfNk/q3QMi9RvJdG4SjkP45KMh9lVdMJ6lajI3+uZZdOT9yOkyAlAUa34dmqiI8tzd2rqxxY9+M/IpOeg18vrYy8GsKWZg5ByxPgrNoe7aSSTZBIjW8XqsDgDs+O0+o9iiMUTZJn4IlQGbtqIpevZtu+hXZPNhQD3kKnZ8qWYUr1hrFoZtAivKZExZEsWOeO7cNEM/gHSdyPty0PtQa5CsXhfKTEwZf4i5mbG46f0GWLM724t00vOURhKpmrjf697Y3Qcv7BsFBc48P5bSEPZsz3Hqk0FRwJfYRkqJZn/VV64DAAh+68tytyEXx95mU6ESttKQ+gZkvfo+/Au/VSdouXaIrV5bsGojGspVoc/Zar1V7/nB3A0VGwdbLKwd+8g9t2Sq+mhK+8hO/Z4gbNsNfoczAW1bIaPFT2MUFhbihRdewNatW3HOOefgySefxOTJk3HOOeeku2mNog/lbqy2l45e5iIqS4bby0OJHz3HDwe1aKnPdsLWJ3xjUummXWMeDvDxBMXVptrwi9aRBBW2+5TH1wm8WpeYmsphwR/mUHX7za1q11cI1+0wvkuQIMl9sLdBvYg5RUIgfxA8huXHvd37Nn/huLXytpuOQHTxY3v7UdQ3IwIOnKERtJEYudmI0qkD3O7fWp9zNXUAYuQzURTkRdw88oASNc3Z3pxYuVBMyw8Rpfg3fgCdeluTFOoPSgJiy3xry2GiW4U4PRu1FogqWm++enI4c4iy8wFr3PSpkUF6PiMOPLoN/jvVPsnYNz00fufSBxCqLkbJ2pfgiQjU8omJmXt+F7GhSsHDKxoRCmmEFj+cru5dhvpzvFZjj0ojEHe7enmLplpMNHK7maM2FZt1hxY/jVp+jOryznIzMgj+V94dv9b1QSkpcuQkInEsPz2HXx1zj6TKOXqKTpGgDyEXKQspAHBNtJTHw6xkb3sJW7MJ/G6zJIygCYl4xWo528g0jq7nSD0PiBZsJ3VXX4JDpx5rzJOlMBzJUd2sh7qFTHAXPwDgXWxLE9CGaHPiZ8OGDTj33HON7yNGjMDbb7+NP/74A19//TXGj3fmqshEFMjaC1nT3F6rq8sRkfUkh5T40eJ9crxqVXa/7SEkKQpe3roWX+/biQaxcSHk4wleG+fBqyeqN4EglVeHF60+9JCt6TzvRf8xd0MMfA9JUIdUEoVDhL7AOAEDjra7bCjLiiJDocL2ROJBVuehELSH8fpKd9OPFA05Ap65WOLHZoHR90cIAYmoDyLdqiX16QmJuuk2eCKozCpBdf1a4wEcPkZ9SOhur0D+APN4dD+9osBHJSgcGjQDdsWweaMO5A90PT71ALT1RdHxMLJjD8rU8/EQxbRuAbTlRxc/utuLoG7/cohyAxTIqMixvumFarejtvR3M1bFxbrgVjpD5onRjrwef1JdggCC1Zvjur0idbvR4DP7KV7Nqbr9K4wROjqVwfh5m9IJne9KF9+6i0ECh9+F07FMOB3Eo1oUdddo9Z7vEY3jvolX3iIRCvufZViN7Ll0aAuCIoZRW7oMYsTdreuWJFFrGCQqAmOx5zxsEfvYFnEm5NTJ73V8zLbzpeXOiZTbS7dWFfQ91bo7h+XJSezjsS/o3v9EdBfidrcXDc9bXz4s5YGolxlSr1p8I2MPQ901FyN6uJmvqaFinbYQD55XBwaRGpch9qK7+NHzmm3NqcBqbmPi/ZBhtDnx015QE+qZ3W/P1mxHd3v9UW1ezHTdLz3e
Ry9I6nV5A5+/qxiPblyOV7etT6iNOR4Cvxb80zvbbJ9oyypqFz8cIQj4O6lv+kZ8EAcv9UbD8V7HWwyNokhQqBFh2VCtKbrlR1SAXXXOiy6v2yGOabHcXvpIO16Pb1EC2vIEwp5SfWV1nt+LKOX2KsnbjTV9vsOmfU+iZq86okvRhh67lV0wzNWyAolWZxHz4W0UP0VW3FIEFsuP7UaZE44f66a7qQBirUJPx/woiiGMqvZ9j80/3IgNq6agJH8LQt46y/bKt3yILT/ejKpdX1u3Q+MifhQ9p1Kluj3BpyWbUiTIugVMEz/0w9Re40mJIX4aKjdg8w83YNPX/7buNyoi8P4Xruukmx1LzSSuRmZu7RpfJZyMj303YYHvJizeqV5HtGt02xJnfhudWBmLm0IgXx3ZZ+9vWnyWb12ALT/ehOJvJ8ZqSYx2EEjUkIEVntPwePUF2FpDPcytTlrr2oS2BFotGL7Pv3e0grb86OKBs4kKR5JFF+haZfGIXV7Eehxi7x5aW+JZfqzttIhRunq9fowcZ4v1Abb8fBsANfRAfzGRiQxSaRVAhtvLHvPDcagTwrhj9Jf4b++PsK7KWtevrcDET5pQIFncLnyM4E6dAO+8GOkMz7rbK08rSxGrVhgA7AnVxZwXi6uGCRiYvxGdsq92vMFINuHGgaB3IBd9pd+g6MELigd+fydjGY+/0GG+tow+gAxZMW/uZ8mvALAGYhfXOF0ew46f1njAM7HG/GRDH6mkWX7AgWg+cyOeiePQcKxp/heph3xd2Uptw9o0SRdTZvtyuh2mHaRiVJsHtMrzenyRlgag0bdOfT+iiE69T0Dnfmeia88/o1t1fwzdf4Jj8SHjzIyykqgOVyUKrG+KdMwPNb1yrzoSLRLaZwl2joWr5UcPHqd+PMMVw+sFWs1zMhqpUj/o4icc26oRq+BmuG6nMd9ePFfY6hwhlwk0VLgEcGviZ0v2n41JayrVPqNLn+gxIa400/IDUC422Sp+6LpietJSve+d7YhVMwsW8aOzuoIW55z7Z1iFiiNw1y2W0kX8EN6D/mOpHEEJiJ9IXePXg7qTGOVFbE0L/fVkrS2xxY9gGyhisfy6BCDby6MoimII2O5DLjZfTIjsrOOlW6bs2dyLeqO0q7ndsrD1haStwMRPmlBHM5knVWOWH/vc0/oUGZ/3NSh4eKV6ouZqLuB4tcKaGvwMAJ39BEf3/BkevtiS+0YB8L3/TMuyHCEgvAeDxe9hJkr0GCOIOvdTlye2wFVZiuCFTfdh/vZnICkSFCUPADBM/B4Hcqqp1tPIGesNdAbXSBzMD3sFVNU/BGhuLolUaceiWW6IaRUxgnQ5HsEhZkmO5X4z063+AFAIwRPDfsa8fsu1Geo2ugw8z3zrkxWz2jxUkSes1YpCRql4nHgYbi8JvJCFPodPRu+B/8LgkjHwKs4irDldzIdkXanuoyfUwwjGjblu/wqs/OgkLD5wPkJCPWr2L4nflgQw3F5a0PTWritQ41OD5omsuXUo8bOvVA08///svXeYHUeVPvxWdbhp5k4e5ZyzLMuWcwIbk01OJsMCyy5p2SUtGQwsaRd2DYvB5LRkbMAGG5yjsm1ZWaM4Oc+N3V31/VFV3dXh3hnJYJnvp/M8tu707dtd3V1ddeo973lPV/puHNn8GTC3dmirMp5c7FF3PB8b/OuGuSoexye2OLjpcBhlOLbtSzhwz3vrhuJqWc3QgQx7UQ3lSY8LJIxOscp38L6e+nCvKorHwl51nk1SSxKPDQovweH/3l7t/mrjWZS7pDs/nhPRqkkqgaKFm4LsMguN0wIBxyQnPmojJ+6cdB+gDvKmV6S3LfAmgXTHy38EZmU6Qn/rzyOxgGtkEdzz2A3+59b5z9YWWjx0XwCAeAr5idwLw8Bfzg74iZVj4dDy34udcX5Ok3FwKKk6ChKrhB619c3hTq/zff770aDT+vUg6zg/hSlwfpLNLxTlbxmheXSZy0N7uZyB
Uku4NkSurLgNU5Ft1aAdueajpYN4aOA23Hrix+CcgXGREZbiBf8lnVI1gwi5+9GR8AT+tV0EjneW/7dDRRhPhb0oKCxPSguonGODxuqjlYiqKSQmgKPVQ7i/8wh+O+9xMOb56EZo4OYs7PwQDusx6fyogXoSR1gPewUHUmTS+jdo8NBvZTvCzo8amJ2SIGB61MWhzu11j5Vkiat+OZG4nWLVerx1T/CV9C71iWeisBcMDN32dgwfuRWlkb11zlej0rXGL7tbS07sqBYSdj45u/0Yw7YBjht3B+fwnCIGD/0WE32bURh87KSPqddustNCo4xT6veFXDZY8ac1JMsPF9azGoTbk7GgQG1tzs+kzahDeHYTkB89ozMcuo46P8FvY2Ub5DvrrA40vYjG+VEkbUotEEL8JIXEgsJRe4KcH/3XevHkepyfqPMzGfITRb769v5IO4/t9wlGWOi+AAi4cQnldHpYQNSu7vr7lJw44/ycJmPcA4OY3BstC3SSCW9xY3Pob1Pr1PvGgtfosplypVjneN3lIsreyWe9BHocgVVJfNBa39wBEAMmBziRLye3g0wjqlRGw92v4gYTk8sdQBKSDbj+b3Tnp9YVRrdPOCP+54ITH7CIVNb2w16EoNETn0umA5cwTFDg7oEw2XfYEMhUZfyo/F0wSJScgKcSGrh5mPPDCIN54AhIoQii1HIny8rRCM/6cQEkw/wJFs/2iq903UgNt6o5+SpfR3D8QyvkJ2Vg/B2vCX8nnZ9Ubgbmnit4K4xXUbG0vlCHzMsGkyF3V4XOAJS1WbQ1mvp/CpZUQ495wUq4KNOn6xnnHI8MMvSVJMKocVWWn/tV8UFbcRMzUKzXa/ouufx/tWMmZ775qJLqV44D4/Dxk9JpoT7yE+X8JKPIUQQmbPE+mhT2AoTqsfiJ/uJHOT/Ud1oK0fCfXCBULt0Eb6ZwKklRI2mz8Ji09IobsOLqn4aSFWpZNJxac7+kVHfPg3kocNyrGwNnqx7nx445P1obktSV64wlQhNNyVBwGAePhsjgirvIM/GyFVWt9NHhxmHsGtxW8zxPVTvj/JwmY5yhzOcDANJTiC8DwLR0MADqSFFFc9jzNpHH11LTE8jP3z88NdKzbknhGCcBrk5RA4QQmBwB8gPTr8Tur9Qizs/Agag6qUwdhxc4TFNqZ9haUoGQ4f88Fp+5KBETth/2AkXODUIKe5v68d+Dh/Gb4+FV5f+0CC0QNdnpRSgnqiPaik9rUSTsVZW1vDK/uAVGr1j9Ez4J8qOKkOrOD6uxqq5hBAREFzlMGAocM7yqL6SHY/tELcpJADTOD/fAM+GBnbLgvOnG+QDEanzXrEC/ZLT7nprnIzu3+Zktuo31POB/ro4HE3F5kpDoVMxLWPHrTkHPYzegPH44to9uOwY5PrLZxQcfkpOXdH6omYOhMp+0kIWrPauKVuQyRICtlfbvixyK36V/ezuyP/ot7Hs2122jbkpYMU54Tq7kfnzHVxLaoYRB40pcXsIiCgjGNj3UldRXzVQzAKD38e+gOLLPP58fCjINsGaxWDEOBmEan/Mjr8+wsrCzydUBotsThQETLY78WNt2wewKnB+u6fLoyE/KCZdpqhf2SqrkXksoVJkvlAkOa+8hWFsD1NJ3frJxJKrCg36wuf04PnTvG3F4Yk9sv6eynXF+TpMxBAMVrxELj5oeyqpFaF7ZIvapaLB/3opzA6IT+alaLecHgHB+tBKcVZ87LAe6yGBdLobFE1VY0IA7pRi8ssvmvSn093Nnv87/fHAsAfmRmWQ68kO1pg2mSrhzrD/2u8AoOPfg6tfqlQI0RnfyHCeE/KhPut5H4gpON0VA1LO11L2sgfx0zL9M/FRxR2qEvXTzaHgwVQOxRZvQsfilieeZtuxVsW0+8sO8WDYO0eQGfHSBOSilAuRMpefrlqkIfgSjHshoPLVa1z+pOsE5ywmJAydrXsLrGnUKSiPxqtq67ZO6WYNlwGM8EImk
RkCY15AfXdeqopd60J5bklCd+CI8+Vp7DwEA7Ae3122jbgHhOYz0eDXS2oePJGXU+RLqISMknOquW1Vddx3kR3wdOE8TfdKp094jTil4WobuMsFkHjg/k/eLBZs+jM6FT8fM1W8O/XYyS1LYNndH6olpmlY64dn0gn6czi9EqmE2pi1/LTqWiPdPD0OScgIyq40Hev+YseofxAdb3hO5ILMeD9qlEDL9fikr83i4s7v498X9OeP8nCbjGuH57JbO+jtLM/SXRw4AXqTMgyU7e1VbBVg1HKUoh2UyU6uvfcYF+FbTi3HEnIFvNr8stp8SWMxmZyLEDxoQqwo1UHluGBqPtqbRFGnblLuJg9Nd3QnZDY6LpTeHnagGU0z441WO3oSFKlHIDw+QHzCG8/vmAgA2tx9Dpm4FZ4ZqoTuE6HztwMd9IcvQuapOPNtLtV2pHtc5E4BgQNOztZIcLc065gktFDVZEhBY23ZpDYv/jtHwytalYrBf1vRmzFwbT2fONC+FYcUJ10EavRfitgBAaleX/1mteFlkYK1GfkONHDrHBPmcEZYoLeBK2QAA2OYFq+XyFFHWehb1TQuDj2DPba8PbUu8D5rpr+24E0xMhBgB90vLstFLJlX0YTvk/NQKeyUTbonr+SKAqdvuRfa7vwSJlETw9zXC/DYAqBb74JT6EvdPtlrE6zjnx5aI8RvucNA1zhB+KxL6uPau+dmXOhJiGvBmybCXoylp90ji/RQQwYaOtVh75eeQbV0GQDjpUzLf+dTGkIT0cf+j5vwYLGjXnA3/CgCYvvL1vjAo567fd3THxT+1rk02HCAzbQuvEU3ys71k+FXye+jxHlh7xAI5yfmpsvg798MDX45teyrbGefnNBnjDFzC1/XS0nVLQn4OjgejaIsG8FS1ibEWmfpgYTRxe20T5z9ono+D9lz8b8srYnukqeEjTW3IQFG7gSCurwaadH5B6LdR1eSyhJUNeP4Kc0Y22GnrQHwJ7m1+DJYbflkNiU79/GDyypjEwl4ic0KRnV2ToCMVj3vrVhzeA09Dfgaq3RhlMq1cl+avOiEnKQn146naMX8Aic5PkJ2W7DqpDBK/FhAnobBZErLmkfD98gwx2POlgjw6bflrQ9+TGtlHOl/k+M5wIVKDabyWWtlLESfStBpBueIqsMQVr0KLWMSV/Ks4P5FH1rvnh7F9JsvEqmgH0Z0fEANEobYaGjAV5Kdm2Csh7KLM3H8YqDqwH94J40QvLJV5GDHqh70CpGG89+QyAWPcI2UkrPOz0NuKKg/+/o/tbug6k5SqQ5o7KrymOz+GERB3Vb/3PGBEhHJpaepJIAq5njryk0A4j1Qed+cHiu6EWrCzQvOnqRg47oadD/bR+pdfViSJgK0t2rru/5D2ezkWK+dH9hHl/KRvuzc4foLzU0kguhfccZS9J86pe7LsjPNzmowhqMo8mbqzMt2JUZ/HNBT6a5cEA4Ye9tKdpq+dfbn/uZwUI65jUymM+K1znu4LLC5As/SXxEvpSmhbOT+mncfKZ/0Ciy8VE2KU6sJkNT8KF53LhHJ3JlJxNZYiXCrD4CY2DAVif0rheSJhrCKcAUQ5BDL1nXugvYPY1D8bANDVWQElyRNLtkNo/xQGHw05PwCCv0ngrBgHDofDXoSjapQxkRqGvzJOCFOGTDq+JBT2qk94NqSgpArPxJ5lEvJDkjkNpFMM1NNWvBat8wP9mVpZKmrQdop9cEuRMgJa2GsqqrqA6DeEqywVL5bOzDlDVYZQywgjMJUn6Px0jTMcGg/3uaSw3GTFRnVnZtzhfnaaQH7kRKQjP9opt6Q6cXg8TqKtFfYKkJ+EvuF5odpXpJJMYPbDXprzo8pqJGacJY5pdRSeJefHJg5eUf4IntMYCOeNViPHm2S89FFilaots+aUWJ95rEcsHBgPyqycRAJsUFB28h9VJo4nZ3tFUHc2M+ATEUKw9IobsM74J2ScQOjV1Iodh8K6pV6A87hO
DxDK1NIVxP13jYaRH0WypxoCmMT5SUJ+xPaTl3k4XXbG+TlNJgYkcfvrpaXrRhOQn3GZvbSujSBlBN9Xawy+rXYaixua6u5Tywgh4JOQcZvsALUIBmbxoqsBTg9hWek2nyQbHRoVaduAF1KD1uf3XdEyF/IepTxL29/QvwoZBQMhJXk+ge641SLoRAFpeYwhpw/Hil1JlwuaEw7S4MFfwYmE8RyV3aa4FpsfQeqB7bFU94cW/wbb5/8RhdSIuojEcynjfh0u7donITxH1bSjpOrENOgazVAkW0IommZe4m93ir2J+6sitiMn7g7S/9V3zPRDL0l1wZKsOLY/QH7AfH0kZQP7A+L8IWN96LsyNafIsIvbaJXj3fe5IfE9QX6O36jJio3qzsxYVUMHqBGEa4xkzg8AvOs+F4NlHg6l1CQ8q76RIEDpecj8+Kbg7yTeCAKkgWuTm0pzr1eHLqkdUcebaOUtZplDsFBFmxFkDebMKMk5fr/NVEC090NYKj6pUBY7GBOsh3dCCI5K56dWpeQEIwkoWJJx5mL3HwMOHKnj/ETNsBuRNlpDK0JqBsWg9TF0z59eC+NYONTvt0FPUw+VCCHy30DkEEBwz/Qi0xHkx2WuyMbVzJYLH+eM83PGJjMd+anFyYma7iQ1WuJFHvfLWoQHBD3spaMjFqU+MlM5SefHpqlYJfS6FnV+JLQdKsYHgNKUtldgTKIClLsh4cKvXBh8Pl6IDFoqE0obNFTYK2kup9wDISKkpsppKE6AxfRrFc8oFyHMZuc+0/9ciSAAnr8SF2e2HxJcBE9jU+utH83KbK/JnOGksJdPeE7uS0aslEjkGFNEH6mRDg3ipgbF11L2VWUYqGGHBtW5A6tgMhtUEpanQjqVjQ6QH8pCHA4A6Hn82/7nAmkO/5JQOKdY3XygnBBmZUh0OibLBNKdmbLHQ5wfP1yjhUaSJBq6i1z2FSlBURP5kceW++khFjhuWBwvSRQQyanu6nMiv4mzOkVnI86PkfI5P6achFdngkyoNa0U1NIm/oS+uuD8T2vfyzEg4kR6MwNuZeqezQBj4DK0S5NY7DXMtMX1Jsk66OZGEUG93RpxrHLBhsTfc0rRNjELbemzMXPtP9cdF5IKuAIIIT/56eeLTVrWmp7tBQRjn647FHV+qiwgTj7txCK88dAFsOUYXj0J3afTbWecn9NkLIT8nLzz0yx5IWNyUGyM8PV0x0Z/rU1C/WysykmGvVJGFjgJ5ycYpKJhr/Akp/goUVCp7F4kvofnr7YAYFaO4IqZCvmKnJTFMytUeYukscOlDiiR/BCpKK0GJistBjmHt8KFqI784VWbQr//wcAEDFlo0o2k/aqw152Vnfj8I9/GVUtejleuelmY5Bxv0uSOiHJwEjg/tZCfqPPj3x8vQYOk3qnNbM2/DU2FWLdc+zrRRLcE3cWdlbpCfKiqsh4GwhNj7cFehcs4GIz9XaHvmOQ1cQC/T/0zAOAZA4FQYukUQ1+lBH/G5YFzseCCz/rieDUzr9TvtEdX9RDwmoiW7aXX7lN6c9p7nVGXIftL92PfxNEt/xELBQ8d/kNoP/2+pu7bGtq3FnpEEkQOx6QEQS1yd9/uH0S2JPdRw8z4CyNDlprJURevWCxpATQc8knq49nWFZi17h3iLOpeRu+jdj9J1QE5fBTjGaEhdTJhL+XMM6+Mg/f8a01Fb1XzL2i2xlvSQtasPS4PIRpFYHATC/OvQMfiF9VtU60iqXpdLuU8KbK02CbuyXhmQGxIOk5E5FDxfQwYeOPejXhaz2KkJPJzJux1xiY1DubX9pqstIWyGZlg9bMw3wxAq+kVoYm8aLaoCn5R+8zQioES4iM/Jxv2StPMSSI/FEud7QAJh71SDbNDu6kwStQRyGJEHSjmMOWkszcRXRGrauT68eWgE3UQxaG9QORQik6qY3S6gssw7AW8luizurP/OLiCfCOrHldOJLeXt+LBHrHq6ks1oEiSBzsfrZoU
+VHOTwLn52TDXsoBniryEzmOrn2io0C6GfL5em4xXGRUapuQSjDzhEKiCPq7btNWvB5EtsOj8cE60yIUx8dIQBZdXBrwHYdTJT0nOj8snKkV8EGmjvxUGCKp7hHEgnFf7+b80UA/SD1pNYENH/4Dhg7/HpXxrtC5FDfHfyvqhVxYMgJCE7K9iFztGxGHWFnP4zeG/q5VwsMpD/pjA1WEWUL8On4uA+zsdBBqgVALVqqGs6BlFYofxhE03Yp/Cko9GNFsizpGrZx/rvG+hzF0+JbE/QpDEaXvkwh7iRMlLHJqmVOjv2mOiyf7gc7Ncysi6UXJWijkhzUFXKOoKb6PTdNiEeUxv2j1GefnjE1qem2vqWZ7vX3xOnx27YX45qanY0lTC4YrHA/1ihcjHwl7Xd45B/979hX41+UbkI2EahSCxKYqzy4tY+ZOyvkh1MC55T+DSDVQFxbmXfA5HDQ6MaJVM/crC0d+b8qw01z2qJ+doCwtm1GO+m9qoEjImFKUKE4CJ4XABaCyJeQ5KqJtraQZ1531E1+JG0gmp1cMsfKNIz/BgOSxQDH2UC649kQK1aTIj4zXcx7wKNR11yQ8R+8HCf2uXukDXVgtihDpzlAtzo5Ch5hbDHMJJAfD7DoWXId2/Gn2BaHjdCx9BRZe9CVMW/4auM9/HgDANSoxkq5ywlqXBmrSzxrcjrR0SE5V66eUwAuZGO0KozYyxFoP+al4HFsHgt7eW6wf9tIdpXcfCbJwArAvksJ+7DjMvYfAihMY63nQL1nSvvgl8ofJk+mYVcYRI5k74oemNeRHtTk/48KY+F6yqWcc6WuE+pwfQ72LIL6au8sFb2zFM36E5Vf9EIadPDHrelIAQIdGVONlexkGzm2BY4j339EUywmzcPDo/aiM9OHx0S2J2UzBeUjI0a8V/hJIZ7x9AJLJyVGjFCNWGbeSO1F0k/WUfHPEffPaAvK5s2JxaDGkBCn1d7Zl7lUAgOoMiaxVHdBjPb4mUum5T4udalwq5qtQFxiDKZ1+bxKu21PJnnje5xk7JeNcR36m5vxYlGJ1UxtMOSr8+wNVDCvOT0KC0KysmJSjadrK+XFP0vlJ0ZMPewl6qXwxYWKHl8fnd96LRbkm/NeGS0P7662ZXQH2+QrPbiyTSJG7q9E5RsXS0/EMBTWJcDIBwtX3HogswcEV7+DgUQDNAKVoT88ARdV3gJL4WWWzERYANwJ/u6EJsApA8iZ4MHCGn4B0SCYjPNPICtIwfOehdqr7ZGGv2n1QDznWJSXXCJ35zo9ThJlpD76Qzo/1yB64C+fAXbkk5PiZRhj5SeVmobFT8COMBpHN5xjVmM6P4loYmZkAgAwfAzOqSDMH40gJleeT7PsAUErwZ/bd8z40czGREWoEatZ1MoFu3O2FnPbfHWF4SbOGwEXCNbrPlfEczKiMoTuVD1LuI/c9fctdyFRa0LekB0fpnf52Q75DpAa6865NN6NkuvhE4TK0tIRrWwWEZ835kddIDRuphtkxDSdAaOEEoqZ+g8PHJtTn/Bi86m/TkR8grm4cNV1JHIwhc9Pton2SDzNy7C84Mvp1NMxqxfojV2I0E7T3Zn43bjkWKF5fMu15uHbhv9Q8l2E1hLKnkoxFS3zIvk0HJ1dKFzsSvO3CXwMAfvzwzfjG+XfW3JXLYtW8IQvI4/PG8PvDZRFafSy1ZLKJa0j+1tAIct//VfCbdHwR+V+PC72hUVeEDAljMCVy9/fk/JxBfk6TCYVnleo+dchVtyMTwSAWJTzr9tI5S3B2Syf+cZEY0JTzkyTTX8/SRhYMcaeizTqBNNmD186LhD2IkGUkkvviERM7xsVAdCBBY0hHQS4ag1/pOdswK6YJVAv54f6qNn4//BV0KIXbk+gPANhifJboibNChA7TNKgfNScbX3V6cjBxI+mfJR5MFLYZlFvgPOAv6E/Ab/FUw15AsPxX/54i4bmmxk60PXW4QUllBwBRMgAAPLeEho6zRDON
dEjS39ouSoTo4SLDCIdTDDvglijehWc44MUIoiSdUCafC+UuGPF85KdCTaBGSnc9Swp76crEhBg+/6UeGfaPx8LIi02D6ujUSPkZV2ri0ZEfAxyGDB16tZAf+WwrTtgZ8ZWDayA/JVNc4K6ReNmLJMJzoI5shVSJW+c9K9gnlBFVY7wh1A97KecHREd+pjZO+cgP90L1u5SN9z4EAJiQPB9LU0++JRu+5rt6f1v3XE2zLpu0PV4E+VFOIBmN9o3k6+OTRASURAgAoCRD9/ngHeERro7KztNLoqjPHq/xPiSEDCusFNtmkr8/5OeM83OaLIT8TDHsVc+inB/d5uXy+Pjq8/CsmQtC5/NqZmMkW4pmQvwXZYsyD6HVuBkr8+GVBiFUDMMyo4LB9MnW+vl/tM/FTfY7fJWcRSWgzSVg0jmcvfrNsQE+JQ9TiWZpJBB/Fc/El8qH/oJaUPXHhJn+5OAuX4SdIwOYYCsBAM+ZMS2xYCyXA/+do+EaVKXQgKLBzzziJEZtimEvACBVVThWZW3VQH4ixRJ9R0WGWOpVktaRqLrpvTXDXmKAZW7J17NpW3gNeCoIZRqHj4vja4NnFPkxNUK17giNpXvQ+NmvI/3LWwHPC5R3J0RbDXjghMPKC2eqTM3EyXEye7hf3OOr51CfPxZ1flQbR4/dMeXjVhlwfN+vgmNIoUGVZeMjH4SDADCkMxDU/Azfd5W5wxBGn3z0L8GZKJ21PLbN2LYL2e/+Esbh4xrhOcn5MZGfdq6/vaFjfWwf1TJ5kaHzEGIEIodVoQNFQH3nZ7JqL8GBAs5P6o93ARAJDY/Nugs7fnlZqOQGB/e1beb3rUPKO7kMwLYF2jgYuZ+ccxzZ/BkUh2pUO5+isr7j1u+j2daV/mdjl1g8qPplAGILIRWG08cC9bk0cSC5zNJUM5El99Kdcr2z029nnJ/TZIwHqe5TzfbSzY1A19MyJ0HYO0Xkh6EBHpoBALOoeJGarZTv7RtRVIAYoBxQ9b08mLC0ax13HLiM42cHGbZYz8EY5or2+ecTE4sVlYLH5JwfSgJvsDwqZNqDsFfwI8bbNeQHEM6PEhs08cFHgoyNrcMjAID13jHo5snY95AXhrNLiDhV0vgTDHvpWSu0b0hdiDxE8m+jabIkwvlJ5+fXPF3TrCA8mZTOrlJoOxSnJNpcPxuIwXWCtHam8RN4s0TUtBtiW2Fia6phTtB+ra89NkeEA6w9B0G7+/0Jl3fLTB64ADjSsmOVqVlTz6aeKZ+z4sGfmJkuzEgMTam59jvdkEA2GB4VfWqif2vwDGmY82PKBkSRH0TEIWs6P3WQn1Jo/BC/t2/+C4wTvUj9+X4ftQhxfvyK6HYo649QyxfR052fYLgJ98W2Bc8Lwl6qzSTg6E1VgicIOXqw9hwCAIxm+jDc0B3b16Our21DQHxNr6laSFcowkcsjeytUdtM7h+5/97sGYn7VXbtqNsGQqivacRkF2DNeTApSsjaw+KTCrULaaZpi56xTDxsWYtDGNutR7xrUf2fp7KdcX5OkzF4gNQqsU7B+alERoRcnbBX1BTH6GSdH2iVl9/Y3ItvbnwabjjnaeguiQwUIzII+8iP5vzobsaYUw2lqpudglynMsE9FRY04gOT4vxUos5PoSTPrQnEVYbgcY7HBtXAHV6d6H6kxwJl6ChsXJGD1ssr9+Kfhr4X7EfjcXEAqHIHVaRQrj4NVfd87RyBzsq4CYwZkq9TY2UcM0LAJLxNihKCnkThGQBmrXlL6BiyMQBqpysvufwbaJp5Ud3mzD/vk1j29O+iefYVid9TI+UjB25pQJ7egLt6KcqXnyf2GRkHOPdlDwDAsttDx7Ey4b+TjFQdX2yRy3R4Ay444UjJxzlupECckx+kFQKxsSPgo4SQH2qgsVMoftcuNQHMzIkfv2ZRGTZVGlgar0pmKXkLhbOnwj6WHCYMVS5GcdwjqF7ZFg5mhYZJsj53S/ZjZ/VS/zumoXBOhK9k
9PT7uko6kVtxXii1Qs4PNdK+Q8ASkJ+oc5+fvimB8Ex9Zy8q8FjL1DtfHhOODyMe+tcnI5qMuL7AIeEUo3YYZaGTcBupYaOhY4O8nuj4XUeiYWDIL2rqdbZh4h+vBa+RWdVrBYupJqstcR9lnltAyRpHeWYWxTe9DIXXvRjusoWhffywl5Fcqiex1I6G/JTHj6A4tDvxt6aqGHIm7HXGJjPOuYb8nDznJ4Z4nISdKufHUagKSjCsFKZncvBYQOqLOz+S8yM5Nh5M34EAgDG3ikcGg78fGrtEHl8Mk0w6W5YZd34C5Cd8Dd5DosYPKQVx6bETd+OXu06gvyLbFynbMMCuDfYtfQxNjhwwI4jTzLRMzXaLmOENYLbMKKvl/FTg4nf2P2O8/P7wdufi0N8/aQc8BFL7U3ktybi475nf3ib+nqSwKQBYmWC1OpaSasyTaD1lW5aGCM+JbaEm0vl5dUXYVDr0eN/D/m9ACLzF8/196PHe0Eo0uqKeilULx/3Pnk+Y98DBYUnp/vua5wLVk3d+1CRs0QD5iYa9glpJtd8tf92y/6ug3kToOFZmmp+2rJzvAPkBuEFjyE80rX7PzAfgERcFK1xKxFf1ld6+Ny1wJllad37ioU17h9BJUmFJpxxMzMRIhdLdqZn2EYmphL0AaJwf19/Hv8dTRn5EP/WccVSNMrrad2Jg4LbEfRn1/Gd0PJ3AYZlCoVPljEcz+2qJdZKJIrLf/D9Yj8mwpm3VdHwA4JPr/+J/ruVUqPu7Z+YD2LLw93jsjmvBc1mwGR3h0D9zNYK6psKvtTURcZbOj1sZxZ4/vRb77nhrYjtMJhfUZ8JeZ2wyE5351Dk/etjrg2edXNJeEPY6Oc5PQDx0weUgP1AJIOVo6QJq5WTYS7x0VZLChCaiVWUeihqCVVUiiACY1jXNBDJuwPlJbiudCArsEWrjV8c1kjEJD+4empC2hBAc9Trw9BOL5Q/Dg8FL54jBTsXO1XNjEedg4bhAUarcxQ7rqljbVDkNZQ4FihTwmuUEMgVfmEQdV1XYdIowtX8czRldeOHn0TTrMqxOvRVt47OxrOVtAOqHxKZqLMIVUoMua2v2t9HB4ZDzRhKc3slsfCyoVM+4rFDNBefHkLNpg1c9JeRHdVWLAra8z66O2BAjaH+dd8tHMsr9/mSvwj6zz3oPiCvDdtL5Kcim5kwCGAZohPPjuXFyddUs19BRSG5bGPmJhwTpsDyH5GxViyf876xMB6gVoAnESAXOj6fd5xrZXgDg5cQ7l4Y4T1K212SWa1/rf66aRZxo3VtzX48EYa++VJxb055KDkWFTCNY6xZ1RptmXoLFl34VdHgk9N6Sk3DAkxxS3YqpIIEkSWOKaan7etgr3bQ42IckDKYq9FoeRDRI/5pF/+Z/NrmKJpxxfs7YJOZxVytsevLIj1oNpQzgnM6Te4ynEva6rfcIPrVLZEsQMBxxxOC3ezRQiC1FaluZdpPM9hIveS+/EvcOBfoWDmN4YDCoB1WoiErGDa2rMUyCwScR+ZH+Xi3nR78yzhxwfcAl8cE9lxKCZw7JwZEZbQOVsJOStwwUBh/1BxJTDn6evJ+mPOmSCbGaG60mxNAheEZl5/LQtu0NgNcmHLRaWVN1bRLCM1BDZE5jkzZOOwfzN30MObcNK05ciMbccnlIGgprjFc5PrPNwQO9U3eeo6Ezv7AiIX74xdp7KNzeGuJ0SaZW8aPj24ONhwSPxpCcn9Xt4nk5xABxXDCvip1/+jcc3/m/YnupH4fu+wDGe+PZTgDgSG/DpIAtnW+HaGEVQn1ifu3SDsBRmaVpwIGpZCDk/ci1rw0E6ywLv+3y8NHN4u9GW6S/K8Lz9/e5uHG3m6jOfbxldxA/jlpCqjuzgmP84diP4HrhSczef0RcF3NxfMdXsf+OtwMAMs3LQAgJIz9GOnBuWQVHNn8Gx7Z9ORbWNY6cQO7rP0Lu6z/C5qrIRM3yoEyDQn4OjPF4YkOCGWYG
dk7IG7AahYiVHZi2FcMN3fDA8YMFB/3tGXfqKdukhqOrk/bt3EzMP+8TyLWtgdF1PLTfVInPQFxGo+6+1bgmkMomBGhYuoIQZFtXAwD6pw3ED6Y0kjSHypLNXtq4zt9mSOfnDOfnjE1qou6TuP2nQnhW45dx8n7TKYW9/nPvdvRLZ4DAwy2jQkPjl0f+199ndm5x6Dem3QSDA4zN97fpNbdczrB1OAzNM9YMQk38OvWvwXESsojS8sJD4T/telhnECNnzEGrpQsLBoODZ4nVIUXguD3SIJyw33d3hdvGGYa6fh+0S4rljQ/JTAu5PSMzR7rrRIuKlZeF/j6S0gbNU5E+8AkgdfpS0oSclEqjJl+tEKQOlX9/n4eH+jg+t33qqzwSDSPoz1SF3jwWbmNqkur2mlVMgfQ5bjB5qkK1JqrwmnIBh4RQoOpgYuAR9B28HT27fwjPKeLo1s9jrOd+HLz3vYnncLXwU0reZgcp//rMVHPw7Go4P2PVoI828T6/nINf946bIErnxzLx7T1BB989zAHbgi2RhuMF4KbDDP1OXGG5p+VA6G9VYkTcGHF81qHx2yKOZtfQLoRNoRwuBg4EhWOV4KCV6RBICKGwMu1+/b7y6EEMH7kVg4d+A6cUnlyzP/wN6PAo6PAoLBmSaeAinOY5hVAS1Y7BKaa7K4VtwkBZbd7OmKyj1xPpYs84vgQAUKlRtTx0rhqOru4otC96YbC/hkYD8J/zVMwjDGySkinKWILMQiBwmIqFp1U5mLIxFvudQpL18CVTQvSag2zaUnH9DPJzxiYzj3s+GpGUPj3p7+sL+tY15fzsnxipKTmvWzFW7yW5gzfbYVKekWpCmgG2GWRMKSFBQJXXiKRj8kZsyl+MY0aQxmkneHg2VcfQlKq1wUQN7JwDR6staJZqrp55ELNJH94yfwvc1GYwU6z6KOdYUBIZC2OmhYGGoxgpB4NBC70JAAeT8HPHkpf6yM8YM8HB/UEhI+Pfrjc31u6M/WPZ1EWh7S7RB82Tf6iKJButw6NbIhqRwPlRcDy3gmdFDBujtAEjtBEP94Wf/4TDsW+U1e1LUedHT5l3Fe+HMa0UA+DOnVnzeACw5vlBRk3JHsNEaghMhmwWDG5Ety2yXbJ8DOWnne+jNVVqimvU7sfo8Tsx3vtw3fP1SiDQokHYtZsuQuOaD2D5Vd+HYeU0FCZ5YhvVohfNvN8n+DpIIdu6CrQsxeoIASICcytbXXiZFPKRFGjScg6qSOEgXY9x0oJjdFkI+Vxy+dex4Pzrgg3S+RlLZ7Hndddi4p2vA4s4P3v6t2FcU0CmNeZpb8mzsX/sERhWA1Zc9QMsv+oHMO2874R4mtCfEkgkHgPtCy96PHnfpjNJBq6OhXSVprpM87OfCAtlfNYyR3vVPrP5Gbi8W5CEC87o5GOjn1of3ByHVXGsfBhFyjFqcLQveoH/na84rawO8pN0bidBZmLJZV+PbWMJApssUtqir8Tx5+MeCg5H59KXAwAmaG+cqxYR7eTgviQJ4QyVC88GAJg5qW+V5PxwDtrdV7v46mmyMwrPp8l0zs+peKAKtTk15EeccdfYEO4f7MYF7fUnmXduuyP0N6kxsEfNtPPIMIBAg2y5DUjOzYTjIDrRV91NuGd0bWhbEpE2rS3qKp4s8qhN5PmUcH4qztPxhfLrgtPTCTRW+8H23ATeEhCdOWzMLw3jUKYVh5oHkLXuw/jhFJCVonwog3HuDwJ2dgZkSTD8JncxNhYf8o+V8SgcbxFGCvGByTIehQqmMdYMSkcAiEHYTx2eAhLIKQ2nzDphnkiS6do4yqJpt4Dm/Nhana3cXPxH7mKAG7BK4fZ9fLOL/WMc7z/LxKbOGjpDEedHnxR9h83zYGdnoDwuwxAJ6rKhYxoppPMLUR47iMfmCF0X5Zdnq034/kKRjZPiBXA767vdDqGA4/jZYABwdOvn6p7r4Fhwn2wakHHvtV+Oew8Cv1qiJlq5Uq6B/IxL
PZRpKQcoBATfg8YGnJ077KtV83QqRvTdMXYYP2tPIT8Sdn6qRh63p96DR80glPqi8nVY490h7kVLWMNHEZ5fszMHBoLrL7aQNsPP9Jv7/ws3XkjwwztfJq8q3idHDI7/OfgxAMD7V1+PhY2rgnMoJ0QT+lPvjrVjN3JdATrBADDZ59X9oGYWepOmyvvxuUaEwSBpuIiTmXVTzs+KkQ7Mn2hB2ZDOKK+iyspI1ciMAoLsMp3z8819n8S2obsAWfJuvTOKvC0SDcwjJ0K/5w3JNdEAwE0QHXS9MlJmuD12bnpsvyQtriDNPQPOOd5yl7jOmxsZPrpAjAuMODjW+jjmDAULT0SQHw74Q7bBuS/Eacp3KUnnxzh8HNkf3wRuUEy86w0hRPl02hnk5zSZcH6eOPLzRMJeAHDzia5J9+8uR+BaUsHSjOBpzMwI4cRN7VfGfkfNLNKcgGirCcKDjj/uOn66vzLOM7itb96kbbIjzg+AkPPzzNnXYk16GYxSVHuGweYOUpHBxaUm8jIu3pMVL7qB4HiEVEQxWl/bxMIFbYKXlKY05A7OLqZRjWR0AUDa+jVsM3CSXrXgS5iTEzC7E0J+JrdypOaOX9W5jvPTMuuS+MYk6F05RJqeUMf694gPPL6a3j8mnu+DdThAUeRHQe0A/DIOxGOYv/Jf0Do+E2uPXz2l8F9T0jUBIIwgJyeB+WwHwD1YciCvUgOk6tasv5Uk+NirzaGzckDEV/D5QAHhORk1UOVYUjRCkgURXBnl/GTTmiinMGYdxHebgCY3zP8oIxtyfABgjymkFZpnx2sz+WEvOf48PszgRS8IACP6ext/Fse1rrB96N7Qd77zoxFtVf+mEYVjV3P2FRLWvugF2NChhchrlOSIGtWQH1NTo7fS7WiaeTHmnvuRyLnFv2aLKJ2R8kyYMsQ34cZV6EPmh72CZ7lt6K7QLkoGRB+bKheeDXfuTFSkzEOSVRM4Po4TD8WZqebYNpZAjvbDXkY6RPk6NM5DGV9H2yLhTkNxflSJIu0rzv13tB7hWZUXIR4DHautfP5k2xnn5zSZjvzUSxGu/Xvx7xN1fnaODuBY8eQ6JEUJNhUDy4mSIKme2/70+H6SJzJT4zmYlU2AzMLZMtyHaBcsVl8DFhloP/Lo/bhvILxqooT4oQfF+9Fl49NmDq9qfRFGSFjrAmCwuIusFal7Axt5OVA/IicS3aUhcIQqrJxQCbVwfrtwflwehLwAAaea3jmh4zdmPonGzP+AEKAzI1CPFnsB3rPyy6JVRCMLTgH58eYHWkHgHObeLvExQRDSvwZqwtKqsAM1Ciz6RVIDYvy3DrbBKG8EYUFq7ozIwnXLQD3nJ9yuUPkHFXLxPNw8diu+N6OAryzZHptQk6x94TWJ2x+352BEZiDN8x4B58zXyXGIAXvLI0AN5yeVkN3myRljdQsBJQRrwvpxOF6QGjZ1CM97Rxg+vkVmd010AQBWemKyLJK80ENSzk8mjWE5/xEATuYWgHgoE+Db88LO2eNumGsHAI+al6OvcC0ey7Xiukfeim/u/QRcFQ6JOBJffdTD7YPJquOqVtzPO9bje+nPop8I7aEy4bijOdhv//hO/zMZHYc5ICe8A/uDY9XIWHI1wjaFh8bOc2Bnp8EgBGd3nKTWj4/8eBhBP37c+Gx8N38NiukZmH/eJ9ES0aJSzo/V0oHqWStBQNDoin5zZKJ2thhQm/CsW0o60qZMbweA6kUbUXrV8+HNqY243913c3AMT7w7I+XkYqiNuZWhvw/c9Q4cfujjoQzLIOyViuH2w65W7oJHeFIqo1X2nXSbhu5x5r+7hhwAEwnPbvCe2Q9sS7yG02FnnJ/TZDrnxzgFjodaCZ0a5yf82H/XfajGnsmxZ4oKXLgYKOtp7gn7yRd/Pr8ztJ14IiQ16lQwlUKpW4f78dnHt8S2R0tcWLeFJ0s7l5CuSjhsXkV78wLY2mDMYMOWabwqrGdqk6OBMaHNxBXyE6hV
u5yDm7onwMB5OGRjGcFAmpKihiUPSNFgIquqcgFT6A8hJ8dxA8LqJAvkjiUijNHiCMQuUek4Uiesa5zjnh6AsnZQL3C6XBbuH3ad0SRaWDUkiCiRn3EUcOvIb3C4cQSPNXXjhr0fq38xQM0K3x+e/wr/s4UKOPcC58fnMdTXTtFNpbmr22xHSDCHxiIaNgkT4p+0ml4VIpxvld1UJE0S+ZHPI53CARlq00MNAMBJuH1uZj6yfCR2vus7X4PfjP4fuiYex0ODt6NrQgrUJYQ6f3KkNbYNAJiEWG+YvQkHjQ2433oRAOChyG3fP/6I/9l8fD9oSYZJhgOSM1OoaaR/u9pizIAT6sJ+uvuUtX6E8+MYVRyyZuPR9DLsTS3EwWnPTNzfU8gPtXwC8rghUJLe8rHE3/jn8sNetZ0fxUfM/C7Q7JlKyQg9kaRiiPt2rHggcd+0HQ99jRz7C4oaaV0Pe0VBtFv6goKxphdGdjkJIz9cS1Sgnudfi4/8JL1TGuplPbIn8RpOh51xfk6TiU5y6mGv3qJU5n2CyA8AlLx4hz1aHMe+8ZHEooIELlzuoewFoQv9szKl1juDPxb9BgDQU6SgnhQKQ/IqXFRDB1jCrJ72nR8ApUoslTTXtib2G4Ahy8ton3sF3jn8HSggt6XUhrPGBbqk1HbVGZvNHlDiClKz1C2h1A5VeF9wWTBYgbooMN3xKsGgPf5fGdnuksthUguGvB9FWddoStleluk7PMaJXj/s5S2aU+9XaF/4Aiy54gYsmCdSlXUSYn+lhJFqxecBFeBh3/go7uvRBnfNqesvA49r/JN6fdGww8hCfvqm4JDyOsbKA+AccHg7OCdwtNBk6/znJB6XEAOpxvphUotXAA35qaoBvZqcPpzk/ESR1hQN98cRVY9TZUUl8OKK2mtWgXCWs1yEVobpDBzzpoPLgqs8Zfv6Psubozc2fOyuSguaMjkkmQ6i+veTMTgJmi6cx6eDgs1Cb2aBNAMADiXQsZQjTEfHQeWxxjMBsblWpfsw8hO+NutkVZ4lwlhIDWNMqw3nNgQIcHrDl1GRITF1WIOYcKQi8jn9s8VvuAPGPewe3YqjhQDB0k4m9isLB2+sOhTbxXuCqd+cW5gzdCk4T6FUo1ju7NYXYtXRS+O/1TO03OSwFwAMVYPnzqgri25Li4S9GFXaWQDnjo8M1gt7EQ35cQjF3q4R7B5hqE5VvfJvZGecn9NkOufnZH2fisfx0btPPXY6maL0idIE3rblL3j39rti4SZApLq73EVBSys2SZzEpkoamBxghl5fhwKsAVb5IhCuhP2Sr4cnCW9JS2np7g3Xfz9+/sTrZMiyEky7Cc1sAjYRq7vWShvSEglySEruKV6PNBWOHecsVMxRF6d05LUSDgyaeTBN/M40wshaRi5ny4qmIyfMqhcpVVHPCPEVqLM/vkmUh4CYNOv/jCDbvASkUTgjioRZdB28/qE/4doHb/VXsh/u2Yd/eegEfnkoGAwpaw4d70MPaRNXnW5las5PzFmRyM/7NtyMCb4J/d5rMcrC4Yl0UzR8qX03mfMTRX7UZFtJTmcOCfNJi3LsrIjz8729KvZaG/kpaYN9lYhQQ046P/10Pq7reQa2lsWkzG3LL/0yO1ff+RkoA91l8f41urUJvh5zAS7w5vef/efY9zyh4O6P5m1GxQr6lENS6Dc5JhKiqzuGRVantWufXw6jbAfvdS2kzfXJztUY5ulXdp+i86PCqb3Nh7AzFRC9x2RCwP5RhvfvWYVvZr4i2iS/N4jhE5BbKuIZVL0K/njip/jSrnfjkzvfiANj4UVceawLgEBZPObhvVtegKhFS4VMxXQ0daL8j9hq/jvGSu9Dqftg4v4Go2gpTofNw3Ccfr+Diu6pmPOj0wyqZhn7pge8RJ/w7CnnR6qmc0msVppNUlYgOewVtOPrszbhfXuy+MCDLr626wmUKfgr2Bnn5zSZYPNL5Ockw16D5aD3norzHA17Reda
neB8YCKJ9OfBIxRVTQl2XesFsb2UkN2sKsAtfeAgICy8UvXsKDqkGle7i+rIz1TVUjkdwfkdc9HQcRYItTC7KiaLVeWVMGVmiNJuURkoirDNEWR7EcPyxSIBwFFkTgDdVrQGVXjkzskRvSTffVveJ0cerhaJN2YJ4QtuT00bx5upcX88D70VDcWT1/t4ZQKGuyj605pWz2cztIrsUVE+rmV1jTMhhljk6wEAM9f/C5pmXYa2GsgPEK9tpdvyyk5R1d1zQoRnAOBSSTnXtgqN08/zlayTwhgq7KIm46WNyRN5wPmJ3ww9dVuVs5hDj2KleyfSXDivPY68N7btk6jtaGS4lnghgHGzdnaSy12/zxzPFWLfswTnZ8wqoxJ6XgQjNWhlAxXhSLOGnI/86OYjERFOn+/8+BIawfVZJ+n8qCLGAGBoYeuyfD/vkShmP50v2iqbQonha4PZciKvsjJu6/6Zf4zNA3eEzlUaDupcRUnGbfJSlTPAWkX/d9Ysm/QaSl7gMJYd0e+r7sWo1lJ5ls5FlJOuiy36YS8jHvZqyDaLsirS+psOB18qzo88lp+VB8nhOknk5zedAT9poHQG+fl/0ipe+aR0frYPMHx+u4vv7nFx3RatUvIpnDsanqiysAf+vUOP+5+HqvHVMSEeXF71X+yFDatidb3EfuJEFicwyTCYIUI/lFPMzTSF9uW0CJAkRyto7HPu/i1e/cCtfnsDwnP4Ljjnr084DsBRAQjHmnPe61dE7pBEwBs7GvD5RYL34JIUGIifDUP83+vIjwVKiI+ivX3bFrg8D8KB3zW+MHTeKp+JE+6/oCzFHrNyRFelPUzegLHiB/Ft6yf4YeYduKHYhnJCKDJmCQrIfIpppLyp0e87pFwJDYijBPhTR+1JtJY5dTqjmdKed6S/80xy8UkAGO9YiPmbPgaaUOJEmSow6f/duRFN8rk+L383ALHyVRPpuJnG0ze8EdsO3e23beEFn8Wcsz8gjxCeaXcNM9zwuOhz6nlnaQ0RPJ8EG1/VlrVHymDgu62vQGXmlXhp5dNY6j4AAKjKPsFtK6BexY40dXE8rs2IHncwVhnE59bcCZfFNahcbzkaq2FHclvTEfxmujaJgvok4XmRW6D4HoQxH/kJfV+VJOjIdocqyY+486M4P06NbK/fHj+I63Y9jAk3QGSVlWjQhyuSd7JvNHycoJqeAVAKZ/ki2FKkdKQ6gDEnCGWZEdI+0zKyXC98MyxfekzJRkgu0orJFxPdpcMoVl6OUuVtoe1eDX01Q6K3US4V18Z15pYwQGbhxvHn4sBY9B4QLL3iG4nHLgw9ikdvfh5O7JBImREgP4xVfWTIkP0skfPjJiM85087Bc7GX9HOOD+nyQRqol76yTvBx7e4uK+X4dddDIfHg857soXZAeBwMSx/XtZeEod5OFAInJBhJ4kXweCwqp89MpUigCKWL4YaQiis2G88IALbAgCzwiGjYaeCnSMixu4jP1FCQK2MpwhRlFATWRaECbY3BwO/C9sPe6lwDtd0fhSx0tQe3QQ7B5QTdFlLIicWD2mEXYUUzaBJhhEUB2S0eg0q7uUokTbso8/BPUMD2DyUnNkROmpSVthUNTQo9XV0SLEc4n2NU45PLUsmwNazeqtzKxOQKsujEYJ9nTbvGJ4844uY4Qm7bf5zUJYTVVo+IOZVfOdH2ffouwAA1aIsQ1IDtfnQQ5qSrTxGcXgvLB6e8DjnmkZTAvKjOemMEOw1ZuB3VZE2pspcOF7c+SExpKf2jW5ywmGvqnuu/9njLrYO3Y3tbd2h7f73bBqsBKflFzMDMr8Ly3d+bJrCxrYgxd5nBzEO16hdi8qj4QnSi2j86IPaZMjPNw4+ivsGu/GX3qNig4ZSlTWRw4qfzBAYA4GZ7RTnVuTlTAopJvrO9qF7QufKGGGdrM6lAane1VDw6Tzrl7rxlaJ9VdrJEzyOTnShUHkjJirhRZRTw/khMRFaYWHkp4yfpz6E7ZVF
fsah/x2PJw54cqzcf9c7fKcVCKgABsJhL9MPe9UnPOs2x42jj0+mnXF+TpOJ4oGnTnhWFh3Qp2KVSGd0tfBJ9Lu94yOx3xO4cJgQAQOS+T5REw6ETAd2Z8D1oqv9+GTxtpUAM+OZaKq6vOL8jJQiI2MNrZtoQVNCbdihlzW49rEl/5QY9qoWe+RvxTVfOze4do83o+olkazFcRka8bol/42cfGh3nGA4OsHhsY7w7hwoeg6OFscx7tSeRKLFTblhhLR5JjOeFc+A9g2GEL7yKXbHeqRUI5INFzKFELJ4Zz5R7Jr0vLouT9v4bDTOvAQV3/mRcLwzEXtXhqmsAyU1h0gCahN1hCg8VCaOwXPG8a7iq0PfCdBGhgncMib6t8NzgnBib8gvEfdgm9eIMZqDKYn9TlUQ6w9bvRioiLp30UxKXqNu1QyviFyEr8S4mNw91oq9I4MYKvfB9RaAsWkJRzBjej6cG3C8IL3Zg4VR2cVap52P1y/+IObmlspzyHeJMbi0dhjaNapgmTRKz74c5Wdcgq7LLwMg7u1hcwaOocG/7z7nJ2GRp5fnGXGUBEXQ/zkIwA2AZTAo+V06gFQ66ztITxcSHdR3fjI+8sMiSRhREnuHVEYGAE9T3b6oLwPDEyFExYukgyOQJ4pfSMQKbvI7XK2x0qW9MqMuUgORuWVMDOxAcXgP+kd60WPEJREAcR8JoVjb9H5/m1PDefUUSseBgTLBODNQJga6MA2MNSfr/GhlPaZVxML7bUcfwDrz9Do/ZxSeT5NVNefnCfg+Po/hZCxvhUMIjsZxKEdCYEmZYAQMDqvguweEKu6u0fplAQCgiCYYahBnTTg+FtmBAJyMg/AgPLIg78YxcgRhOsV9+mEXweu172urHIevjVILKb2CNRFZZwQGvjyUQjYlBnX1fJzKsE9jVmJqM9I2/Iy00rXo53EVZU6DWe+jj+3CfNsFsBBlD3jHvQ6yRhQpotg23I+v7NuB6eksvnlOXENJHDgyGNYROEz8eSYDYBSZ396G/7goSGEvnWJ/nIyXYdh5eNUxGFbCPSIkRlpgPI0dw/fi8MQezGuozZXQQ2KNpTawIz0ABO8qbRqoAhg5ejual70x8feBUFwQ4FS2ZSB8j4s9d2P3vk8hP+Mi5DCKdjqEASbDpSwI9TKvjAN3vwvZ1lVYctn/hGp6AQCnAa/jP1teh3PGhLPgTpSwpe0Evlj+KSbKbwHw4oR1QfKNXuSNYT8Jc+kqzoVIW7dieOJG/GIijcb0lzFeTg5xcFggACgnvsDhRPmtcL0V/j4usbBDPr60nYdFbSxqXIUjhb2yXiEAxuHVcX4oN8Cb83DXLkfJ5bjudrHvOO3AN1oEmmIN9uCC9hkBST3hkvXQsCPPnW6cD6conEZGKMzyRSA8gwMQcht6hPzze2egJfUcmKkfBchPNo1UjZpg0YxWETq3wVkVnhxHGM/ga5mfAC7Qzq/EhDMKerw3UFKfQrHeCSd5n2qC0CQZHgUtyPElkkJ/bNsXIVw2ii9kf5I4lgJakWy7DbaTQdUqwTUqgBvPIPRT3Xkj/u3QpSDg2LjoUjxsLAApPB/V/HWx35gHAg5R0RDj5sbxY8j87ggK/3htbP8ny84gP6fJRFX3UyM865YgzDqpPX9WpK6UjvywZIgydE4Mh8jO9WzOhvchP+NC+VfyyqUxIzPK7K2h7bXS31Ubd4/UiPnJmlT6qp2TEnLGo/hAe7CNUBNrK1HdCXVOA0Uq0ApDrrSLo/tDvxWmFyAKT+qXOTeA0cEYetVVDqfkF73ZkTaYUgAS6CkX4dR6JlHCcw14uZZVz12buP1UkZ8qq83NAERfyLaswOyz4oVDeWMObkQ7x4NYPW8dujO2v2468kM4RbU/CNum0wLON+x8DPlZ5orspJmr3yR+m6Db0l0IrmdBI8Gqws8BAGPdIiSS0SZ5h2nokbTikCDy92vkzoXuZnj2Dv/vCk3BU2Rsw8LR3Ij8RrZHC3ut
yTXjsoHoykFYins+T00ZIQ4YbwdHDoCBihtXHg/MBOUEHx1+PVYOd6KjlEPZuSa0h6utl8/vuFq0UvL9/FU/Y7HQlm7TRxb58gYDNahTh4viGlUx2iTHWl+YlWXfn7H6H/xtHACRxW2p1w7GeSxBZLTaCs515CcN20teRJTdYmwbkZO5J/k/zNOFC9OosBKsXYHAIZ+Cxk/RTT5/hcSdMjoc9HViR3l64mId2ChKiYIk8+8Jpb7OT6Uthcplm2L7ZjrWi++9ZfIMBAczqo5iMwqV2oMHB1CUC5Ws54COxqvPP5l2xvk5TSYG2KmFveoV2DuVsFeDaeHmi5+Hj60SnVtHfvrK8Rc8aibpT05pTLDW+c/EgvM/Lf9KIEGaB2GlRWolN7phkAAlYUQMbh2pDG6++Hm4SNYg+/GR+sqrivOjj5c8dRfeN/IZLM+Ei3VmeAWv7dCyXKSjowZNADDAwHgWv++/Cj9MfQIDZDbAObqLXbhx/6fRQB5MzEpbyO6Bl34Y0Fb54uCT3GNuoKgN7CpNN75fhOg9hUwS3dzli8Bam1CJNH3ASMOorAdxZ4Ij+dxpI7lPvvlOB6UainRNMy/Eksu/hubZl8FhHC+4tYoX3FrFF3e4eGT1OoyUPgbitfj7M5jg3MAPj4zjOXf/Ft/v2p14XD3bi4CgWhH3LsVc5DvWAQBKI3tAI863AQc3ZT+Abe56+eN4mrq6lPOyB/CP7nsxh4XbkNFCqeMOaqpzK1J+GzuK5zvXARINbOFFea3CCpTj/xYKwUClu3O8FEwSn122ESvHk8MFNvfAImNJ1T0P46V3aH/HJzRlnFtghKOfroc5+nF85uEXxvYZpnPguKtgk0788uAyfGePCwoTrjcLf+h6Jl5waxVbjdaayM/Zy29Ays36KMUDNUqijMkwVhT5GalwfHzLID65/RvYMxYkZow7VTw6Ooivdo/4E72rh5N5Hi/5UzVO9uUGOG8OOT9mjQzTaLYXECDAt/XfBI+1YbgY1PNjvAm3df8MvVbgoHynJ4sX3FrFn4/XXqgUa4S9dhiD6CuFhReJI/W9Zk2HYcWRGkCQ6+uZvoayPPEuFS5aher5G2L7GjkZLuVBGHvQCsbP8bEhHLj7PYGCu7Ygc4jh87syngN3ToII7ZNofxfOz8jICD7ykY/gkksuwYYNG/CKV7wCmzdv9r+///778cIXvhDr1q3D1Vdfjd/97nensbVTMyEkpQi19Z2fyskt6KdsKlVbR36mUuqCohz5e+o8k5gRD6PVIwAE7M61LqnCW2kJtbbY4sXsr5TgMA/PmZvcfVXYSwchqITF9QKbKhW/QddskSJ+eiq+w0xU3XOxt7gE+8zzsMN8Osx0C3599FtyDwbqxsUFy1IvyEBksqqTqgz5C93G3eT4e/W8s0J/80kKgSYZz6SxMx/+3QONy0C96TCra1ELK68V4hqtBunE9ex2Te34nh6Gr9OFqLoXwKgGaBTnFip8NspchAV/ejTZ6dWRH8opytL5SXsO7HyAqrmR8gC7zEuxhVyOL2yXJPaE0hRq0nVGd6MwEKA1hiUQpQszgYrugVEWK+AqjscxMSHObfEKjprBoN9si0mEZkTorCetI6qiPVuGe4NjGQZa3WTH4gTN4gV9cckIxzs7cf9YO2GhZDj4KF2B21sX43sz4pMfABSrL4LrnIN7exh+08VQ9ppQdp6BgbJQGn7/kqsxczjBEedEE0wSfXzfaHJfKchrjCo8f3uPh+0Djdja+zr86kig7TXqVPH+nffirv7j+HXjZfK6A46L4c6Jlc1R5ngrQNWzz6TRWQojuGkllpgwTivu3x1Df0SpGnYWmQzh/zZ1BwDAA8Gv+sW79tVHaw/qpRrIj+stxA37PhFpvExzt0y01Sj1Mpnzo5Af1pyHyWzZ1jgk19C50c9eA0/O0HRIHhP9WzHW84BqtP9dQaJkhHNkmAtn/cqkQzxp9nfh/LznPe/Btm3b8KUvfQm/+MUv
sGLFCrzxjW/EwYMHceDAAbzlLW/BxRdfjF/+8pd4yUtegn/7t3/D/ffff7qbXdc8piE/k4S9SnWcnycikqkUinXkRykpr28Oa9W8cfZcfAgP418GvwlTDgKNZjMA4M1LPzql8yULFnowICBujnRIZVbB2mlDDAavnBsMqB7nuHpu8FKPaqv/PsJQ9twQMGLKcJZeYFNB1jmNQMqpzPzRXg2XMbhe8KIesc8FMbJ+EUNCPBAvTCCd5h3wV+GhqvbSnPR9sW1+u3h48BupoURcvfBsjK5egT6r9uA8mfFMGqOR2GmfHaAvShPK1cI0AHDlnNod78E+FiKjJtmJYvj7A0U1MAaIW9psBcfkZHqiPXvTS8EZFEhJmrmw0kHWmledBGZPqNWkysgYcCJ9R0wSZ6UDXZlHhzkGvbhWDucuyhK9M1HBoNEMAJjFx5CRTk9jp3Bkq6FsoITnaRjIai/9ps5gHw6Cl/Q9gje2DsR/NxXjFgpW4Fh1ZZpBJPL3woUH8OIFyjlsAtVCvIynwHlz6FCzh5Zhydmfw6r023DOgedifddVOPfA80Lcl/4SD2kf6aaSGlSXZpzDZRx3desodaAePaYtELpNGYaZ8qLMCHF+5hSbQDVHaXHj0+HxbHLYi1r+mMl4OENSiUZux2NgYBicFkY6ar0jvaUaizqY6NND5pzD3CdC6twy0TL3Kiy+7H9iaugsIVymW3+Zo+BwuCsXg82dIw8tx94mQZFonn055p37UY3QnPxeOjJUXZ2Q6fdaJtrB518GAGgwOCqveh7cVVGu45NrT3nn5/Dhw7j33nvxsY99DBs3bsSCBQvw4Q9/GJ2dnbjpppvw3e9+F8uWLcO73/1uLFq0CG984xtx9dVX45vf/Obpbnpd0zMHJkN+ag0QANA8NU27RPOdHw35qcrP7alw/Hhi19eR7b8brWwMtszumpCZDDkzub5SzEhy2rxBlPNjhVYpKo6fkc6PcoIAMXDoaeYvWnctGIAjGRPXnngUb9vylzDyk+D8qFV6o+aUcaXfohX4c0sEpWqg3noYi/H13YEKKnOXgLLwwDeD7ffTQklSiiqpNxGHB6t/f7SGI08p3pQ+F69c83IMWEEo4WSMZ9IYi8ROT4RqBUmFVzoEyxDPj5MCGiNjH9ccvC39HD/aVx+uvOlweMWfxO8qsPNjzk/ShKHXDTM9G06v0GZJMTfkEB7b9qWa7fEY93VSkpAfAw6omUHTTMGZUQVuKaV4+ixx//50jOFt9xIRFtWvzS1jy3BGHsfFHxvEMWaREmz5zIj8Vzk/a/KbEPQD7ZoNiqwXtG9OQ3B97V4JFMCfnc/XvM56Fr3XQ1bW31bwfok1bUrwrinkpDJuxwQSCShyLauQs2cj5WbRUGmB7aV95OeYkcM/3OXg0eFkB8CVz4D6zg/wvxFF4AkWhPD0rEjHv29Tex84TBAEyA8ALB0Vi78Km4M/DixGn/cGlDwnVm2dUMvvuSSClqh7MoECbly6BV+cEa7i/oO98T4/7oxg/8jG5HbyNNKGtjj4zW2wdkvn2zJBCEGudRVsmb7vt2MSJ7C7CLzmz454V6Tyu1KHVv+2LXgeTLsxSGXnyROPI9GunsdvlBtkWM6i+MQJUaw1kyLw5s58Ypk+fwV7yjs/LS0t+MY3voE1a4IUYkIICCEYGxvD5s2bcf7554d+c95552HLli11uTKn25jWtskeQqkOvPPmFaeesJcU9lKhJpsa+K+zLgUAZCjB4moXCLWRa1+HlClWfcqBs2kyBKrbc6c7YOZRcNoHw5ChAjIBw9yGDNnrp5Prq12lypqWELlelsPjPJY4UaEm7msVbemvlEKcn5IMQekiaMoRmm16uLBdrcrUgBQcvJHFCab39R4J2uKuin1/ZfWbaGgQfbbJsbEiFeX9cKzvCDtAhMp4frSyMpJ5X5xzDEtNkh0N008N+bEsFCKqlySU6q02AovbToDRYXj2Y3GuWQTV65mE1jQ9ws1M
KoxrUTEx6eYmqFqbdh5tC69Bc3o18uW2QOMnIrhWHH4cr1tmYFrCCr7KoGnEBG1R4T2Du4JbJEOlStGXUAP5yDyw3whPXsyrICUJwI5W9uSZ89bBks4OkeijI4/flpqmhYBFey5qnwlQiowHuPZOGOYgrplv4H3rTaxrI3jTsOAKjWMr0tYtsWuczHiEsD/sq0VXkLNSyJpqvwwsFjzAWdkVierQoCTeJ+WC5n67M7a7a2/3P6sFmboDjMfRwpQmjTCWIAnBE0ZWnsS34yZWNstnJkPmpjy2A1V7MAWGRoxXw0KshFp+cVQSWdxxHoTOb595AKMRSZDjhXifPzS+L7YtsBSW5Nf5f1mPBwkYzrogIy8/Pay2P5nzI/YRKCehsq6hlExQ3B1qimtRXE+OZBFUF0E/4Jz7nKRSClDOfKGeGuqTaE955yefz+PSSy+Frcn233rrrTh8+DAuvvhi9PT0YPr0cFXbzs5OlEolDA8Pn/J5TZP+Tf/TC3VallF33x3xenkAgI9vSmFGY/3f1vsvI1/0oufiP/dtwxf3bvXJxCnDwLLmFtxy+TX41vwssryMhvbVWH7FV5Exw4Nk1s5Meq6VTSZmWp9BZ8Or0Jp7Jy6Z8z50NL4AHdZ3YJACCKTWiub8VOUknDFNmCaFbRn+t8QAUpEZuEzNkMNDNe9ojczqsuyU3yZqKKFChg+vUavIINsLAM4t7YiFoQCgUL0GFUes4DsyAerzbvwZHytchRxGkckuBADMctvw6XNf5u+jrmHjzLBT5clii2Z1A4gbhsgr8NBXLeIzux/GlpE+jLoEn9oWSd03k/uCoQqgGvHviG2gGPEiddIs91vLMauxDC/9ILgxhFQszTCC5JDkd2jHEMd/7HDREylBFXJ+5EfHy6JSfm1wL1gjPrfDw08PerHjzt/4Hiw++yOg3Ag5P2aknc+dOYTvD9yOaU5vaDsxKEwzyPZSx/Xk9ZtwQI0UDIk+clUugBpoSoXPYUUQgJGjt+BEWZxvgSXSfm0KPFz6NZgSSpTOz3FLhHY9tKPiPAMAkJHO6cvmL4VpUmQJATdPgKa3oilj4KJZJj51Xgrtsq4XIUBj5os4WXO9pZgoBb8bsWSmFBkFoRxZWyE/nTis8Vuuf3QO3AR9K8MyQSJ9yzwudLJ+YYY5chfw7eBmUPzXA4dpUlgS3uWExMoylPXyMhpaZ2i6zbFrTG2LbeMwMKdxoXjmtglOCCy5AGE6woUM3nf3a3G8dMDvH06pHx4BGGtCqfqi0HE3tIUryZekxMjzFohjP9zPcbgQfk8e7Itmfmrt5CmkzbS/r25k8VxQg+BbezzcX1yAv1ivxj3WS2W7pxb+KzEKQ2oF/aVk4sZDj8GVAofpbAtMk/rUBf2+6DbhBdmE1h9+h9w3fwoAqKaCMOS6jsLfbF49Gfu70/nZunUrPvCBD+Cqq67CZZddhnK5HHKMAPh/V6u1BeLqGaUELS3JzPm/mmn6PK0tOWTN2tyG/ePJqa1z29NoaTn1R1i0xSBRYR5u6zka+i6fTfv3YPy4GKAzDa1oackhl8oB2uTV3tyMlob696thLBv6+9DE46G/KcpgCB+DSeemOZvx22IQCpczNOQzSNM0oIVbqhH5+YbGjP/9gCHg2HxTE5rlsVJp8QJn0uJ5L8IoDvnZXuLcWVbCIA2X4lA2VvoIOqwrkTaDgXeuVYJaG1q2CVRcGIRgenseWdNE0XWxIN+Eg2OjSGX0fssAoikJV9fBMYNisEbOwo8fewz39nfj4cFe/NOya7C1P3ztmVwKZp1+m8/HBywnl0FRTq6qfcnGsaC1BegWk/e587K48fFgFc1JGURDDgzTSHyHrvvDoEBZEo4fmAnARbWyGJ67CCYAx+wGdediWz+wrd/Dq9bl0ZKOOG1uK6pAyPmJtuHIw5/CWvsK2Dy8Sm/IZ5Flsv2c+b+j1gQEL82FlcoilQ6jnJlMGtOaU9AlD1I87NmdePSbOND8XgAr
UTA8AAZcNoHtQ/fCtJcCaEU2E0ZI9oyeE1yXvDetTVm0NOVQlJN6mXlobs762kIVHsbPDHoEXkIZC2UzchTdBfUwGDhyKDlx+QOD9sC2TXS0ZqE0rSYzDqC5rQFuNhUKaJqPH4AHghESHrOLkfmZU6ClJYfGoTIAF4ZpSBhOQyWR3Neb/ezIhEmfBI7pjBzQXQAAEx2tzf59LFumj/ww6OG9NAbLB3F3/01427oPAQC86ihcA5govz24Rl6GS9IwI4vEsmzP+pkZ/PaQQFRu6ybYOD+4jjuOt6CWcaRATe73Td3FbmnJ4eHuKm7ukv3aFgKc5zq/qen8UBJOCiGZNDLZLDiAHxQagMIBTKctmMX60D5tBgwrA2NICb5mE4/JtedaPPAAMhD6YW6a+Ii2YXp/+/l1CvZ35fzcdttteO9734sNGzbgC1/4AgAglUrFnBz1dyZz8vWJAIAxjrGxyVO+n4i5Wgrg2EgJlTpy8PuHk7M7OmkVw8NT09tJsmKl9m+9qofhYZGlND4sSMCcNGB4uACTh7ODShMcw059tc5yMTyplr3wBEESUqr7xsUAkWbUb4tBCFwODI0U0GiGZ9HCpZtA2l3gqICDTwwGTqMnJ4xS1QaXx3I9sa0wUcDwcAGvcx/CTSWKbeZSqFVjlpfAUD8lUy06s/YEpnmjvvNTlml6hHOMjZTw3xsvx2i1gpuOH8TBsVEUCmV85nwHd+07ikeH/4TDiBTv5PBhoq7+YewZEhBglTEMjof7y5iZQrHswBuOPwfDoMjnMxgbK8HzwvfMdDwU5Iqp2UyjWPV8/oNuL57FsCQVQNrNvILPnW/h7t4xGHQCvzoUbk9Z6z+ACFMem+A1HB+AQOtT3ASIC4+FB1ii8QwO9AxjVgNDf/kEZmcXiYmr7CIDBOrOzMXwcAHLnvY17Lld1Eka7d0Bl12OqObU3QcmMM2qyFvOMTQ0AUIICiXRLw3ugMNSFIbgOiselmXDG3kSUZmLxU0VDIDh9/eyOw6gFRafACAmPs4pRsrBva54DKBAaaKKYVZAWhWbBNAzOOZz4VKOG3pyzbl3YHD81/G2APjynpvxmyueJyd/oDn3z7ig/aP4/eF4OCqf+QTKlQtRnqhdMT5qZWqid7gCXkLo7Rkx0xi04hNnWaI1S8GwFxT7R0cwPFxAsSjeoVLFw+6hiA4UbwOIg3XN7dgxEpC85xTSWHX0UmBVpIAuKQPEgZP5C66ZuQJ9423oLligsDEyUkTR5egtciynFFXeAdcjcHjQ+vbMSkxUDmLP4CPoHxiBJccXjwCOt9Tf71znt7jPfilKlWB65RwYlCnss6wqnj7bwG3HPPSNO6H3pJ5OFucpHB3t8vdPdbaB9g2i8uKrURouoGc4ziEqkjz6jQCZftf8PRjPrELGBM7tNPDPd1cwKl/dnccLaCxSVLXwnAcDxLBxbGgQFrXxaK9EziLITzM7ghE6F5wHv9V5rUN2GVyGEMvVQuia/5qWz2d8pHsy+7txfn7wgx/g05/+NK6++mp87nOf89GdGTNmoK8vnMLa19eHbDaLxsYpEnETzJ1qGeFTNL2PM4/7BL+o9RY5+muMOYzxJ9TOxOQraVw7drU8IvY3G+G6DHtGt4f2pdyavB010kz9tiSQgkekc5YzTP/4ihxedTw/VKDsEbMVpDF4qW7rPgpgFjg42rh0hIy81lbR/V23CtdlyLij6PQG5GZxnhwrY4hdBgCwSAlO5KXnnPhwbsYeDy1h/XI+EP2p08qg08r42X0PDvTihgMiNXkeNcEjxTCpsxjMFo7cu7fehU6NhD5WCd+vUTMNxuv3W89jse+N0QmUJPLDq/NgleMp+wDQZk2EMvSZx7E0T7A034Ttw1X8sivcSb1I3/zuHhe/7ppqX1UhB40BxonvQADAd/bcAGJsxbHifrxywbtx2fRr/PTpsiLIMweuy0CtSBYOCHI8zLf6j20OgDSeaz4TZ7t/gOu6IMRA1VMtckBo
KpSNKI5FkY2IM7okTgZVxGElWKicH8bFzONquk6FyuuRtkno1wBAmXi+WWqCcA5OCHaPDGN1k8huSrluKHxISQEGKcFLCFGsKfTids03sIy9eP68Wfj94fgihNJReIzBrDFGBcfYAtfdAE4IRsw03naXi6K7Ej81t6PFFdXhX7vyxShEarEBQEnKTcwnDdjLi5hwHWzu7wVkIsHOwfi5qbMSXmoH5ufyIeeHgaK5Mis25nCZWAFSQYNdRh/3AFggsOG6DO+918HRCY6XTTsLt6WvBQqAm9oMGOLYXaVlaKc34/DEXlx/zz/hfXetBZYJLIoQ1/enMxCLNtcL+kGp8lL/sw2ODe0Etx0DxqrBe1J0J+AwAsBAg7UXE07gUAEiG/bA+GM4Pn4E0zKzYUtelGfb8FyGrz8af3YP5C7F3alVsMpAAxvE+sZRNM0MC4bhcgAAay5JREFUuGQXTqf4/RFxnM9vc+FZZ+OSzP7QMTy7Ee968HnhtkT6lLrTjNtoLkzDSK4XTE4wHBwfn/cLlMb+BAA4ODr+N59fp2JPec4PAPzoRz/CJz/5SbzqVa/Cl770pVCYa+PGjXjooYdC+z/wwAPYsGED6ClkvzxZxrSBpF6FiiMTwWC2rPmvy4636twfV1dHVpktMqVYH2AJCDJGMgSq22RaQITEX1xFYmzSynEo58fjHLZB8GxN68clYS7VnX0n1BXg8oLImDK1An6K8Kyuj7llGL4TJo67pNoFCyMAgPnW9lgbOdII4HUvJHKnWmJEkADl/OyfGPG3DRgtQMQBJBEC6ohWZHasGt43Sf11KmbuP+yHvQYmkh0fAKiyok+QB8LyDJQQMGs/bGsY53TI8g6RBWxtxyfu9G70xMAaDuKYIeTn4EQXjhXFIP3YiHz/pbilCnuZM4XInS6CCAA8ZeOqwq8TW9NPZZhI9n+1ElecHxIJrRJCYRsEz5sX3Jv8/GvQ0LEB01a8LtR+AD45lqqSKDL85mrhnFL15SCh90V87lDOryV4KYAg9vtt8Rg8zUPtTM9OdHyUvWSRgSVNRcxv/g5eMPfN6KiTt8A5Q8acZAFDSsjJ6uZH082YcEXx0CPpZgDAsJVJdHwAoCIXMuciaMTR0kSNsVFpzYj7srghHJZ2CRH3KPLetaaC/uMwBkrUgsqGxzmOyrH2lqZAAZ+wYLywtfFyOxVJG0u6z4FHANt8MNhPClcaJGhXofpm/3PGhJ8tqZc9OVY4BJVCbtCEbFCJuPfLdHciV1eq0vpoQvDg4dQav14bhRdTIH/5ovC4QZ3luCMXZKW5xMRQOt4xvAjBnUEJy9o+ZYDJ+1uh4UXdYHl5vKGnwZ663oG0Q4cO4brrrsOVV16Jt7zlLRgYGEB/fz/6+/sxPj6OV7/61di5cye+8IUv4MCBA7jxxhtxyy234E1vetPpbnpdC6dh1x5UxiUz/qx2gs9usjC/8a/nANV3fjTtG640N+L72zTtq6PWs6TfAsCm9ivlp/jkuG1EhNvyVjBgKkfi87u3YMKp4k0rTFw+dACAKLqn31flwBFwzPAG0NAZ8CiAIPNLpXMyr+ynxPvIDy+ByZBMW/l2XFH9dugYnGfhlyEA80skAIDnDzphUw6cruJcoFlwI6LPEkknrYbKkIh/1XzkERovdwHglwc9vP3OCt5z+xh+1xV3NEYJw9amDGi1vuCYw4uhbDsa/UyqaMo/iotniKudiv7U8+bRhIrlwLNXq+ekncOdG3IGK86V/me/ppTibMjnas0QiIguggiIdOb5XphzpsyRz1qhcEpcz4ALYqRDhTPFOcXfr19u4hJ57VZ+GRZd/CVMl84PB/fDAX7ynHT2PVkc2IugfkcnNLSKW7hq+lyfkwLTxBX9YoK9pbtLnHPbLpBKFWUjeMYfXvst1LO8TfAf5zXjy5v+Ac+cdS0IIZhZYx3DweFxF5T0h7Z/2Drgf/aQgSOVnfs1teEfTV8PADiSTubOAYHz08yBp3UKJ7zi
uYkyIBlblBihrBOZ6gxYkfHnwdY0ft0+F2DhCXpFvgXXzBJJCC5nIBKZGCm9BC/+Y7D40k9JnXlYnRfHKbgsVk5v2thC2K0roMaAi6o/QUoSIisewZuXxDXQbAo/Q3DcAW7v/jl+e/RG7B7dGeykSWGssSQFwxP8GV9rR1InHi9Z+NTWZGpEhZu+Btk4aQMi96rRJnUX1d9qfgl6zFmx7Q7CURXl/HCe951SVYC3NzMO11vo76ur+J9Oe8o7P7feeiscx8Gf/vQnXHTRRaH/Pv3pT2PJkiW4/vrrceedd+Kaa67Bz372M3z+85+Ppb8/1UxNUwQIBrUEG5PefN4S+zxjtnhk6zufeMTSrOGQAIiE4eRnuf+KpiCVt8Km1pGNGg5SSupWmJIp45kihZwZgYz7tFQwIqsJ+EBhFL/vOQyUKzBkW13LDq0ULf/6xPemHUZSlFAdl6qlzC0FyA8nWJuRL7Tio5AqaASp4DwDKlerDCzk5AXIT9hq6TpF03AJr02CL8tmNMhdPEJjVd5LLsf393k4MsHxULeDrz/mxlLmv7h2Jog3C4ZbmxgLAFWviDatdpB+DeqZcM797VHkJ5vQXYVjEXfYXKaWA9o5nLAgWsW9zP8crSRdloheWt54YoSdSN7a7EPysXOrZ+0jP/L8XCI/JIr8BE9XJZvovCYhgqcQQvgFQ/2wl6StOnVCSpyOhhZIpFRGRnqXJ0oizJu+5U4AwP58IPxnUctXQX/WwG7/PQEAd3Y4Qza4hhp9ExyHJ/aA8Y7Q9kXbt/qfq2hGSfLwBuzgnd2SnwUO4JMLrqh5jX1SXyvtMh9hqTKWiPwYNEjOcN01Iadc2Y0d62LbAPjSAg5j/rscTdsu6nIYSKMzlZP7ARzxkKZHCbhEZSxUkJZJFgUXvnK0LpxJCPHH8wkH+Mmh/8HNx76L3x77gb9Ps60Jd1bFMy6RFri8USsgK47568E0tvTXWG1wA4YrkCxOjMRFaGaSteuPcVFsWxXCkc3yEQDAWd7N/nfHjXmiedL5Odg4hFI1CJtRMnkVgSfDnvKcn7e+9a1461vfWnefSy65BJdccsmT1KK/jvloyiT7jUnkR8GkV82hmNdEcfbcBlQLT8yDrud0edrsFUV+/mn5dXj7g1ed1LloDT87JTWCGuk9sPkxVNIcJacHnAYyBXOyWhaR1ua+chHEdX0ugptOg+m1ZCITvdKw8P+WE5lbHQVnLjhzQCVEu6ihBe9fezkOHfkPf2BjpAwamaRWNV+JwaJYBY1Ui6HJkLkMIHFkL2mwBgDQcIp0LSExcGD/qCQppwhGqhwuoTGPo6cYHxCLLpCTfansubibVGB4HbH9wsZQZSVkTRPXb7gcBiVhFAiBw6MmK4dxFF0XWRmKmttAYoVoKx4DQzVMdoaYNNKGieoUC/72l0+E/lbIT0qG8wihmLfpEzj84EdgplpRPWctWE9y+GWUinuh+ryv8wMH1GxODHspk5ngOFHgGKlwTDjAsqt+gvHhR+E+Kle+xAGQApFhLyKRxmqN4rVu6mFwOohNbYGgn7twDl64ezd+Nz0nfqfVfhuxxZjQlpoOSgy8agnHpnv/jHWDR/CXloUoSUew9NJnJ56vVgiec4ZxZyS07UW9j2J2ZQxf6r8L327dhq2ZFTAqzQCAwbPWAUHmOkrU8s+t7KWLKH585DFwOurXOstNlJGSBN2i5yRKVxn0KNzUZpiVjRC9LzK2cBslGXLyrD0wnEAZXqnTlz0XBi1Akcx1q0Yc3Cs6FuDP/SLz8q1z341vHP0cUl7wnjsInFuLl5GlYhGzf4yjt9gIzgmasAujWI1rl4jfqUULB8B4GwzSL4j+0s5pPweHJUXJ8spypjZQ4sv90h+KVHiwJI75nLlCSuLohP6eRUjfCePwm1eYePs9ssRLjXeO8xRcNhcmPYA5mXnYMSrQsNeU3odx2o45bAvusl4BIIMRowlZBMiPQ5lEyGWz+allYf+17SmP/Pz/
1RQ3ZTJ1Z5XU0ygJkJQQrGkzkLP/to8uY2oDAA8jPxYNJo70FPg+QHiFrJtCfihxkKH70Jl2wI0h6OxaEkIZguuuMA/wAiKmy4Fv7wlqGxUcmW0l0QUSqbukdH6Gj9wKJjVSVA2wnGEjbyvuibhej1ZgRlJ9t/e9CEzGuF142KyFEslRMWDGkJ8pTuqAFU1KEr93F6DgivO0yPnEjYS9OOd47wPxMNfvjgT7vG/HvaDuAtBIaY6EM6IsEb65uUbMyoQRNB/tAYfSS9wzPoKX3v97H2lK4jfe2X8cXCsM2pwSqMUP93lIUQPRYrFJQogAMFA5gePFg/7fFd/5CfZJNwpki3MPMA3wdLJj2WWsF0KEKuylwotw4BT7YsiPHkZQslN/PsHw+jsc/PO9Dn5wuAl9qTUAVF8SqIAi+Kt/nYSQJaPD4MYgQIA2Owjd8YYcWiS8VPJcQFsE/XjhDgDAvJyY8NMmwaZSN7LMwYKSWFBQAEglX3/U+TGUrgsY/mfPB0PfzZWJEGuP7sOsyqBMQBD7j0XUoscSuD4L8xTMOgxujPjbGvcegi3RmT/3HqsxQbngVBM/04nN3IRZChbCzAj0nAiIj3bf0X8M+yfuTDx61CgyvrM/61dCB80lzO+P9/LD4HKhYqKKBhnWYRy4YdcaFCpv9LWzpmelbpR2o4cmfiSOyebJLR7yGvIzYMu+winG2SX46oECPM5BPA+9dgP6quKaNk2juHpOhF/ohRG+Xw3FUZdp0SE8ITllpPAFjBSux0T5XVjcsAlMiXHyY1jiPYwU92AZIpS8JXOuuH7Zd6qGF0LMKB3DrpGHY+d4su2M83OaTC3SJ3N+FISenpxW81e1F80KSH/1OD9TNZrw21VN52J+w4rQNmsSvyDGU3I9H873IshH0Q2HGKLOT6PGAXIrIwCCwV5xPWate4cvPghSwWLvYXSmg9DChJOC5aMBDF2aq6MIlzSSXh595vpfVuoXyFoTcjtFEjZINC6DKjngEQpSDRCAkhcPPQHAYFnVIeI4UBgFdZPDH2utzaG/K15tlFFdjse5NnmKD04EQQkdk3lC9ZtMwDLvx8YOce+ypnJ0otdeRTr17dhxAOBYQXBPSs++HKWcCFPo74zvfEunhhOOV5fe73//j1pa9ARpBZM8MF3heaznPiDC+clPD8ihSeuRm48wnCgFDhOjygFRyI84T9lz0USj6E/wd14j/XPL9MNeDEC1GIRLDUv01XkNeqaQuI9vPfYgFjVwvGtt7cGkPcJtfeEiUaDSlaHhxsynRHu8CjaOBaHpR3KyiKh8f4Yq4c43aqZx1WC4MG1SuCVFDWRltt60dDbmjJl0LyjthR4urXKN78KzIIp8a5wAIqHknNRTm5nOoS29O96ABKswww+hG0z83qMcjszyMzwOKOQHZaRpeNHhsfl+RqhRZ3zjXKFQBjZ2UCzOE6xrI8i3hQPoRQ9wmAcwhmOa/MTSJuLXotPOHnwy9+N4grqyQQjStsblihYt5YDLBEm56p4Lm4oxw+IlWAgQIyqfiXoyCvkptTeAa8dsTH8Ox4uHat+IJ8nOOD+nyZhPxq1vKtskVk7gb2hfXHcxGrTBNkB+Tt0DS+L8vHPl52HT8IowCZbV7dkz5mvHJCDMgynv5U/3ewA3QZ35sIpXw6gI3heFUuMNOz+ZluW+Q1QtihWiKSc3RdhtX/RCMBLI/F/0zOvxvEW3hY7jMT/REz+i4uXfbS/At+aKQcLwwpOa7vxYhPorXQCwrPuxeppGfKyjGfPONQZycl4dtLL4r8ps7B0Rz2qsBrL8x2MMPz/o4eCEUiNK7oHPSG3Fonzw3Z6xbSh7ydpXQdiLoygLTFLWBFpdgZf8+Rief9thdEko/lPnhJETbvbAzdyDmfkb8IzZQgfkRBGoVJvjbSMODHNH8Ftthfrro6KWn7t2OQrTBJKlIz8KteSa87OIbcXPH/8MbnqmjStnG2iQTftp6iMYKok+o94/kepu
h8JebQuei1RDQAa1asSMHNlOy3gYx6WSuUEZZmYW+OGvzcN9MKwHwz/UpBwaDK3vWiYyjPvgqLvtUXGejmYME/Fcz2l7WqwdK4v9+MJGgotnhN/F33d34WOPPoC7+4/D0FSWAWBGVhyvIonZaetOdOSvxM/3/xLTNG2vrozSBxJt3hWp2XVL21L8sS2cup20oMtWHCyV2j77JkawYyQsY9KU/YAkSgZI4Hh1xP/+bY3zAYi0di+1M9aF5mVFiFqUxwmrfEeNS8f0uq0U7sTlsIpX471LXgImM8DKhoNHc53YU30nqq5AOyxegR2RPqi6m+BJh+w3x/ejp1TA5oE/x88n0aMVzSXMyBJ8/nwLH9tooUoV8pMDZFkRj3PAY3DkuLo4T2AbJJSlCwCEBWE9ZvagUot+kH1M6CABoJ54DxvZiGyYDg1VkTLOBgBklXyItEZ6LwBgR1qEaBlhcJbMR3HFXDie+M2m6TfDNI6jUmMseTLtjPNzmky9HpMhPz7s/iQ+KX2VCQQThh4PXtsiHIvLp79gSsecmZkf+vtcOThH4/Vzs/WFKRdF0lrhhvVHjOoyGE44lZLKlzqK/BBCYNrieNWiGPR950cbvzw5KBFUYJhZVLwiCHRhMnVA8WGfvQA/yQeChaYbdn6sEE+E+jwEYQztKf3v+INXKd+NFvFXxo81TMOtdBre96AYKAtuAuwj7Yf7PPypR01yyfsdoseC7CVDCJttGbwjcV/Vhzk4fn3ssL/dcOeBejNAvUAorjWV3N8tSnyODgCw8jpEr53Tgh/CFBb008FKDyYcOVHL260fT2VpcRZojwCyT5eFAzIhF+w9xmLc3auIsUGqe+fSV4TCXiSSRdZUg6KljkGICybbbBGgwWoC0RTK+yMhCj38MOoEat/cNEEAZOSjqx4WCMyh/Ki/T17TNiJFDbVLcNCu378Tm4f78LndW3DXUBgNUc82ivwRJzm7iNcgkt/UsSK2zU5wfkwOZHYHGWS/Oh7WnCGkhKBfyGytSsD5MlVWXYJ0RsnlfvjKA/frVNU0DTVSaNK40Qy3KsJqFcPFZxZcgoobELnTKIAXDiNqZYhn++jYAG48tAvf2Pfx2D6KN2RH4KEKC8Ya6sqML88D4RyORMLV/LCoKeL8hKQOGCo19NYWNDT5YWYitZVUvUV1TmEGhqsiizKqZ5Xmo/Is4pecMBjd/ShptfQaLMW5Ov0ZX2ecn9NkykGfHPkR//6tkJ9UNHUXQGPE+YlyfgDgzUs+inet+AKeO/sNUzpPS6oTH1pzAz667tv4x2XX4ZUL3wMgjgi9bUk4I+Q188KOzMqmNpzdIlaZHueg4xNaLR+AaBOtMgPK+Ynz+42UcH5KI6KgoGmEkR+PcT+Nk5AyJlgJj408hObcu2X79ZCO1LUgFhxNJbUpIkjYaAXfWZSGQnkEDGu1AWxFvi3WZqUFkreTneKSy/1+054GPnGuhesuDaem9pcJiJcHlXymV3Zvx5dWlpGxf4K2hpdglIzjmXMpXrvsKPKZ6wCgJvKjJhSXMeybqK/cWoqsFpXZhISQGs4NEKnwTKxdgH0HPPvRkKsWRQnH3REAQcHIpLAXZ1V4bhHqWRFOgASyca8cmx2J2hlwMG35q0Pctah+0NNmJ7+kgUipA5dLQULqosFsAtUmaRIhuDOZ+QgAByd2wZHFVFXxzYx0qsbkaYsbAwfD1trmzZ0ZHDQSNvaiudu0BDd1H86fN4BvXZ4KSmdEJystxMoAUHkcZsYn/lqmQmlRs0cSNG58c/DafSrbVJzTpi4+v+4i/PeGy1By5TtO4tDn+nbqcwY9zkPnTxvAR842MUMDOdzUI8lNkBo3DBy9dngxNtPbi445l8V/ggb/032D3XB4/L1WiRX6ezDhOjhQ7AejCgETfcST/dKV/VGNA3MaONzUA3DtbUkNR5kxlD0XA5Xw85yZyYGZ4RJH85z90jkPxivGO7FvVLRhsfswsq2rsYy+HKuPXI4W
JuonglBUkUaVuDiU6cOu0QCtnZGVmWtu8jjwZNoZ5+c0GUNYsbiW+cjPVDmyJ2kxJAVCUVm3gPMTvJUpI4OVzefATHAoatm8hqWYlV2I9a0XIivr3uhcoAUNK5ExUpifC+LYHek4ErRBOT9VB5lf3AJTI4uShARG3/kx4ktzhfwMHvoNAMCSzo+Cjx/oCyaHCq3gvVuuwdHiflAqNHk8DhR9URvRDjuyosxH6rY1mkE7LGr46bfCOL61/6P+izkvG9YqIYCfBdZokcR+8eo/O9g1OgIAKHoVnNVhYEYu/KpvO7EAZuUCPxa/cfw4FqQqaEh/C5SOIE0ysCjBqtYCKBXH+mnXV+MnQxD2KnhxgrVunBTxjm06yTTY36JGjDOjssBMcxDE2iszpeKoWEdKrEwnnBE8NsRQlr5M6Hha333s5uf7CBAB8cXidLutrwmV4iAqVcG/StkNINQMOdBRDlytsNfNR8Q9drz1cCGyySziIGc2+mEvIAE10Ryjb++/Dl99/H1iv4jz85kFMpSTFfdreiYsW8DatIymyHjjJhCtuTGGu/o3o8F2fWQ2KmmhH6VgEJ/Qa9Ewr6eeffDRuxO3p0Z1Um4EySDArEKzbINo+yODM7Ei34r5uTy+OyKulZN4X+xIB1mKjIeRn84MwVntFBdN155pjZRsLvWmvASNKgtlpPPzYtuj19PvvS7hG/H80hL5qTIPL7//D3A48zXAlPyFcn4cPwlFHMNlDNwYAadJzgVB2fPw3u134/UP/UkLfct+4Nc9E+dv5MOgKMckNx6V9b06+GEYVg4t6RVoLnUiy1yoWopF0oQfzT2Bf191E3rLgX4ZLQiHvv/E1Mjmf0s74/ycBhMZMEH2Vj1T/LRaA+sTtXcuWY9ljS1455L1WN7YghfOXhRPgU9Afv5aRkMhoJT8V1cSjp9ThYk8WcPtwtH6q83ZrnjhkpCf6OrdlI6fmg9PFIIBbswKJipVhR4IMvKU89M2PhtpuUonnOOctetD51ioOZwmIchozqaaDFV5mqd3hgfS1flOX/03bwOrWymWNoWfl8eBP3aLMEnBFYPRgmYDGztrPz+TefCc4Pqen3ouAGBR46qav1Gm92FunKizp5hsXPtR2OYomCUytHJkCyxqocmGH2rTbVnjPYEisrYKbU/NwtUzX4mMKQs9eiXc3xtM5mntceuOO2cOOJNZV5z4WXJvXRlGIXt7tsKV57Nl5l/jtIAk77lx6P6Vi2vz4rimivusWRfAIFbI+WGaYCAQEEab6B8BALvHpKaOzMRcVpIEUzWhy1PH1NT1sSOC/NTTFxqolP2xoFBnpT4qZ16CKijCDsM/N/Qk/QQAUPTKidstXWaDjsa+jyJ+Zc1nbFQlFbTfvXQRxdkdBOd2Ek0hnsFlDhrS/41pGRevXiruWWicJRwLmgVBfU15X3B+LvqbRzjSXrg+ogkH7QtfgBctoFiQKEgbXJtn7dKOCX8hosK1Q5Xg/vhZkdIRYa5yfiTyoyUdiLaHF2BLmjyAFFHyXHQVx8EBPDIaOCUTruOXXhGjbgnTvUMC+eHJfXpaykPn0lcAtmhTihkg0oFykEJfqiqvTYyxBuEwJL2g7BVimmNPtp1xfk6DMXhQt36ytOc9Uhvlb8X5mZVtwBfXX4wrp8/FF9ZfjDcsiE92qkDdE8n2qmW6jL8tNX90TkySJo4PXTMPv5iRwxvOzoDbj8X2U3ZB9VYAccKzaED4xVYhNAXmlCR3JmP/HAU9ddqw/dVWSQ6+CxvEirB1fCFsT0xQ1684D9OWLA6dY7aWKt5dLiKvIUFUpsk6PuKXxqu10J8tdUkIODKG0Pn53Hnx6zohC8mqCdSkBB89xw6VYdDt/mn70XciIFq3mu2yPZOT3EMOPGFwsrf45EndFLLBzWPoaH4UIC4yhocm4w6Y1AIhBO9ea4aI1s+aS3HJtOWgUjV3TUsQFn3urK/j6NgbwZlAfipeMVzVXGtXVJnZc5TzSnxP
9xlzDPz3jG8gxQU0Pzg6hCoRE13nPKEobWfrywK8ZJGBXz3Dxqc37ai5T94YxLNmvQSL86t9p040pQpK9dADw9z0fuRoOPyikJ+Xy9hcWU7YSnpGPbMJ18FX9m7HV80JVGsMM0nIj7IK8/zFR62QJxA4PxnPASVOSJJgCT+BWeXAEfHMrtD1xdqzYA4mLO1chGF6Y3doH64yrwzBB/L6hpD56c2A68KR4ymnIiNzfrYRr1hs4t83WDCo7vwIxeqM/Rt86txRbOwIc2cA4E1DDF/aNA2/vtjDl3fdBZgC1VJ1rRhhMCMCm7nV78TXuvbhollFfOkCK6gnFrQ+uHozuK40vwGOt0Z89vWp9PdKODOUtQOcgJflOEEV8iNDz74zG27XP691ASL6hH9+7WW5s/+437Y06cJ083o8lJ+Q2YjJnefSi/8ZDR3rwWUYP+WZfmatRyw4MntRD+fZkjPnEGCif0vicZ8sO+P8nAZjnAVp0HWQH73Cb74GmfJJsb8h8pO3Aki+NSVCAnr2U7LzI7aVPA9fWdQMAPASqsIra+ZitRElPIttkUmxImLrii+sHBuC+CrfiYzdisBZpQSOvFVmOq5vYkZW3zMzQSkAE+GV7o27PaxtbpdtAEZLEtYHCQ2Oa1qjaJ06b7iR6RpRyltm78Knq1/w/za0EGHWaEj6SbBvYh9OIr4GA7LSkVKFPUuuVgFea3KzTTDujPjODyGNPpDxhR0e7jjBcHTs+QCAMiuFUurz2uOOPnvuI3MB8gMAhplFVhI3Hy82+9tbmwIyMjUFMSQ/LRAejNoN+z4Z26Y0fmwqM+KIEUJ+hOmTFkOTFe8/ivOTkvXdKgYBpxQq6VChqfcPdOOPvUfwW6OCnfkUuB3v//WQn4pXe+LTbdQUHT/NqiDwQokRv0w7KGqZakq8lKMSO/T0dBY8ncIPFt8X2p62VFaWRFm0WlUAUKUGzINHYe4/DNcn9CqnP/yuGZrz48i+Z2gk9tXae6QQKFMSsA0ZJuMIkJ+KJpzaxHpww4iBW3oO41933CObGn0PeOLnYxPz4XqrAQTIj+6Y6urvhLWCPiwWKlHOj5dAJs1YEz66XNH4bXHdLHE+LpEeRiDLsCSP+/6cZAfOj0J3PVhByrvUuLJYCSlJkq5QoPfx7yUe98myM87PabBQ2KvO4NKtKfQuzk8+CP2t7K+h81PLWlId+LdV/403LP4QXjD3HwCEtXySJlYlEHbc1SBnbZCZ2dSDT2w08bplBj51Vhl5PiTbH5/5o+KLDU3zAQQTcMlV+8VXvpfPDN8P1e6+lAFHcSDshMkLQMYIzvuGBSvxnqVnoc34MYwIz+DAGMeKfCuuW3MB/mfDlRgpi4m3LReusfSBsyLKwz55lmGkGtyndE2hEddPqQUAovGUXrtIcE2iXBJlOocJANY2tSOpYKn+jBR6R+UAfMm0QP5+eUvQxmfOpSh7RR9Or/IGPwtFWX9pFTg3UPXKmJA+8BUzqS8MCoTDmxXC4frZXmFxSGpm/RTe42UxaBtwMZ6djbLkNC2/8ntYeNGX0DgtKPMStYIbD9d4KTFhLcwclMc1QEjY+QhPlgyXTbsS18wRdQoVosOl45iWzk+ZEvBM2kdoFVpzsBC0Yezyc1H4h1fE2pSE/ChnvOx5NVXgy8+6DOVnXYbCG16CgXPFpJ3xHOToNnCtD/faFIuagveEG71wU5vhpoO0/u+ceyU+sfo8fHHdxeC2icP5HrQbP0CGCNE80+pDU/Zf0drwGgCA1yLCxkpt3VGZfIUSXDWeyvsa1QXTnR8ms1hNzTFe0kSxvPFROOk7/KrpSj/LkM4Wo+L+jD3nMjjyt9Ot/8Jry/+GXfJVK9Xgv3HCkSNC4C/aj5WlZcxbd0z/6+xzYSvCO7fBxsQ9rmqcH8Y5jhWDe++k74ZnHsCSjv1IG/Gxz2EMJbeAfWMqwy8IeynTkZ+r5wTbX7KQ+k4at6Uzzgy/Zl37in/wnfHlBRHuzWIM
Gen8lEmQRXy67IzzcxqMwYPDxUqyFpWn4HC8817xAuVt1ByEngzzO+nfwPkBgMX5NTiv4ypkTUHcfHwsUG9NQsaUSusAD6+Slc3MD2FNG8Xz5xtY3qITGOPHijo/6bRM4/SRH5WmHEZ+Gq0WtEW0wFLyVN+Y3wRXPtha9dPWNgUlJRosG1dMm4MUifNlVP9YkW/Dxx4yMFoRg0ev04OjxSArJl5xWw3oHNfedwt6i7IGVI0oFolmx2jOWUaS02NlBKSljPBB37BwZXLKMw8ckAmfXyR5LXaQ/dKZCa6lwSKwaRqGRH4eGuqN1J0TNjB+Cyqs5BcCXteW/L5UCMc3pwPfl7I0UeSHmhlkpPNznysEDB06in/adidedv8fwDiHlWlHY+eGxOMDwN29NyVuV+nXpizlkBxS1K6NcHSmm3HxNMG/YtwD4yzI9pKTsksJ3ExKfAeB/ByYGMVNJwIhuWpHK3hjgDAqS1KWbpZo00ODvTXL0jjrVsBZtwJsWjuGOwUamWMuDIyFQp47Rwcxs0NLoSIQ5F0aLCbaUxlsaOlEk50CpNNtk16kiODyFT0HtrkdhlR1Znnp/Mh75fNe/nSv1kLRD6LZbMrpZtp2k4QRsYw1BtBywD1yxDhjGkrET1xPoanZ/00rvQVNvL5uEAA0WUAjvV+2sL7zoxzTdjuNRQ1NWCtVzAm34Um0RUd+rt+/E5/drYmT0gKYvQ9ZkyKdkNVbcCv48PZr8S87JJcsoRqhcH5Ee1Zpi5L5jVq/kA6mQH7EvUq3r/d7cmtVPK8sCsjKbLUy/dsspk/Gzjg/p8EYZ77eR8FNXiH0lYIX49lzn2R556j9DZGfJBvX4tLZhBXL6qak9O/AwinO+u8TJsTINXUsFDWPAs6POk4Y+Xnbsk9iSKO1XDidImvGJ5KYIrW0tyxajaWNzfiXZcEk+i8r/1P7nbgHG9rF78cdYFgt/MgoOB0IZWvELospVWoXLufYPzYCIHxvOEqwjM1otreGqnUvGG8JGNcALAnt10pNjppw+OLOD2WtEhUCBqri5hkyK0cPPVw6k2JRnuAFC0QbnjHrFVjSYGNaSin0Jk8aZa/kk8/zdrLz0yfnuaIqehrJ9jLMLFKIonwBWlB0J78HXRNiJZ3PfAgGPQ6CotBKkpW6x6viXivnJ0Me9X/LtWzFZfkGrMi3hiZnjzsBx0ILi5cbs37BS0oMHC6EuSZx5V9hBS+4niUNzfjwynM1xIEnLrretuxTob/V+9rguqJMjRF2pM+f4QrRQSueCfbGCMdQ8ZkA+PyRSkQktGgqpEGWBvF5JPo4Ka6htxx+loZGeFZmRkKirkJtJbJGlPMjJ3YmRf8m/FtXQhouJmjgXAZJG8F7xOgA0mbJV/Wu1Y8zMoyonoMaQ5q9gPTsyMK0PueHAIfkM1fZrcpShgGT0thCbNwpYrQ6BKal4Yv/h9RBofp/xiR4xhyRYBFaXMjno3N+HAYf+fFkFpuNCjIypOZSwD1963kAfweFTf//aBwcFbYQAPC0aXMS91FCbdMzwEsXnV7npzgksxKegMLzqVo+gfPQYqcxP9uILg350B2blAanhVOT6yM/6fwCpFINAJx42Evj/Hxwzf9iTm4xqixwXN+7zsRX9sbvTy3kpzOdxZfWXxLatqzpLFw546X4U/f/YWPnA7i/52I80MfgcY4bd4sOYVHgrNlduHeggrE6EzHhYrWlskRGqxUgJWo9+fsgg39c3YeHem7Ffg3Yeu8jFwMr9NCjLABbRxRuY0snNg9LvhRjoRCXbhe2z8DO0QGfeGmSijxHcO9aUwRfOD+YkBqtZnx03ZcBCB7L57bUcH7ciq8k3RjhyHUVxvCLhqswz9sGQLSTgwv+SCTsZfHB0G+5Vh9qzK2G1c+lHS8exB+O/QAOr2LbkEjhTlkPIWU9BADweA5F760AGMpMhCaU89Ni3AqLDWKMXQq9mO0X118IQJYykOYyF5YpwnG25muPn7USnB/x
j1uJaBexBHIxAIxJBG5JQzO+fJboj73VIvaNj+C3xw9hbQQt2tR+Jc5qvTjxGA2u4owcBhBoC3FShJsJ83iUXTNrYXiD5vxkDBvDDBisDKFDbi6yVfhxWrx3Wc/FiAGUDWBvfgCjfF3oikVbwofXw17BtuCcR4vj2FoSiwq7Ip0N6fzYckHieNMxPPFV/Ol4N4AloGQMaQbcmT3XP06VMXxt/05wagNMvIteejNsasIjHAReyNHVLWUQjDoVfGmP0OpRY0iT76ja6EY/VgOodErpBBrweZrozWDIYYQ9U7ZbOtmGgXGNFFf0HLhoD06ssr2k2GHV3YBM6VJ4ciwxCPDWlQnUAZl5lmIGIBczjsc150e8yyZc2EychhOgnCAV8GTaGeTnNBjjno/81HJ+K7KPpuoVg3kSTE9HpBFF27+VLWlo9j+32snnzEa0czgJCLO2hlqAGD7Z1dZKEfhfa3BweexQoJfBhcChXx9MQ35aUyLj5+wO8WxapH+WhPLUQn5qmcp4Mw0xADMOPDbEcW9PkIWmODZjTsDlKXsuOElCgsSAOVoR+0brKdk0BcsM3+O0Z4ZmDSVBUGXJqckAcHFHcG9bU2nMysSf2/PnU3Smw1UU1UrRSOBjJdm0dBa1Vsw9xUBCoD0dfm+u378TWzOrcVfmKn8bg0B+1OQGAFamDRbC6cu6ZsyYEyUoC/vTif/DQ4O3+45P1NRqmsDD6mZBlNYdPnUfIAnB0MKshob8uNwBKAU3BFswLb30sm0F2mGgMeenFvKjrkdXddcJ+AcLYacpKVSn+mGnvG22KRw+aojFSV8EfVFhtY5UJrYgYVrBVRWK5Zq8wSi7AntlFlFnRWUT2fjN3F24uUMTRJWH3djaCd0CNXLRxQ1ihuQ2PrAzCJ1Zjge4HoirnJ/g2btsObb3XyLbOQHbo3gwsz50rt91d/n6PCrEpdYeooZg8jNJGcC9/SfQXRZjWmtKvEsdBalXxi084IlQldL5MWmAkBHi+AkCAPyQV0cqrJlW8hyUWFDxnvqq9WL/QvmNmNAcylpTEZsjhGUF8iPuUVUna0snz6RCmyktv+JNyRzCJ8vOID+nwfRYrwoDRC2Q6H8yWlTbVFYMAGRbltbZ869n1629AD84vBvnt81A1kzuoq9fsNLPqACA1yycj+8feACcVGHSQOWZEIIll/8vnFI/si0r4weKEp610024ItwEAC9f8BpU2E6saj7Xz1C7ZAZFo0X81GwScWUpyKQ6TlFTyrwW3QFAlMjo0YjvjANNcqLaMz4MzkVoYtSpwk1tg1m+KCz0KImfivQc7U82TcE2w4NiipmoaM5PzhSExaI7AcZZrEjtcKUPKxs5Xjx7OqalMmixUljb3IJuicI8ey5FzgJevNAAJeHJqMPaiwln6s7PglweiGjJKOstBjyqpkjYa5fkkQ0a0zCDGyDEQ8EAKDfAB0eAebMBQpBpXgaLh4u66uTt0RrOT0/pSGzbB9d8Hdc98lYAwQSQohZePv8dAMKOhJo0HKsHhDJk7QKAy+R+FJQYYNyDyxyU3AK8rIPmcQMpxlE2gEHuYsL1hF4MaIj4CgDHShN+X9HtgAyd6s7POW1BZlsg4ClMd9iGq2WMOVUMy761crQR980B0tYfcNXMK3HH0Dh6q0E4BgD+ZdlZOKd1Oh4ZGcC8XCM87qLilXy+X3nFAkBm9hOutJ1E28S1ic9vWbgKcx55DNsXCeeobLhg8v17Ue+jWDinEYcWzsDzZ4aRJSPUd2mM7zOiPV+Lc6FkLZ3jNPXA6IBIN9eMkCpmDC8GEmoEc2MIbuphbXGmMsy8mmEfm4YFQ9+99CwAQKusm0dYDkUZAlOhPosS3+GlcH2JCyBQ7P/gynOwfbgff+47hl1jQyh5bgh9ytM7MIFLkDY6wDmBy+aH2mXUWMexOTNgvfVlMMb+COyTyI/m/KjnZ/AKSmMHkbaAkgHYsy9KPuCTZGecn9Nggpgoen66xuRe9ZR0
+5PVqmRjmojXk4X8ZAwTb164uu4+M4bDg/v5bdPxvS6RHWJFHJpM00JkmiLwurTS8J7Q3wYlyJlAwQVGKtyP62/q2IiW1DmhfSkhPvoDxAmMrMbKrp4p5OeR0Ttg0w+iygj+cCS8+lYT1dbhfvzs2H68dM4SjDtVgJZh231wqkHIIWOI9dyonKCihGeLppCi4edqcBoih+dMGUIDQ9EdR4MVICw7h+/Df+/+QOj3RecVyFlvglrZPm0WxYJ80JHnZRtxWIYsTYiJcapK4YSIemZJ+mh7hoUGUFT0MWr93qvRYXwH3+8EckPHcOkf7wHpOo7yi64GIQSpKHlcC+F9t+txbGoLz3LjzggOTsR1pubmlsGmaYmYiRufNVPIWcKZTER+iAdudsOKiG9axEaFl1D0xvGJnW9AccMYPr3lGUh70zBqAf96XJw/Q56BR8ZnYsA5HPr9L47tR6Np4cVzlvjb7uw7hpu7D8m2BNdsEIKr58zHLUe7sG0kHOpUDtv+iRG8Z9tdoWBas8Nx1uBMbGs7gQVNx/HTHnHffn5M6PHMzTbi8k4R5j+/XSxQrtv5FnQVduNzG36GllQnthUe0I6okB/VN4L7dcW0uejzlC6VBY8weNKxWVAawmVowAWR0jjR6wRojO+jm804iOP4dcxMQsGNQSDq/MCByZKzOgGI30g7XjqKdgPwWBFAch1D2whQnGfPmI92idg0uQr5yWPcEwiqSyjAFfKjHCYXLVYTBmS3VUjx9HQOV8/IocG0sWtsCGXP81G1RnovDKniPeG0wMW7oNfOAwCjznhmLJ0He3eLn+1VCTk/4vnxch/K1QPItALDAG4+8UOsar2g5jH/1nYm7HUaTGRPSaGuGpwQlW30ZFZzTzKmXjhiJiokny7L9g37n18+ZwlmZhpwdmsnZucacX57whKshhWHH/c/z97wrwCAjKqUXg6A6cbaY6RvV9Tgb52MrWoOeAMZUw0k4UFnY2sgtHdIrtxH5arQimR1rMg3AwBGZNhL5/xQ635wAOe0Py3WDm92cA9NavrIjMPCyMfRQrjwpGjT49jUSTEjK7Ku5jaEnYlnTJ+HVjuFi9tngkgUJ1rjrZ6RSbgCT0+osTVNC7e5aPMH/a8vF2nH1t4gM2pu5aHIr100J/B8lJ0odiVu1xEyFfbSHXNdiTlFjoV+m4ssitQkPVDuRsEdAyfAsdwIntMbDimV+GoMOK2J7dkzPhz6W0dkJmrwxzKR5b5qc1dhLMYiamxshDFLvAPViPKxOFZ8/OgqCHL41qG7AAAnyoHTxrk4hnpWy0aCfm9RClty7ji3wQj3kR8KHlOyVqY7PxwEHelwKFxVfQeA5RPS8XEV346CGScQD1c5qIcjbBwOwsWeVPmO6zsFljMDFEfPpFx4zgL/8xgTKGdV3lODcBSl80NRxgXtm5AiB5AzJrChJUBEgeA5lFmA/DRZecxtCO5Z2XlWrF0zc/XfO7FwE20oSRkSygNVdkM6+CtKQIvZggs74+d4Mu2M83MajIH7Eu3JAnFBttFJUkb+6uaLwZm1Vzanw1LlYHC9oH0mDELw6XUX4BfPeB6WNyUP/pNZ6zzxMiqHc+eQGN6zZqAtVM+WNbbgBYUnxtGanpmLxY1C6TVjinvfHUk+mpVpwD8uXgtAZISU3AL+dOJm0faIM92eEs/tLyeO4oeHdqOi6c9Y9l9QZWWsa70w9Bt30dxYx1MrfhbJ4kriAe0d244yfxDXX2zjYxuFsq5uz5u1EN/b9Ay8b8VGMMSzvSaz8NodeOfaQAG50QKunB13pKL3xUOz/3kgVcD/LnsQD/b/CQDQOm12aN9/Xb4On1h9PgDBb/nh4d24byBQ51WozyL53JJMTTI6B0wPe9GIInY+4myp+6MrLZcMF4Z1N2ZUamf9zUgH/J2og+OEauKF7dxOgcwcLboY9S6Dyxsx4j0NN/fOwUODPbEMLACwXvocWI3NAICfdP1X7PuMUdvBfaD/j/jY
9tfhdye+72/zuAoVmVg1NB1vb3yX/51JKCw/Y8uCS5lf5sPgrGaMhkZ6z8vm/1Poe8WL+bfDE8h6HKnb7w+QH2oAtIJrV4YJ8YQ4sfpXun3hsWB/7hdJrp08kLdFXS8gXHja3LQWGSLI+sfwbBxLG3Dl93f2H/VdsoUNC7AwvxJtxq9xdv6+GM9OOVQ68vOc2a/0kwpqGY9qUnGOHx/Zg6v/8mt89OF7kTLSPk/r4LgoB5JmwCOmWFwp52d5ieBTa76NizqfXfd8f2s74/ycBhOigUrkrYbzI/vZaeY7+2EvSmuvfE+HWaVgsqhFip6KNXYGoSzFh7DlZH13t9T1OInoldncNPlOk1jaEINVyoivnv3zkEAL5OZj38HOEREC6MyFq6q32sFz+37XbjwweKf/N8U4ZmUXIGrmgTh/RSEzXkSYLGmFDwA/67q+Ztt18/jJOz9UQ35sA5ilrdbHa8wpUW2gKg9Cg7+d+zjumHEI39ovUri/4obLkcxvSKNBEuxHnCp+fGQvrnv8Yf/73pIoScG4h0unCbVplRG1vlXwGqalRdhVd37yVnPoPA0sqLU0XXNaxO+kPopWYHRHazdunrsbQ+nwZKzMJDS06o+StfV7cl7bjNB3Shm54HEU+Nno8/4BRb4eY66FT+x6KEaoBkR4pdnuiG1XFuXE6Xa4sAcnSodC24im2p5xc3DSqkaU4NLR2QIJ4tyGaxvwiIb81HJ+QsgPRYPZHPpe3RO7LO6VefAIaI+QJkjJe+LFdKZcQC4OSSQe2+4KLf9zLPE8s1K40UhUQBezQoMZZG5FkdwsF+MeZe341YwGVCUav3ci0EZrtBphSaQwSZ4i66s9c9/5SRuGKP+R2CqAk7HYM+8uF/DDw4I2cMvRLpTcINV9/7jYbnJghAoU2ZZtBzFg2o043fbUiWP8P2SMe5MiP2rCPd3OD5cvT1JpiNNptFDCjY/3YmTTWjTXUFGeis0/75Po3vUtNM++3N+mkJ8hOa/ryqaTWW7mdODwCADgQyvOqb9zDVPODyEjAJI1jdQk6nCG48UjqHIB38/Ll7E8R3HTYTFAz8pm8bE1m/CxR4Sibl+1ApL+OaqYiRwpYlY2mQsVNRXuYFHnJ4L8vHz+O/CTrq+gv3x8SsfVtWmmaib14MhmvG+9icX5JUCd8ibiPOKFonAFB0HWZzKJia1tYXHJMgzovX1uQyqkkq2svzIBlw3i0ISY0FY2bcQzZ12LFU0bsaLpbADifixv2oAyW4Rd+/aGnJ+WVCfes/LLOFrYh3FnFJf/ror/ay9g2vo1uGz+ktC5lHNY0ZCfg41D8pripVcA4MtnXYzOVBaUENx04hAOF8fBOMeoU4FJqI/8LGtsweWdYbTLngRy3jc+EtuWMgxcPfOVuKv3JhTcUbxsVjd+1zvXR5yeF01rr2GNTgrjVgVCK0osFNNuFpW0BZQDx59dfi6wWYTF3HwWfECOqZyD12g/JWKCV3lxDWY+9H1JIlp6cVWlA5WXDvChwjCAgLhP4MBbuQIYBPIuw6cPFfDYMy8E4xwX/EFwmN7TNAc/tvbioT7x98qmddgyEoQdp+Um8OL5TViYJzAo8furGZkf3pw7hM8WRJbUhEF95EddUYocQqPVFLyvCRIHigBd8ggAMW4oXpBJgWrkJ0Z6N8roQcUL83OiGnUOLKiwl+MRGDSL88Y8HJBexkZXoNNLLvvaU4JCcQb5OQ0miLFylTJZ2Os0KjsDAJdx9adCZ9XN2n0Qi4ouVuaan9BxqJnGrLVvR641yASL8qyWNE39NclrjpjITDp5U85PT+mRmvtYGvKzeXQdylykrDaYRqjshk0JzmufgbWtgqT5x740qrQBoGOYnp46N4r6yrhR5yfsFCj+EIOH4Uq4BEeSqeOdDPJj0mBiWtUqapwZJFj5KpFB3ZRabp4KdGWUi1Cfy10MpgOHQqkk80h5jiTJgtc/9Ge8f+u/o7vUBQCYkZ0H20hhQ9slfqX5
BqsJF3U+G2lD9AU74uQtb9qAK2e+DC+c9w+YUzLx3gMjeEHH3JhDr7KS9BpoIymJAiQ4P+e1TceCXBNypoUXzFrkb3/ePTfh1Q/+Ea944BYcKwm+1YXtM2LjzGQSDXcPxNXIASBj5nDVzJcCADw2jE/KcCEAzMqE0axaVb2v6F2KrGuBkAD9sVka3ygPhNpmNijCsAUXHjy5nXIeUiiPWnCp1FcvV6Z4UVZC05SDcHd/mJ8F4oDnGmU7gdUjZTx75gJc46Uxv1+EJJvTGWxsyYPKcFejFb4XhLh4+mwDC/NhBeroc5nbHLS3aJh+eQvl/FjoQc7MB2HqhBISjdKJ4yB+9pwKsyYV0M6mewBaxh+6u0Lbo0jQ7T2jfjhvpPwSDI7/BoNcjAeUu2jg4t4+WVnDk9kZ5+c0GAsRnus7P6cf+VHOz1MI+WEMXN431nFq/J56ZkfGzdXRoqF17KyWTszNNuLsls5YrH2qllJhLytZMwYIJoAqYxhxxUBKUMWapizmNBCsbiWY10CwQkrSVxLKGGzquHTKbaK1wl4a8vPy+e9AgxmE/XrLRzGZnUrYq6NhEJyU0ZEb8qtZP3P+gzDoITRlP4BjxQMJ5xEvVN4KnKQ1Zjzk53EX00kFXmozOBnH0swnANQWq6xq+c2zs4sS9wEAhwek2ZqmnlECv0wRniss7ujQSOmVDHVxRWdAvu9IZfywnW4q/T/KhxLtnBoSd07rNDRbNq7VMquUNMKEO4r5uTxW59twdktnLJSn9yUVEpubW4pn9q7C5d0LYSAIo8yd6MCgHIsUed3yb5MBjwNM3lsDrC5ZUn3DQUKk9LKWXr6wEEcSL/RL0oTfJQIPc3Li+i3GRS0wzkG7+4JrnTktxJfLRerhRctw+M5PJFSYmhNo45SpgbL/vUR6073Y0HppzTA1AKQNM8QlSlFgUYN4b6OJji9YQH0UcMwNh02jvC+XE5CIuvRDmbeI1hET6YY5mLbidbH2nC474/ycBmMIqrrXyvYKkJ8nq1XJ9lREfmj/kB9b/1s4PzryMy1Tu1RCknWkMrj+7Mvx8dXnnTJql6ZSwdfciY78lXjB4v/0v2uX9CbFydg3MQKFIk43/gdzs2mYlOCDZ1Vx3szrcXvP/8JlLs6fFuZ0AMCKptoE3agZNVaSCvl5/eIP4IoZLwIhBPNyy0LfRa3ojuPHh/4Tvzz8DV81+mSyvZ4zNws3cwfa8wf9bW9c+nxcOe9HsM3NiTwkxeUouUFBzfGGt+OS2S8P78ccpAkHN0aQz70Xw9IBjVYHV8Z4kK5cq/ArEJCLax1HHkz8m+T8SOTntu6fAQDm5wJnY24hQIlyZDNeNPMoLmgPa119ak2AwMSOfRLinBe3h5GSj67ahB+cdzVePjdYzSseTcEdg0UpPrvuwsT3wdMUw79y7h/wjfPvxL+vvQGNLItrD5yFVzW/zs+Ksp0OjMmx6K2LRL/VFykug5/qLpCf2vdZNWN5U7gwbX9FOJEGIZheiTsNyxub8fnzLkXU+WlN70LOFOOQKcel1F/uR/rPooZX9Zy1QMr2UUUAyBhhZ3SwGnYalExG9J5lcs1QpWM25xfhYEGKZ5ISrt+wHF/ceCMW59fURGqV6ZIXH1+1zFeB1se+f99g4jVLTf/Z/qXvGP573w4MyPt0rKQr7AMO47DMsEbWkCsc1UtnUCy/6vuYfsb5+X/bmEZ4fspzfuTKPKki+ukyc5eWXl0H3j5V0weAJBj4b22tqbAQYJVVsFAKKV4xSzQolbAyJ4T5K71tQ3fhzz2/xK0nfox9YzuxrDnuJKa1e3d222Xi+CcWwlkyP7ZvAKNHiMPS0bBoMAErraJaitCbB/+Cv/T8Crec+KG/7WSQHwXRj0dWovXOq5wfAhcGRCjivoFujHnLI/s58PxhUdzLgXK3fE/j6BnTtFrq8ZaU4m1NLg3nID7yE98nqkeTt1sxtyie6arR4DuDFEKK0Mo67GRNGQBoSeDMRYvV
KlvaWJvQrCwnBQsL7ljd/XQyrn59pCzDeWMTfljmYM7GqERm8mY8RFNlHMwInB+Wq426UigNtfA+j40K4jjnPJmabRrSKQyjNB0ZFhCl5cBtP7gj2EEiJLM1fp3S7uGyj3EaJq0rJCg6P6SMIJ3ccHRF60pIOqEWUqus4gahu1Y7cGj1sU9JfuiI3S09h/2CuUcjQpoOBwzak3i+kerpLWWRZE+dGe3/IZtK2Osp4/z4hOenTldRcvPu4nl/k+OLbC/xAKzTwLk6r+MqmNTCPb2/w77xnSh7RXz0bBOPDnGc0ynakxTGAIIw0qgTDKZlr4hLZ87Gv604G//x+BZ/e1p7pq9c8G6sbTwXZ+fnorw4kLxXZtRIdR+qirpXtiaUqMph6PwU3Uaq8eykk3F+mvzyHlHnR5XhCCM/RdfxnQ8ChlbjVxjnr0eZcQxVGvDOrmfgv+bfCkBMyH1MpiPLa+0a2gmXDMp6TGHHxOWt+Ofln0OL3YGi69ZUJFfIT1KICUBItZEn7BNVIn7VgneD9G5G1+N34pz+NpTWerh74DakyW6YNC7u12Sn8JI5S/CzoyIFeUNLB85umYZmK4VzNN0oZfkaSQRLGmcCOJT4nbKUFEONInBjzjBKbgFNdivKXtHnhBGQ0MTNOtpg9PQDHLBJD8p8MSqUoCQncuX8iqwvDsYJCm4FJN8IlAD3grPgLQzr9xQc4YjlrLx0OExYEXFPpaq8uLEZQJywz00DlsEAArQ3b8fa3DxkrX14/rw3+GVAzKQ5Xg7mM7ML8K4VX0CL3YHW1BxkDAOHxo/hN0cHQWg/+srL0WKnMeZU/b4dRX4oMUDggCN4Pq69EzZ9HAZZ4W/TkVqXOaiysq+iDQB5ejNsvgg26UbODKQuGiwCyKLaqhTOqnx44VRwHXDOcVQKlc7K5HC8VMDhwgSyJHnB48XXDafdnjoz2v9D5nHXH0RrE54V7PmkNSvRnophLyU3782MD9p/DTvdyI9FUzi/42oAwL7xndg5fB/yNsEF04POENWBUaacnwknWHW7zIFBKOZmR0FQ8QdOHflptJpx/oxnA/HoGIDkleSe0W0YrIiVnq0jP1Kd+PsHP4+LOp8dK6lwV+9vY8c/GeenUUN+9JINygG7v/8WPG/O6wEIx+faB29GoA7swSKDePb0dvzieD8e6OtGNr8cKe82VAwPPz7yKCry3SRS1+Qbh6+Tv307oATbiMjIcTADBl2CHx/twl39j+EbG5+GGRFiLxAUJ7VrcWl0PYVEzk9wf6Zn5qIl1Qlz2jLMuU+IAq7OW9gyJKrDRx0lZRe2z/Cdn39cvDbGwdGtyU7uX3nTRs4wQ+UXopaEwO0a2Yz/evxfwRPQM5NYoT7iTRPOj8UoTAwAWIyetLh++v+1d+fxUVRZ38B/Vb0nne7sJGQhIZBAIAsgmxDAQdABEXEGlxFUBFHnGXkGxeXBUVFeUQkiM6M8MwLjuCG+ozjAMCPi8oKiAnFBZsAAAQIkZCGErL1W1/tHdVVXbyGB3kKf7+fjR9Lprq666a46de+55wKIlQX+KpZxLgWkxjlbI4A0ICfDrffsdMcxPHdwIRgwmJW9EDaHHUAclKx7b1ibM+AYHJcIXqsBY/YYPlUqoWKdx8224cGhfQAI56DKdiEBXOWrLobGtb+F8a4ZoJP7ZMOWwuHvZw+DB3DP/k+8XuqrFArD2N0qnPOKs1Cz9R51o1zBz4qD96HOdBrPlL6BFG1ftNtaoGRaoWeEhVPlNy4G2Z9d50wAYhhGCnBEb1f/hP84c8byDQmoMXWg3W5DOxbC16cvNoJSRkU07BUGJs4K8WTsq+opQAnPXRF7fnhVcAKycAc/olStMP1YwSi9ZsYkqDRIUrl6UGJYIblSHONvlxUzFPNqqtsrIe+y13YzqRXwPdX9ePsh6d85eldvQ1GCK7/EV4JujMcMGwBQ9GBfxMDP6nC4zTgRA4R4tWv5gTOmdlgdwrY1TBVYmJCrL8Q1
qa7erSNaFhaFs5enw3WCV8KVsCpwtV1hnOsu+mj7BexqrAEPSMtFeLI5h0X8JjzLhxN9DXsxrquSmFRuz8kE1ycZtsEDUJAwAn20WUjSpKEoYbTPt+gXY0ChIRGl8clI1XSdjB+nUiMzRvg7Lew/FJk6PYqNyciIicUzQ8cgU6fHM0PG+HytK/hxBQ+nOo74DHwAQOF5bnH2no20DUWyRlhHr865KJ1eqXa7YYxxngIcfKwUYHrGjifbD8PBc+B4O3bUbJSSqB0ehQnli7x23jodXFICeNlCq1AqpODVs26UOJtQYfCuX2MdM8zncQNCYnlXxR99jQw4eNd7CDOHeaiZU+7Bj/P7auI6cKazCnbeiqOtwlCcfCLC8MSJ0uxSAEjVud5PJzu9ymcMWh2clCwPALf2c5+9xam8Z1veXRBBN89OkbdHUaDNJo51O6SCU3Ifneawt0Ec8w3hjvkgBT8RlPMjrcLtZ4jhcskTKcMZ/GTGCMX2ON6OevNppOmy0WSpx0c1b8PMmZDA7kMTFgAA1BCK7q07+gxYRuG20KaYWyFcjFxtpvETePsidqM3W4Whioqmz/HhqdcAAFPTb3M7gY5LmYaNx9fAzlvRbmuBVhEDu8OObWf+ggvWJp+LgMqHPS5GyyqgZFjYeQdabVZonceRbyjFv2regZVz9Th8XCe8lxINeHnYdGTHLpZ+9/LwCVj83W7YGQZjGjOxL+WMs7IuAyO7EyxjxyBLAn7SCFN0Z9bV4e9pwgwxvZJBDPM9Ovlhfld6lzvsvFj4TXh26/nxFfy4/lbibCpoNei8ZzYAIBnA8mFvd7kPKpbFypLuLSbJMAzWj74WdrtwUZfX6BlkSMSfrvqZ39e6hh/NUs+cv/wvAFB59FSJNzW6Uw34+eRf4n+rDuKss+fHs8fToGLQbOFhs4+AzSEMdXm23uEW11Bvm/0CWJjAAdjXrIfmxH/AgsEPFxpxTLbIqyO9DzoX3gbt1k+h+s8R4cUKBZSs0B6NFhNsDg4qVoEtNVX40jn1X5EYD65vKhS1QuBsnjIefIz/fCsAMCg1MMnqN8n5GhnobzyE4y3iZAUOYAA1at2CH/H7Kr/5sDos+PTs+6jtFAL0vrpc3F/wrNu2y9JZfHRaOEad7Ct5fXoO7DyPP1UdxGcNrnyh5UPHICfWgNn98/G340I7OVQn4VCdRAK7Db8ZtBx/OPoDtpzNwH15RfjX2ZM41HoeCobBz9NzUBCX0GXbBFMEXdGiR5uz6JeKsXoNCXTYeLx2iJPuMXsy0ygYpITnCBr2YqxC+wWr50ce8PiY9BEyGtlCsl837sCs7Huxu34rdvkYNhI1+CguKPb8CDkY8iGD7kd2Zk44idZ0HAefzOO1I8tk23G/IDEMA73SgAu2c+iwtyEZ6ahs/Q7/qnkHvqgYtdf3oCsMw8CgUuO81YxWuxWpcE59li66rmDk03oh+GEZExLU7onkYiBiZwCdXWgXofdAKeX79LfE4SdNM9I69dDLpvayDCfV12mWFUD0V7FdLPRn81FyAIBrmruwca9fG9SuvItGs+8aO5FCLfvc2hxWqBUavzP/AO+eH7GAN2OySD3jrc7uWM9cN/Hm0GxzrU8X53HOFAN2EcsIi/Y1WlXYfMa7LIJ8HTi3WWMMgwRZNfkfLpxDTqwB6467FrVNUGvAy3tyujEho6ueH1/Bj94tsYgTd81txiTr42a1qu3f2Htup/SzfKhalCbr+fGsd+ZryFYs5zEyNU0KfkQ2PgXLDwnr5G2rPYGxSelYe+xH6dpmdzhQMGiE1zZDhYa9wkAMfpSM9x2jmRM611kADxQqMC07vH+iiEx4ds4G4XXBWWVenuRcmBDe4LMkQUhGPG8REostziBksHEEZvf7tdfzY2V1dkQNphrUd9SgtvOkV8Jud+U6h7XMjk6cNbmvGC7PYxCJF0Dxjr/edMbrOXf0fxg3Z9+HR4e+2uP9Eavttsl6XcSTeYOzW9/ucMDm
HC40srsQ57GchDikwDGAlhM+352ceKcsXFSuajbg14dH45GDE1DQ7pra6+A5aT0ucYV6wDugNHN25+wh4b2GGn1X7GbkwY+PC970jDulf4t5XZFKflEVe3989faJPHOU7LlCjSKG47wSyD17zq5zVl93OFzJahmxrva7YD2HTrv7lGx/FbFFpfGuGW2elaKTdTrpG9Rut+InZ49enFKF+/KKcFfOYNiGD3G9vosp96L5/V3PLza6rxjvK5jWy2/6ZNcQXz0/cifbK91+lgepokQtg+UjlVg1Rul1Q+I5w/TpIaORoROGRiekZ+LO3MHI1rmGjfvFDnZ7/t6mOvDO7SzsPxR35xYinCLnihZF2p3DNirG+yQm5vooWWBqVuCncfcU7xxHj6jgpzPIwY/sfOW5InmoDTZehQPNe7D33E7clL1AyrnJiyvClL634vdVQi8Q48ynGJ08GZ/VbQYA6BR6mLh27KjZhB01m5xbLL2k/einL8C+pk+xu36rV8Jygo/1nOQzr5otjV4LXWoVMZjY58ZL2hcAMKg0ANrchpzEXBMePLac2oBvzscB0ALgka9P9dqGtD4aAIezu6HF2gIgDgw4MDyg7rCirGEoAKBe6zqx23i7dBGVr5Yu79k5ZzHhvorPMCqxj5SbZPS3Orxz2ItnGJ/BT6zKVS08VumdVxJJWEYBJaOGnbfC4jBjy4n1+LH5K7/PV3qcWxwG4YLKmMxeOZGeyz3kOktA8BD+9okaK+CcHv9x7Sa8X/2/3vt3keDHbf0vrfffa2RSGvY21eGlyu+lx3QKJWb0FYZEHSmyALcbPT8D9fHSv3+RNQDxag12Nwo9uL5yfuTBDy9bIFXhY6o7IOQONpjPoN7sPwCVG5roO2DTyAK5JLXWbZYgwzD4VU4BONt2bKlpQDs/BrGqZMiXndlSK9TlSlBrur3USTBRz08YtDsTdtWsd/Bjj5AFTUVSz08k5vxogpOErYig4GeIrFflTEeVbC0sYSdn9u2PgrgE3NbvGvTV5WJ65l24Jm0W+usLcUf/xT62eGnH49mjJC6BONh4FRI13rPuxODH5rDgdOdRt99pWB2uTvn5Je2HSOwRMMlmHYkJ4gBwsuMnnBHrxaADY1KneG1DKfX8MDivES6IvPMCwsABngGS2l0LoKp4BjHMQagYEwbrHdAwpxHDmtwSx+UJ2DvrTsHi4PDFuVrpcV/1mQCAsTqDuC4+0/MH/A6p2kzMzXvE73MihTzvp6rNNSx0a86DMKgSEa9KRpwyHlpFDEYne/xtnAEHY7Ei1iP48SwKG+NRklitcLV/VZtr9ltmTB4yYvpDw+qgZauggHuNGtG9/Ye6/WwrKYQj3gDrqBLX7vkIaBosroDKkWiEPSsdjgQjuCw/0ydlYpUqXJ2Ujn4xcRgUl+BWDsHXsFecPICWBT/ygCdenYxBxhFI1vT12UMMXLwOkyd5Wtr4lL4+n3PBek5a4kLNxvt8zqSUTJ+Ph1oEXdGiRzsnFjzz3/PTjd7SkHDl/ETQbC9OLAwWnJ4xqyzPp19ceIOfProsDDKOwE8t38LMdcrWwhKO/d4818l6euavAAC35/5Wemz90eUB2Q+9yhX8aFgd/jj6oy6fL/bCvHfyj9JjQ4yj8N+F5QHZHzGI8JztNX/A77Dh2P+B3cGh2RYPALgtKxHXpF3vtQ2FLOfHxjo/U9Ldsx23Hi9CfGcazNdPhPqLfWB5FvGKj5HOfYdU60womA5cm3wYC/OX4f3TR/HXk4fxz7MncXVSOnafq8H3za5ck3qzkNDqr3igqzfTf3Ls6JQpGJ3iHcRFIrVCi06uDVbOArMzmfexoa8iL24oJqf/ssvX8rJp9gbe/UToucyIxuM8ycrqUInve2feoxiTMrXHxwAAfKIRHQ/cIby39J7ef8NB8sRdhQKmOTd1+z0YhsHSQtdNjnxoz1fwEy/LO3IozkBaptUt54fFQ4WrpZ8HG6/C4Rb36stMD2+ErLLv
2oLcIT6fY3PYwDiLMFa2uwLMu3IG442TwgLAc3K861CFQ4RcYqNLp91/8GN3iKv5hnSX/IrIOj9i4qkyOMGPiXPd4qjCXWgJruUuzFynVGSwJ7OjRP7qv3SHfPVrzwRnX4xqoeu/yVIn1QJK6sFCqhcjBT8e6wspnJ/TJqtraCjJT80asefHDmBYk3gn6yxwyHBIMQt1cPgYLfjYGCh45xCLxQzb8aPO/RD+NomyC9Lv/v01Pq47JS2XIGIAxKt8Fw+Es6YMr/Xz+15GzYrlCMxSECKfEdglpUJau8/oMeHAcxjIcx0+lpEHP6aevW83JWq8h9vHJl+8h6e75J8RX/W8UrSyXljGgRhGWACZ9VdAE76Tm8V8wu7KinF9p/xNUBgaPxoKCMPD4uc/TqlCoUehxEgQQVe06NHh7PnRsN4zPyKp54ezd8JuFbpGIyb44XkwYrnQIDWSKcLyScWTt9Dz432X15VnSt/E9po3cFfRg6g734gHKrxrcHSHfMFSNXvxXKtf9LvfbWYJANyYdc8lvbcvYg+KZ4Ah5j202V0XwTQ/AYU4hOJggOJzBbh3QCGe4+MBBrilOh+jG4UAzt4vA47EeNiPqQB8CpPSjiaLUGMpVmUA096BCRojXmVZtwVkr0/rh4/qXMnhTw8Z7TZbSE7qzQxSQB9qYl0ijrfLghD/RRXdMIww/Ge2Qmu1Qc3xsDrzADwTnjUKz5d69/wEOvj5RdYAbKp2zWxanF+KiQEcypmV0R8Jag3ilGrky/KBREnaOIhLXExIUqOy7f8B6PrmZlLaLBxo3gMAuCHzLiSoUzEy2X+5Al/y9EY8WTjKfTach4lpN0Kr0KPR2hc2XvjeFcUnoyAuAU8MHiklSEeCCLmiRZdOjgfAQNtF8BPunh9rx1lUfjIPDmfNlIgJfmQXFz4I63pFInnww3kMe11Muq4f7h+0DAn6WOhsSTCqjqPFZvW/zIIfsbJhr+5UY45XJ2Nin5nYVb8FAFBoHAmDKnA1PcSen3/VVaM4PhllKUKNF1fPj9DlrmUqoWQn+dyGPHn29pF9obTxsDt7+iZ35kPJX3C+mRoOrQa8rhA4CLSozfhcLeSxGE+1QL/xTQDAbdlxeCPb1UP28/QcKfhRMgyu8rGMhEQM1q6Qz7S4VpeZM8HOC/lMPQlCeLUajNkK1mKF0e5Ao7NdvHp+PD7G7XZnlWfIg5+u6+z0VJxKDZ1CKeWb/Sw1q0elGi5Gr1LjBmfytC862cWB5w+AZexeVbI9petcSwENNo7AQEOJ3+d2ZXRS1723CkaJq1N9DzEGsncsECKgfyH6WJwRjob1LoUeKau5m1qOSYGPUhMPQ59R4d0hkXyRmCD1/PyivwLpMcDdBZFxIZKCH4dJyvnpbs+PpwfyipGg0uC/80t79LoYhR4lCeOhYjXdzjvRye705TlDgTAiwTV76yfZbCsxMBNXW2dhcisQKKf1SKa1y750+qJCOHRaWEsGSbOvPNs8XpmI0jNCQMezLMZcsCLRykHl4DFQH4/sGD1+mTkAWlaB27K910tzIwb1V0rw42zzDlml8Z4EIbxaCJ6Y9g50ymZ/eAY/Qk0p+fu6zqkWTsyzCmzPD+C+QG0gA5/uiJUdr8UhBPkXuyGJVydjsHEEMmPykB2b3+Vzo0WE3M5HF4vzPOd51wK4Znt5TukMNQcn3K3pU4Yjr2z1RZ4dOozNNbshWBeKZC2DtWUXz2sJFfHkbeE68cP5LwF0v+fH0/iUvn5nanSFYRj816DnevQaeZ6BPGcoEIrik/Gr7AJsPFWJLTXHYeLsKDEmo49GCZMjH+28sMQGC5PXiugif9WWf1nTDm5KP3SMcr87lrf5wJYkPNU4F8ozQj6T6Vcz0C9Ghw9fE0oKmKf0h41V4O7cQq96JsqDlVCcPgsAsA/MATcwB4xdHPa6Mu5HxUDxreOrAAiFLHuyfhucwY/2X7swo68OmzKFfBPPhGcAeGyYEk/uFxf0bcAP
5/fgx+Y9UtVkLRv44MdfMctQ0Ms+zlVtVVArLx78sAyLxYWRcx6PBFfEN83hcOAPf/gDysrKUFpainvvvRenT5+++AvDxCYFP95fICn4CfNfRuz1YRWRlYDJ1tbLfrgiPr4XpXMGP532dinh+XSHd2XaSCOvrJukCVyys0g+c+rjulNYfeR72B0Mmh2uafQMwyFOGd+j7aZZ7D57FWNkAVyyOVYKfADAYYiDIzZGKoqn3fklmPMtXtuA2QLt9s+hPnAY6gOHofvHZ8LjYuJ2kGYwhpo4vV3sqTTK1lvrDkec0GvIWG1Ik5VZ91UnKV5W0dnODcS6o8/gy4bt4OGAilG7rWYeKP4WpA4Fpey6wTJC7lkn1+bv6cSPK6LnZ+3atdi4cSNeeOEFpKWloby8HAsWLMC2bdug9jPTI5yszp5Zz2Q9ALA6/P8ulBycMPuE8VEFNJwYk7BfjtjAjuNHMnEtJ3kw0Wo77+/pEaOTc011LeszI+Db95xyzPE8TpvskJ/WRiZNRqrOfzLqxsnT8e+6BmR88T2+b22CnuNxXX0nHD4Sj+PVSfivghWob6rEpK9dQ21cn2TwRuECa7plGmI2/QMAwLZ3gEsUhvuYThPgcIC50AaG58EzDBieB2O2gGlpk6a6B2sGY6jJFzG9KWsBhsT7XmzVH8vkcXAkJULz1be4vr4TvDEOnaNK8LNU779lplstLjVszqU0ZmTOw0BDsdsyMYHiq/hgKL04hsHX9d9hT5P3cjake3p98GO1WvGXv/wFS5YswaRJkwAAL7/8MsrKyvDxxx/jhhtuCO8OeuB5HjaH8MXR+Oi5kPKBwnwOvHBGuCNlFZEVPDIm4SLB5URGoaxQ0DuXZTghW0VdE+AkzmBgZR3LgZ5xA/iut/Jq1Vm3n3P0eV7PkcszxiPRoQKTdR5Dd7hmZrX56YEpSRwHJI6DLuufwDHh+bZiV90SLjcLXN8+UNTWQ7t5Bzp+Ow/qLyug+WK/23Z4gx5obQfD89CvdS1I2p3lEHoDDauDxWGCTqHHtMy5PX49b4yDdewwaL76FjoHjxvNSpi6URWYYYRp1iyjwA2ZdwUtHydGqQIsXVeKDqZ8owr5xtE48l0GGi0UAF2KXv9N++mnn9DR0YGxY8dKjxkMBhQWFmL//v1dvDI8LA4OvHO8WOsz+BH+7ysfKJQUzotrxMzychKDn2AtbRGJcvWDkKrNdKvtMyPz7vDtUDfNzF6AJE0abs15MCjbH2JMRJJaixSNDhNSMqBgGLBgpKU+MnSxmNonu1vbsudkwKGPAc8wsOdkArquh3ttBf3Bq5RwxMaAy8lw+x2XJQzxMTYbwPNQnBTWNeMhLF/BsyxshQNgHzJQ+Fn8T60Cl9fP8616pV/1/y1ilUbM7f/wpW9EtowD29L1sM5vixRgmQbE6V4EIAy3BTMR+basfMQolPhl5oCgvUd33Jg1D1pFDKZl9DzAjHaRdWW7BHV1wrh7err7NLrU1FTpd5dCGeCkG4vNgkWf7UYzHw+WERIgK6pUaKj8wu15tUwfgM0BX/cDzm79vz63xTBALcvC4XCA954wFhBmTuhlSKmLh+7j3cF5k0vAnhLu7JlYndffSOG8a1ZcIXfPIoPSiBdGvnvJrw9Xu/TVZ6F81N+Ctv3sOAPeGeddubm73NolNRGWxfOk3130xDi8EObhwveYhftdJDdpFLD3ABg7B92O3VCcE4bIrHNuhMO5aCcg1OW1z/Kx7MYlHEsgBeLzUpY+DWXp0wK1S2Ds9i7PyZOzWdTb/o5PaoX6O2NTrwv4OVzeLpPSMzEpPfy9z+PSr8O49OvCug+99bwb7u/ZZTOZhK5Hz9wejUaDlhYfCYfdwLIMEhK6WZCrm/6+7xvU2ssAQLp/r0Y2qv0MbykcVWiwh7/nKubwOSitEVb1D0BM32Qo/PyNDIbIHxIKB2oX3wLdLjwfA0uMFug0Q/m9a6gyLisVbIDPK8EUCZ8XS3oK+LONUBbn
X/ScnJWQBdQK/84wZgb8HC6KhHaJRL2tXXp98KPVCsMfVqtV+jcAWCwW6LpYJ6crDgeP1tbOgOyfaFzOCHxUvQP1nJD7YORNyOfUUPoYeVTDjrGqehjUviN6BkLPlN3uQJA6fgAAWkUy1GOHy9bljQx8jBamnCygucPtcYWChcGgQ2urCRznXUAyWlG7+BbMdmFvmQb2xBnpZ0dyAkxKjddnNhJF1OflthugOHoS3JCBF227qwzXwdzfDo7nMD5pGpoD3NYR1S4RJJLaxWDQdbsHqtcHP+JwV0NDA7KzXeP7DQ0NKCi4SGGxLtjtAf4jMgosn9STbmD/heSUShYJCbFobu4I/H56MAd165fJz7FznCPo7dIbUbv4FpR2Se8j/CfXy9o+Ij4vWi3sRc6E8ovsiwpaXNPnF9LPwdr3iGiXCNTb2qV3DdL5MGjQIOj1euzdu1d6rLW1FYcOHcLIkSO7eCUhhBBColGv7/lRq9WYM2cOVq1ahcTERGRkZKC8vBxpaWmYOtX3GiOEEEIIiV69PvgBgEWLFsFut+N3v/sdzGYzRo4ciQ0bNkCl8r/KLSGEEEKi0xUR/CgUCjzyyCN45JFHwr0rhBBCCIlwvT7nhxBCCCGkJyj4IYQQQkhUoeCHEEIIIVGFgh9CCCGERBUKfgghhBASVSj4IYQQQkhUoeCHEEIIIVGFgh9CCCGERBUKfgghhBASVRie5/lw70Sk4XkeDkdkN4tCwYLjes8KuqFC7eIbtYtv1C6+Ubv4Ru3iW6S0C8syYBimW8+l4IcQQgghUYWGvQghhBASVSj4IYQQQkhUoeCHEEIIIVGFgh9CCCGERBUKfgghhBASVSj4IYQQQkhUoeCHEEIIIVGFgh9CCCGERBUKfgghhBASVSj4IYQQQkhUoeCHEEIIIVGFgh9CCCGERBUKfgghhBASVSj4CZMLFy7gqaeewoQJEzB8+HDcfvvtqKiokH7/9ddf4+abb0ZJSQmuv/56bN++3e+2nnrqKTz++ONej/dkG5EkFG0DAN9++y0GDx4c8P0PhlC0yQcffIAZM2agtLQUU6dOxWuvvQaO44JyPIESinZ56623MHXqVBQVFWH69On44IMPgnIsgRaq7xEA8DyP+fPnY+7cuQE9hmAIRbvMmzcPBQUFbv9FetuEol1OnDiBhQsXYtiwYRg3bhyeffZZmEymoBzPRfEkLObNm8ffcMMN/P79+/njx4/zzzzzDF9cXMxXVVXxx44d44uKivjVq1fzx44d49evX88XFhbyX331lds2OI7jX3rpJT4/P59/7LHH3H7X3W1EomC3Dc/zfEVFBT9q1Cg+Pz8/VId1WYLdJlu2bOGHDBnCb9q0ia+urua3b9/ODx8+nP/jH/8YysPssWC3y6ZNm/ji4mJ+69at/KlTp/j33nuPHzx4ML9z585QHuYlCcX3SPT666/z+fn5/Jw5c4J9WJctFO0yduxYfuPGjXxDQ4P0X3Nzc4iO8NIEu13Onz/PX3311fwDDzzAHz16lN+zZw8/fvx4/umnnw7hUboowxNyRbfq6mrs2bMHGzduxIgRIwAATz75JL744gts27YNTU1NKCgowOLFiwEAeXl5OHToENavX4+xY8cCAKqqqvDEE0+guroaffv29XqPN95446LbiETBbhu73Y7y8nK88847yM/Px4ULF0J6fJciFJ+Xd999FzfddBNuvfVWAEB2djZOnDiBv/3tb/jNb34ToiPtmVC0S1tbGx5++GHMmDEDAJCVlYWNGzdiz549uPbaa0N0pD0XirYRVVZW4tVXX0VpaWnQj+tyhaJdmpqa0NTUhJKSEqSkpITu4C5DKNrl7bffhlKpxMsvvwyNRoMBAwZg0aJFePfdd8HzPBiGCd0Bg4a9wiIhIQGvvfYaioqKpMcYhgHDMGhtbUVFRYVXgDJmzBh8++234HkeAPDNN98gLy8P//jHP5CZmen1Ht3ZRiQKdtt0dnZi//79WL9+PebM
mRP8AwqAUHxelixZgvnz57s9xrIsWlpagnBEgRGKdlmwYAHuvPNOAIDNZsM///lPVFVVYdy4cUE8sssXirYBAIvFgiVLlmDRokXIzc0N3gEFSCjapbKyEgzD9Ir2EIWiXb788ktMmTIFGo1Gemz27NnYvHlzyAMfgIKfsDAYDJg4cSLUarX02I4dO1BdXY2ysjLU1dUhLS3N7TWpqakwmUxobm4GANxxxx147rnnkJSU5PM9urONSBTstjEYDNi8eTPGjBkT3AMJoFB8XkaMGOF2sm5ra8O7776LsrKyIBxRYISiXUQVFRUoLi7G4sWLMWPGDEyePDnwBxRAoWqb8vJypKam9pobiVC0y5EjRxAXF4dnn30WEyZMwPXXX481a9bAarUG78AuUyja5cSJE0hNTcXzzz+PSZMmYcqUKVi5ciUsFkvwDqwLNOwVAb777jv8z//8D6ZOnYpJkybBbDa7fQgBSD939wsUiG1EgmC0TW8X7Dbp6OjAr3/9a1gsFjz66KMB2edQCGa75Obm4sMPP8TBgwexYsUKJCQk4JFHHgnYvgdbMNpm9+7d2LZtG7Zu3RqWO/dACEa7HDlyBBaLBcXFxZg3bx4OHz6MlStXora2FitXrgz4MQRDMNqlvb0d69atw/Tp0/HKK6+gtrYWy5cvR2NjI8rLywN+DBdDPT9h9sknn+Cee+5BaWkpVq1aBQDQaDReHyjxZ51O163tBmIb4RastunNgt0mjY2NmDt3LiorK7F+/Xq/wx2RJtjtkpSUhEGDBmH27Nm4//778eabb/aaYDsYbXP+/HksXboUy5YtQ58+fQK/0yEQrM/Ms88+iy+++AK333478vPzMXPmTDzxxBPYsmULzp07F9iDCIJgtYtSqURubi6WLVuGoUOHYurUqVi6dCm2bt2KpqamwB5EN1DwE0Zvv/02HnzwQVxzzTX405/+JI2Fpqeno6Ghwe25DQ0NiImJQVxcXLe2HYhthFMw26a3CnabVFVV4ZZbbkFTUxPeeecdt/H/SBbMdtm9ezeOHTvm9lhBQQGsVmuvSJYPVtvs2rULjY2NWLp0KYYNG4Zhw4Zh27ZtqKiowLBhw1BbWxuU4wmUYH5mlEoljEaj22MDBw4EIKQjRLJgtktaWprUDiLx55qamgDsfc/QsFeYbNy4EcuXL8fcuXPxxBNPuHUbX3XVVdi3b5/b87/55hsMHz4cLNu9eDUQ2wiXYLdNbxTsNjl9+jTuuusuGAwGbNiwAenp6QHd/2AJdrusWbMGOTk5WL16tfTYgQMHEB8fj+Tk5MAcRJAEs22mTJmC4cOHuz22atUq1NXVYdWqVUhNTQ3MQQRBsD8zc+fORWZmJp5//nnpsYMHD0KlUiEnJycgxxAMwW6XkSNH4scff3Sb2XXkyBEoFIqw9DBT8BMGJ06cwIoVKzBlyhTcd999bl2hWq0Wc+fOxaxZs7Bq1SrMmjULu3btwkcffYT169d3+z0CsY1wCEXb9DahaJOlS5fCarVi9erVUCqVaGxslH4XqdN1Q9EuCxYswEMPPYThw4ejrKwMe/fuxYYNG/Doo49GdLAd7LbR6/XQ6/Vuj8XGxkKr1aJfv34BPZZACsVn5rrrrsOKFStQXFyM8ePH4+DBg1i5ciXmz5/v1WaRIhTtMn/+fNx88814+umnMW/ePJw5cwYvvvgiZs6cicTExGAcVpco+AmDHTt2wGazYefOndi5c6fb72bNmoUXXngBa9euRXl5Od544w1kZmaivLy8R/V5Bg4ceNnbCIdQtE1vE+w2qa+vl+7qZs6c6fX7ysrKyz+IIAjFZ2XatGmw2WxYt24dXnzxRfTt2xdPPvkkZs+eHejDCSj6HvkWinaZM2cOGIbBW2+9hRUrViAlJQV33303Fi5cGOjDCZhQtEv//v3x5ptvYuXKlZg5cybi4uJw4403SrWDQo3hI7noCyGEEEJIgEVuvy0hhBBCSBBQ8EMIIYSQqELBDyGEEEKi
CgU/hBBCCIkqFPwQQgghJKpQ8EMIIYSQqELBDyGEEEKiChU5JIT0Co8//jg+/PDDLp+TkZGBmpoafPrpp71mUVZCSOhRkUNCSK9w6tQpnD9/Xvp57dq1OHToEF555RXpMavVCrVajcLCQqjV6nDsJiGkF6CeH0JIr5CdnY3s7Gzp58TERKjVapSWloZvpwghvRLl/BBCrhibN29GQUEBzpw5A0AYKps/fz7ee+89XHvttSguLsZtt92GEydO4PPPP8eMGTNQUlKC2bNn4/Dhw27bqqiowJw5c1BSUoJRo0bhsccec+t5IoT0XtTzQwi5on3//fdoaGjA448/DovFgmXLlmHhwoVgGAaLFi2CTqfD008/jSVLlmD79u0AgP3792PevHkYM2YM1qxZg5aWFvz+97/HnXfeiffffx9arTbMR0UIuRwU/BBCrmgdHR1Ys2YN8vLyAAD79u3Dpk2b8Ne//lValbq6uhovvvgiWltbYTAY8NJLLyE3Nxd//vOfoVAoAAAlJSWYPn06PvjgA9xxxx1hOx5CyOWjYS9CyBXNaDRKgQ8AJCcnAxCCGVF8fDwAoLW1FSaTCQcOHMDEiRPB8zzsdjvsdjuysrKQl5eHPXv2hHT/CSGBRz0/hJArml6v9/l4TEyMz8dbW1vhcDiwbt06rFu3zuv3Go0moPtHCAk9Cn4IIUQmNjYWDMPg7rvvxvTp071+r9PpwrBXhJBAouCHEEJk9Ho9CgsLcfz4cRQVFUmPm81mLFq0CBMnTsSAAQPCuIeEkMtFOT+EEOLhoYcewpdffomHH34Yu3btwmeffYYFCxbg66+/xpAhQ8K9e4SQy0TBDyGEeBg/fjw2bNiAuro6LFq0CI8++igUCgVef/11KqpIyBWAlrcghBBCSFShnh9CCCGERBUKfgghhBASVSj4IYQQQkhUoeCHEEIIIVGFgh9CCCGERBUKfgghhBASVSj4IYQQQkhUoeCHEEIIIVGFgh9CCCGERBUKfgghhBASVSj4IYQQQkhUoeCHEEIIIVHl/wO/s2gaLZIxpQAAAABJRU5ErkJggg==", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "sns.set()\n", + "sns.set_palette(\"husl\")\n", + "\n", + "window_size = 2592000\n", + "\n", + "n = 5\n", + "leaders = [x[0] for x in degrees[:n]]\n", + "timestamps = [dt.datetime.fromtimestamp(v.latest_time()) for v in g.rolling(window = window_size,step=86400)]\n", + "\n", + "fig, ax = plt.subplots()\n", + "\n", + "for i,vid in enumerate(leaders):\n", + " deg = list(map( lambda v: v.in_degree(), g.vertex(vid).rolling(window = window_size,step=86400)))\n", + " ax.plot(timestamps,deg,label= get_ordinal_number(i+1) + \" node\")\n", + "\n", + "ax.legend()\n", + "ax.set_xlabel(\"Time\")\n", + "ax.set_ylabel(\"In-degree\")\n", + "plt.savefig(\"degree-trajectories-top5.png\")\n", + "plt.show()" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Whole graph metrics and different window sizes, including the growing aggregate graph" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "metadata": {}, + "outputs": [], + "source": [ + "window_sizes = [86400,604800,2592000,31536000]\n", + "window_names = [\"1 day\", \"1 week\", \"1 month\", \"1 year\"]\n", + "\n", + "# Aggregate graph properties\n", + "views = g.expanding(step = 86400)\n", + "timestamps = [dt.datetime.fromtimestamp(v.latest_time()) for v in views]\n", + "\n", + "aggr_vertices = [v.count_vertices() for v in views]\n", + "\n", + "agg_window = np.zeros(len(timestamps),dtype=int)\n", + "df = pd.DataFrame({\"time\": timestamps, \"window\":agg_window, \"vertices\": aggr_vertices})\n", + "\n", + "# Same properties for different window sizes\n", + "for i in range(3):\n", + " views = g.rolling(window=window_sizes[i], step=86400)\n", + " diff_size = int(window_sizes[i]/86400)\n", + "\n", + " timestamps = [dt.datetime.fromtimestamp(v.latest_time()) for v in views]\n", + " vertices = [v.count_vertices() for v in views]\n", + "\n", + " to_join = pd.DataFrame({\"time\": timestamps, 
\"window\":[window_sizes[i] for k in range(len(timestamps))], \"vertices\": vertices})\n", + " df = pd.concat([df,to_join],copy=False)\n", + "\n", + "for w in window_sizes:\n", + " diff_size = int(w / 86400)\n", + " df.loc[df['window'] == w, 'new_vertices'] = pd.Series(df.loc[df['window'] == 0, 'vertices'].diff(diff_size), index = df.loc[df['window'] == w, 'vertices'].index)\n", + " df.loc[df['window'] == w, 'prop_new'] = np.where(df.loc[df['window'] == w, 'vertices'] < 1, 0, df.loc[df['window'] == w, 'new_vertices'] / df.loc[df['window'] == w, 'vertices'])" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Plotting out the number of active users and the proportion of those that are new" + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "fig, (ax1, ax2) = plt.subplots(ncols=1,nrows=2, gridspec_kw={'height_ratios': [1, 2]}, sharex=True)\n", + "\n", + "for i in range(3):\n", + " sub_df = df[df['window'] == window_sizes[i]]\n", + " ax1.plot(sub_df['time'], sub_df['prop_new'],label=window_names[i])\n", + " ax2.plot(sub_df['time'],sub_df['vertices'],label=window_names[i])\n", + "\n", + "for i in range(6):\n", + " ax1.axvline(dt.datetime(2010+i,12,25),color=\"black\",linestyle=\"--\", alpha=0.3)\n", + " ax2.axvline(dt.datetime(2010+i,12,25),color=\"black\",linestyle=\"--\", alpha=0.3)\n", + "\n", + "ax2.set_xlabel(\"Time\")\n", + "ax1.set_ylabel(\"Proportion new\")\n", + "ax2.set_ylabel(\"Number of active users\")\n", + "\n", + "ax2.legend()\n", + "plt.tight_layout()\n", + "plt.savefig(\"new-existing-users.png\")" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Null model comparisons\n", + "Number of users according to real and timestamp-shuffled data" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "metadata": {}, + "outputs": [], + "source": [ + "from raphtory.nullmodels import *\n", + "from raphtory.algorithms import weakly_connected_components\n", + "from collections import Counter\n", + "\n", + "experiments = 5\n", + "\n", + "for i in range(3):\n", + " w = window_sizes[i]\n", + " results_vertices = np.zeros((experiments,len(df[df['window']==w])))\n", + " for ex in range(experiments):\n", + " sx_shuffled = shuffle_column(sx_df,col_number=2)\n", + " g_shuff = load_pandas(sx_shuffled)\n", + " views = g_shuff.rolling(window=window_sizes[i],step=86400)\n", + " results_vertices[ex,:] = np.array([v.count_vertices() for v in views])\n", + " df.loc[df['window'] == w, 'vert_shuffled_mean'] = results_vertices.mean(axis=0)\n", + " df.loc[df['window'] == w, 'vert_shuffled_sd'] = results_vertices.std(axis=0)" + ] + }, + { + "cell_type": "code", + "execution_count": 
15, + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "fig, ax = plt.subplots(1, figsize=(10, 10))\n", + "to_plot = []\n", + "labels = []\n", + "for i in range(3):\n", + " real = list(df[df['window']==window_sizes[i]]['vertices'])\n", + " shuffled = list(df[df['window']==window_sizes[i]]['vert_shuffled_mean'])\n", + " to_plot.append(real)\n", + " to_plot.append(shuffled)\n", + " labels.append(window_names[i]+ \"\\n real\")\n", + " labels.append(window_names[i]+ \"\\n shuffled\")\n", + "\n", + "sns.violinplot(data=to_plot)\n", + "ax.set_xticklabels(labels)\n", + "plt.show()" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Hourly number of users" + ] + }, + { + "cell_type": "code", + "execution_count": 31, + "metadata": {}, + "outputs": [], + "source": [ + "views = g.rolling(window=3600, step=3600)\n", + "hour_vertices = [v.count_vertices() for v in views]" + ] + }, + { + "cell_type": "code", + "execution_count": 32, + "metadata": {}, + "outputs": [], + "source": [ + "timestamps = [dt.datetime.fromtimestamp(v.latest_time()) for v in views]\n", + "to_join = pd.DataFrame({\"time\": timestamps, \"window\":[3600 for k in range(len(timestamps))], \"vertices\": hour_vertices})\n", + "df = pd.concat([df,to_join],copy=False)" + ] + }, + { + "cell_type": "code", + "execution_count": 33, + "metadata": {}, + "outputs": [], + "source": [ + "df['week_days'] = df[\"time\"].apply(lambda x: x.weekday())\n", + "df['hour'] = df[\"time\"].apply(lambda x: x.hour)" + ] + }, + { + "cell_type": "code", + "execution_count": 34, + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "ax = sns.boxplot(data=df[df['window']==3600], x='hour', y='vertices')" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Temporal motifs" + ] + }, + { + "cell_type": "code", + "execution_count": 16, + "metadata": {}, + "outputs": [], + "source": [ + "from raphtory.algorithms import all_local_motifs\n", + "counts = all_local_motifs(g,3600)" + ] + }, + { + "cell_type": "code", + "execution_count": 17, + "metadata": {}, + "outputs": [], + "source": [ + "df = pd.DataFrame(counts).transpose()" + ] + }, + { + "cell_type": "code", + "execution_count": 18, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
0123456789...30313233343536373839
208333000200050...0000000000
342390000000000...0000000000
1826490510001580...01244400371
881630000000000...0000000000
423250000000000...0000000000
..................................................................
697030000000000...0000000000
196030000000000...0000000000
179770000000000...0000000000
385780000000000...0000000000
388380000000000...0000000000
\n", + "

24818 rows × 40 columns

\n", + "
" + ], + "text/plain": [ + " 0 1 2 3 4 5 6 7 8 9 ... 30 31 32 33 34 35 \n", + "20833 3 0 0 0 2 0 0 0 5 0 ... 0 0 0 0 0 0 \\\n", + "34239 0 0 0 0 0 0 0 0 0 0 ... 0 0 0 0 0 0 \n", + "1826 49 0 5 1 0 0 0 1 58 0 ... 0 12 4 4 4 0 \n", + "88163 0 0 0 0 0 0 0 0 0 0 ... 0 0 0 0 0 0 \n", + "42325 0 0 0 0 0 0 0 0 0 0 ... 0 0 0 0 0 0 \n", + "... .. .. .. .. .. .. .. .. .. .. ... .. .. .. .. .. .. \n", + "69703 0 0 0 0 0 0 0 0 0 0 ... 0 0 0 0 0 0 \n", + "19603 0 0 0 0 0 0 0 0 0 0 ... 0 0 0 0 0 0 \n", + "17977 0 0 0 0 0 0 0 0 0 0 ... 0 0 0 0 0 0 \n", + "38578 0 0 0 0 0 0 0 0 0 0 ... 0 0 0 0 0 0 \n", + "38838 0 0 0 0 0 0 0 0 0 0 ... 0 0 0 0 0 0 \n", + "\n", + " 36 37 38 39 \n", + "20833 0 0 0 0 \n", + "34239 0 0 0 0 \n", + "1826 0 3 7 1 \n", + "88163 0 0 0 0 \n", + "42325 0 0 0 0 \n", + "... .. .. .. .. \n", + "69703 0 0 0 0 \n", + "19603 0 0 0 0 \n", + "17977 0 0 0 0 \n", + "38578 0 0 0 0 \n", + "38838 0 0 0 0 \n", + "\n", + "[24818 rows x 40 columns]" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "# display(df)\n", + "display(df)" + ] + }, + { + "cell_type": "code", + "execution_count": 22, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "[[17595 3826 2553 501 6088 22084]\n", + " [ 2012 1621 898 197 3543 996]\n", + " [ 2045 2676 2044 5964 2635 2027]\n", + " [ 4395 1615 8820 1687 1109 651]\n", + " [ 836 4088 1477 3219 2323 4780]\n", + " [16637 1930 9213 5081 3317 21493]]\n" + ] + } + ], + "source": [ + "motifs = np.array(df.sum(axis=0))\n", + "motifs[32:] = motifs[32:]/3\n", + "motifs_3d = to_3d_heatmap(motifs)\n", + "print(motifs_3d)" + ] + }, + { + "cell_type": "code", + "execution_count": 21, + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "fig, ax = plt.subplots()\n", + "\n", + "labels = get_labels(motifs_3d)\n", + "ax = sns.heatmap(motifs_3d,square=True, cmap=\"YlGnBu\", cbar=True, annot=labels,annot_kws={\"size\":13}, fmt='', cbar_kws={\"shrink\": 1.0})\n", + "\n", + "for i in range(6):\n", + " offset_image(\"x\",i,i,ax)\n", + " offset_image(\"y\",i,i,ax)\n", + "\n", + "ax.tick_params(axis='x', which='major', pad=50)\n", + "ax.tick_params(axis='y', which='major', pad=50)\n", + "plt.setp(ax.get_xticklabels(), visible=False)\n", + "plt.setp(ax.get_yticklabels(), visible=False)\n", + "plt.tight_layout()\n", + "plt.savefig(\"sx-motifs-all.png\")" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "base", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.10.10" + }, + "orig_nbformat": 4 + }, + "nbformat": 4, + "nbformat_minor": 2 +} diff --git a/examples/py/math_overflow/motif-pics/motifs.pptx b/examples/py/math_overflow/motif-pics/motifs.pptx new file mode 100644 index 0000000000..6007bb0709 Binary files /dev/null and b/examples/py/math_overflow/motif-pics/motifs.pptx differ diff --git a/examples/py/math_overflow/motif-pics/x0.png b/examples/py/math_overflow/motif-pics/x0.png new file mode 100644 index 0000000000..16e313620c Binary files /dev/null and b/examples/py/math_overflow/motif-pics/x0.png differ diff --git a/examples/py/math_overflow/motif-pics/x1.png b/examples/py/math_overflow/motif-pics/x1.png new file mode 100644 index 0000000000..899b1a58a2 Binary files /dev/null and b/examples/py/math_overflow/motif-pics/x1.png differ diff --git a/examples/py/math_overflow/motif-pics/x2.png b/examples/py/math_overflow/motif-pics/x2.png new file mode 100644 index 
0000000000..52135d3fe4 Binary files /dev/null and b/examples/py/math_overflow/motif-pics/x2.png differ diff --git a/examples/py/math_overflow/motif-pics/x3.png b/examples/py/math_overflow/motif-pics/x3.png new file mode 100644 index 0000000000..8629200e6c Binary files /dev/null and b/examples/py/math_overflow/motif-pics/x3.png differ diff --git a/examples/py/math_overflow/motif-pics/x4.png b/examples/py/math_overflow/motif-pics/x4.png new file mode 100644 index 0000000000..b10c2081ca Binary files /dev/null and b/examples/py/math_overflow/motif-pics/x4.png differ diff --git a/examples/py/math_overflow/motif-pics/x5.png b/examples/py/math_overflow/motif-pics/x5.png new file mode 100644 index 0000000000..4969a69ccd Binary files /dev/null and b/examples/py/math_overflow/motif-pics/x5.png differ diff --git a/examples/py/math_overflow/motif-pics/y0.png b/examples/py/math_overflow/motif-pics/y0.png new file mode 100644 index 0000000000..c62c237c5d Binary files /dev/null and b/examples/py/math_overflow/motif-pics/y0.png differ diff --git a/examples/py/math_overflow/motif-pics/y1.png b/examples/py/math_overflow/motif-pics/y1.png new file mode 100644 index 0000000000..32c039c523 Binary files /dev/null and b/examples/py/math_overflow/motif-pics/y1.png differ diff --git a/examples/py/math_overflow/motif-pics/y2.png b/examples/py/math_overflow/motif-pics/y2.png new file mode 100644 index 0000000000..e3b283e26f Binary files /dev/null and b/examples/py/math_overflow/motif-pics/y2.png differ diff --git a/examples/py/math_overflow/motif-pics/y3.png b/examples/py/math_overflow/motif-pics/y3.png new file mode 100644 index 0000000000..8e15974413 Binary files /dev/null and b/examples/py/math_overflow/motif-pics/y3.png differ diff --git a/examples/py/math_overflow/motif-pics/y4.png b/examples/py/math_overflow/motif-pics/y4.png new file mode 100644 index 0000000000..693a0f5b58 Binary files /dev/null and b/examples/py/math_overflow/motif-pics/y4.png differ diff --git 
a/examples/py/math_overflow/motif-pics/y5.png b/examples/py/math_overflow/motif-pics/y5.png new file mode 100644 index 0000000000..d4aba40ae6 Binary files /dev/null and b/examples/py/math_overflow/motif-pics/y5.png differ diff --git a/examples/py/math_overflow/new-existing-users.png b/examples/py/math_overflow/new-existing-users.png new file mode 100644 index 0000000000..e7ad71affd Binary files /dev/null and b/examples/py/math_overflow/new-existing-users.png differ diff --git a/examples/py/math_overflow/plotting_utils.py b/examples/py/math_overflow/plotting_utils.py new file mode 100644 index 0000000000..42bc922bd2 --- /dev/null +++ b/examples/py/math_overflow/plotting_utils.py @@ -0,0 +1,121 @@ +import matplotlib.pyplot as plt +import numpy as np +import distinctipy + +from matplotlib.offsetbox import OffsetImage,AnnotationBbox + +# Mapping different motifs to their place in the heatmap. + +mapper = {0:(5,5), + 1:(5,4), + 2:(4,5), + 3:(4,4), + 4:(4,3), + 5:(4,2), + 6:(5,3), + 7:(5,2), + 8:(0,0), + 9:(0,1), + 10:(1,0), + 11:(1,1), + 12:(2,1), + 13:(2,0), + 14:(3,1), + 15:(3,0), + 16:(0,5), + 17:(0,4), + 18:(1,5), + 19:(1,4), + 20:(2,3), + 21:(2,2), + 22:(3,3), + 23:(3,2), + 24:(5,0), + 25:(5,1), + 26:(4,0), + 27:(4,1), + 28:(4,1), + 29:(4,0), + 30:(5,1), + 31:(5,0), + 32:(0,2), + 33:(2,4), + 34:(1,2), + 35:(1,3), + 36:(0,3), + 37:(2,5), + 38:(3,4), + 39:(3,5)} + +def to_3d_heatmap(motif_flat, data_type=int): + motif_3d = np.zeros((6,6),dtype=data_type) + for i in list(range(24))+list(range(31,40)): + motif_3d[mapper[i]]=motif_flat[i] + for i in range(4): + motif_3d[mapper[24+i]] = (motif_flat[24+i] + motif_flat[31-i])/2 + + return motif_3d + +def human_format(num): + magnitude = 0 + while abs(num) >= 1000: + magnitude += 1 + num /= 1000.0 + # add more suffixes if you need them + return '%.1f%s' % (num, ['', 'K', 'M', 'B', 'T', 'P'][magnitude]) + +def get_labels(motif_map): + return np.vectorize(human_format)(motif_map) + +def get_motif(xory:str,y:int): + path = 
"motif-pics/"+xory+str(y)+".png" + return plt.imread(path) + +def offset_image(xory, coord, name, ax): + img = get_motif(xory, name) + im = OffsetImage(img,zoom=0.04) + im.image.axes = ax + + if(xory=="x"): + ab = AnnotationBbox(im, (coord+0.5, 5.5), xybox=(0., -40.), frameon=False, + xycoords='data', boxcoords="offset points", box_alignment=(0.5,0.5), pad=0) + + else: + ab = AnnotationBbox(im, (0, coord), xybox=(0., -40.), frameon=False, + xycoords='data', boxcoords="offset points", box_alignment=(1.0,0.0), pad=0) + + ax.add_artist(ab) + +# For making CDFs and CCDFs + +def cdf(listlike, normalised=True): + data = np.array(listlike) + N = len(listlike) + + x = np.sort(data) + if (normalised): + y = np.arange(N)/float(N-1) + else: + y = np.arange(N) + return x, y + +def ccdf(listlike, normalised=True): + x, y = cdf(listlike,normalised) + if normalised: + return x, 1.0-y + else: + return x, len(listlike)-y + +def lorenz(listlike): + tmp_arr = np.array(sorted(listlike)) + # print(tmp_arr[0]) + x= np.arange(listlike.size)/(listlike.size -1) + y = tmp_arr.cumsum() / tmp_arr.sum() + return x,y + +def get_ordinal_number(num): + if 10 < num % 100 < 20: + ordinal = str(num) + "th" + else: + ordinal = str(num) + {1: "st", 2: "nd", 3: "rd"}.get(num % 10, "th") + return ordinal diff --git a/examples/py/math_overflow/sx-motifs-all.png b/examples/py/math_overflow/sx-motifs-all.png new file mode 100644 index 0000000000..52ca79e954 Binary files /dev/null and b/examples/py/math_overflow/sx-motifs-all.png differ diff --git a/examples/py/reddit/demo.ipynb b/examples/py/reddit/demo.ipynb index 20f63c1b8b..8413604f12 100644 --- a/examples/py/reddit/demo.ipynb +++ b/examples/py/reddit/demo.ipynb @@ -9,7 +9,7 @@ }, { "cell_type": "code", - "execution_count": 1, + "execution_count": 31, "metadata": {}, "outputs": [], "source": [ @@ -25,47 +25,119 @@ }, { "cell_type": "code", - "execution_count": 2, + "execution_count": 32, "metadata": {}, "outputs": [ { - "data": { - "text/plain": [ - 
"Graph(number_of_edges=0, number_of_vertices=0, earliest_time=0, latest_time=0)" - ] - }, - "execution_count": 2, - "metadata": {}, - "output_type": "execute_result" + "name": "stdout", + "output_type": "stream", + "text": [ + " DateTime Name Recipient Type Layer\n", + "0 2023-09-06 10:00:00 Alice David Email 1\n", + "1 2023-09-06 11:30:00 Bob Eve Message 2\n", + "2 2023-09-06 13:45:00 Charlie Frank Call 3\n", + "3 2023-09-06 13:50:00 Alice David Message 4\n" + ] } ], "source": [ - "g = Graph()\n", - "g" + "import pandas as pd\n", + "\n", + "# Sample data for demonstration\n", + "data = {\n", + " 'DateTime': ['2023-09-06 10:00:00', '2023-09-06 11:30:00', '2023-09-06 13:45:00', '2023-09-06 13:50:00'],\n", + " 'Name': ['Alice', 'Bob', 'Charlie', 'Alice'],\n", + " 'Recipient': ['David', 'Eve', 'Frank', 'David'],\n", + " 'Type': ['Email', 'Message', 'Call', 'Message'],\n", + " \"Layer\": [1, 2, 3, 4],\n", + "}\n", + "\n", + "# Create the DataFrame\n", + "df = pd.DataFrame(data)\n", + "\n", + "# Print the DataFrame\n", + "print(df)" ] }, { "cell_type": "code", - "execution_count": 3, + "execution_count": 33, + "metadata": {}, + "outputs": [], + "source": [ + "df[\"DateTime\"] = pd.to_datetime(df[\"DateTime\"]).astype(\"datetime64[ms]\")" + ] + }, + { + "cell_type": "code", + "execution_count": 34, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "Loading edges: 100%|██████████| 4.00/4.00 [00:00<00:00, 18.7Kit/s]0:00, 3.19Kit/s]" + ] + } + ], + "source": [ + "g=Graph()\n", + "g.load_edges_from_pandas(edge_df=df, src_col=\"Name\", dst_col=\"Recipient\", time_col=\"DateTime\", props=[\"Type\"], layer_in_df=\"Layer\")\n", + "df.dropna(axis=0, inplace=True)" + ] + }, + { + "cell_type": "code", + "execution_count": 35, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ - "Total vertices in the graph: 3\n", - "Total vertices at 2021-01-01 12:40:00: 2\n", - "1\n" + "Edge(source=Alice, 
target=David, earliest_time=1693994400000, latest_time=1694008200000, properties={Type: Message})\n" + ] + } + ], + "source": [ + "e= g.edge(\"Alice\",\"David\")\n", + "print(e)" + ] + }, + { + "cell_type": "code", + "execution_count": 36, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Vertex(name=Ben, earliest_time=\"1560419400000\", latest_time=\"1560419400000\", properties={type: person, _id: Ben})\n", + "Vertex(name=Hamza, earliest_time=\"1560419400000\", latest_time=\"1560419400000\", properties={type: person, _id: Hamza})\n", + "Edge(source=Ben, target=Hamza, earliest_time=1560419400000, latest_time=1560419400000, properties={type: friend})\n", + "Total vertices in the graph: 2\n", + "Total vertices at 2021-01-01 12:40:00: 2\n" ] } ], "source": [ - "from raphtory import Graph\n", "g = Graph()\n", - "g.add_edge(\"2021-01-01 12:32:00\", \"Ben\", \"Hamza\", {\"type\": \"friend\"})\n", - "g.add_edge(\"2021-01-02 14:15:36\", \"Hamza\", \"Haaroon\", {\"type\": \"friend\"})\n", - "print(\"Total vertices in the graph:\", g.num_vertices())\n", - "print(\"Total vertices at 2021-01-01 12:40:00:\", g.at(\"2021-01-01 12:40:00\").num_vertices())\n" + "# e = g.add_edge(\"2021-01-01 12:32:00\", \"Ben\", \"Hamza\", {\"type\": \"friend\"})\n", + "\n", + "# g.add_edge(\"2021-01-02 14:15:36\", \"Hamza\", \"Haaroon\", {\"type\": \"friend\"})\n", + "vertex = g.add_vertex(\"2019-06-13 09:50:00\", \"Ben\", {\"type\": \"person\"})\n", + "vertex2 = g.add_vertex(\"2019-06-13 09:50:00\", \"Hamza\", {\"type\": \"person\"})\n", + "edge = g.add_edge(\"2019-06-13 09:50:00\", \"Ben\", \"Hamza\", {\"type\": \"friend\"})\n", + "\n", + "# edge = g.add_edge(1, \"Ben\", \"Hamza\", {\"type\": \"friend\"})\n", + "# edge2 = g.add_edge(2, \"Ben\", \"Hamza\", {\"type\": \"friend\"})\n", + "print(vertex)\n", + "print(vertex2)\n", + "print(edge)\n", + "print(\"Total vertices in the graph:\", g.count_vertices())\n", + "print(\"Total vertices at 
2021-01-01 12:40:00:\", g.at(\"2021-01-01 12:40:00\").count_vertices())\n" ] }, { @@ -77,29 +149,30 @@ }, { "cell_type": "code", - "execution_count": 4, + "execution_count": 37, "metadata": {}, "outputs": [ { - "data": { - "text/plain": [ - "[(1, 1), (2, 2)]" - ] - }, - "execution_count": 4, - "metadata": {}, - "output_type": "execute_result" + "name": "stdout", + "output_type": "stream", + "text": [ + "[1, 2]\n", + "123\n" + ] } ], "source": [ + "g = Graph()\n", + "\n", "\n", - "g.add_vertex(timestamp=1, id=\"ben\", properties={\"property 1\": 1, \"property 3\": \"hi\", \"property 4\": True})\n", + "v=g.add_vertex(timestamp=1, id=\"ben\", properties={\"property 1\": 1, \"property 3\": \"hi\", \"property 4\": True})\n", "g.add_vertex(timestamp=2, id=\"ben\", properties={\"property 1\": 2, \"property 2\": 0.6, \"property 4\": False})\n", "g.add_vertex(timestamp=3, id=\"ben\", properties={\"property 2\": 0.9, \"property 3\": \"hello\", \"property 4\": True})\n", "\n", - "g.add_vertex_properties(id=\"ben\", properties={\"static property\": 123})\n", + "v.add_constant_properties(properties={\"unchanging property\": 123})\n", "\n", - "g.vertex(\"ben\").property_history(\"property 1\")" + "print(v.properties.temporal.get(\"property 1\").values())\n", + "print(v.properties.constant.get(\"unchanging property\"))\n" ] }, { @@ -111,16 +184,16 @@ }, { "cell_type": "code", - "execution_count": 5, + "execution_count": 38, "metadata": {}, "outputs": [ { "data": { "text/plain": [ - "Edge(source=ben, target=hamza, earliest_time=1, latest_time=3, properties={property 2 : 0.9, static property : 123, property 1 : 2, property 3 : hello, property 4 : true})" + "Edge(source=ben, target=hamza, earliest_time=1, latest_time=3, properties={property 1: 2, property 4: true, property 3: hello, property 2: 0.9, static property: 123})" ] }, - "execution_count": 5, + "execution_count": 38, "metadata": {}, "output_type": "execute_result" } @@ -128,11 +201,11 @@ "source": [ "\n", 
"g.add_vertex(timestamp=1,id=\"hamza\")\n", - "g.add_edge(timestamp=1, src=\"ben\", dst=\"hamza\", properties={\"property 1\": 1, \"property 3\": \"hi\", \"property 4\": True})\n", + "e=g.add_edge(timestamp=1, src=\"ben\", dst=\"hamza\", properties={\"property 1\": 1, \"property 3\": \"hi\", \"property 4\": True})\n", "g.add_edge(timestamp=2, src=\"ben\", dst=\"hamza\", properties={\"property 1\": 2, \"property 2\": 0.6, \"property 4\": False})\n", "g.add_edge(timestamp=3, src=\"ben\", dst=\"hamza\", properties={\"property 2\": 0.9, \"property 3\": \"hello\", \"property 4\": True})\n", "\n", - "g.add_edge_properties(src=\"ben\", dst=\"hamza\", properties={\"static property\": 123})\n", + "e.add_constant_properties(properties={\"static property\": 123})\n", "\n", "g.edge(\"ben\",\"hamza\")" ] @@ -144,42 +217,121 @@ "## Loading a real graph" ] }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "In the cell below we are pulling the subreddit to subreddit hyperlink graph from the [SNAP data repository](http://snap.stanford.edu/data/soc-RedditHyperlinks.html). This builds a web of the references between different communities on reddit with NLP analysis on each post (edge/link) providing properties such as sentiment." 
+ ] + }, { "cell_type": "code", - "execution_count": 6, + "execution_count": 39, "metadata": {}, "outputs": [], "source": [ - "reddit_graph = graph_loader.reddit_hyperlink_graph()" + "import requests\n", + "import pandas as pd\n", + "import os\n", + "\n", + "url = \"http://snap.stanford.edu/data/soc-redditHyperlinks-title.tsv\"\n", + "file_path = \"soc-redditHyperlinks-title.tsv\"\n", + "\n", + "if not os.path.exists(file_path):\n", + " response = requests.get(url, stream=True)\n", + " total_size = int(response.headers.get('content-length', 0))\n", + " block_size = 1024 \n", + " downloaded_size = 0\n", + "\n", + " with open(file_path, \"wb\") as f:\n", + " for data in response.iter_content(block_size):\n", + " f.write(data)\n", + " downloaded_size += len(data)\n", + " progress = (downloaded_size / total_size) * 100\n", + " print(f\"Downloaded {downloaded_size}/{total_size} bytes ({progress:.2f}%)\", end='\\r')\n", + "\n", + " print(\"\\nFile downloaded successfully.\")\n", + "\n", + "if not os.path.exists(\"reddit.pkl\"):\n", + "\n", + " #Next we label all the nlp features from the 'properties' column and make them there own columns which we can reference in the Raphtory Pandas loader \n", + " df = pd.read_csv(file_path, sep='\\t')\n", + "\n", + " #Define all the features as per the spec on the SNAP website\n", + " features = [\n", + " \"number_of_characters\", \"number_of_characters_without_counting_whitespace\", \"fraction_of_alphabetical_characters\", \n", + " \"fraction_of_digits\", \"fraction_of_uppercase_characters\", \"fraction_of_white_spaces\", \"fraction_of_special_characters\", \n", + " \"number_of_words\", \"number_of_unique_words\", \"number_of_long_words_at_least_6_characters\", \"average_word_length\", \n", + " \"number_of_unique_stopwords\", \"fraction_of_stopwords\", \"number_of_sentences\", \"number_of_long_sentences_at_least_10_words\", \n", + " \"average_number_of_characters_per_sentence\", \"average_number_of_words_per_sentence\", 
\"automated_readability_index\", \n", + " \"positive_sentiment\", \"negative_sentiment\", \"compound_sentiment\", \n", + " \"liwc_funct\", \"liwc_pronoun\", \"liwc_ppron\", \"liwc_i\", \"liwc_we\", \"liwc_you\", \"liwc_she_he\", \"liwc_they\", \n", + " \"liwc_ipron\", \"liwc_article\", \"liwc_verbs\", \"liwc_aux_vb\", \"liwc_past\", \"liwc_present\", \"liwc_future\", \n", + " \"liwc_adverbs\", \"liwc_prep\", \"liwc_conj\", \"liwc_negate\", \"liwc_quant\", \"liwc_numbers\", \"liwc_swear\", \n", + " \"liwc_social\", \"liwc_family\", \"liwc_friends\", \"liwc_humans\", \"liwc_affect\", \"liwc_posemo\", \"liwc_negemo\", \n", + " \"liwc_anx\", \"liwc_anger\", \"liwc_sad\", \"liwc_cog_mech\", \"liwc_insight\", \"liwc_cause\", \"liwc_discrep\", \n", + " \"liwc_tentat\", \"liwc_certain\", \"liwc_inhib\", \"liwc_incl\", \"liwc_excl\", \"liwc_percept\", \"liwc_see\", \n", + " \"liwc_hear\", \"liwc_feel\", \"liwc_bio\", \"liwc_body\", \"liwc_health\", \"liwc_sexual\", \"liwc_ingest\", \n", + " \"liwc_relativ\", \"liwc_motion\", \"liwc_space\", \"liwc_time\", \"liwc_work\", \"liwc_achiev\", \"liwc_leisure\", \n", + " \"liwc_home\", \"liwc_money\", \"liwc_relig\", \"liwc_death\", \"liwc_assent\", \"liwc_dissent\", \"liwc_nonflu\", \"liwc_filler\"\n", + " ]\n", + "\n", + " # Convert the property string to arrays of integers\n", + " df['PROPERTIES'] = df['PROPERTIES'].str.split(',').apply(lambda x: [float(i) for i in x])\n", + " # Convert the 'properties' column into a DataFrame with individual columns\n", + " properties_df = df['PROPERTIES'].apply(pd.Series)\n", + " # Rename the columns using the features array\n", + " properties_df.columns = features\n", + " # Concatenate the original DataFrame and the properties DataFrame\n", + " df = pd.concat([df, properties_df], axis=1)\n", + " # Drop the original 'properties' column\n", + " df = df.drop(columns=['PROPERTIES'])\n", + " #Convert the datestrings to datetimes\n", + " df['TIMESTAMP'] = pd.to_datetime(df['TIMESTAMP'])\n", + " # 
Convert datetime to millisecond precision (datetime64[ms])\n", + " df['TIMESTAMP'] = df['TIMESTAMP'].astype('datetime64[ms]')\n", + " #Save the data so we don't have to parse it again\n", + " df.to_pickle('reddit.pkl')\n", + " df.head()\n", + "\n", + "else:\n", + " df = pd.read_pickle(\"reddit.pkl\")\n" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Now let's load this data into a Raphtory graph - we won't use all the features, just grab a couple for demo purposes, but obviously you can edit the code below to choose the ones you are interested in." ] }, { "cell_type": "code", - "execution_count": 7, + "execution_count": 40, "metadata": {}, "outputs": [ { - "name": "stdout", + "name": "stderr", "output_type": "stream", "text": [ - "Graph(number_of_edges=234792, number_of_vertices=54075, earliest_time=1388506820000, latest_time=1493570870000)\n" + "Loading edges: 100%|██████████| 572K/572K [00:25<00:00, 22.7Kit/s]s]08, 726it/s]es: 24%|██▄ | 137K/572K [00:05<00:18, 24.0Kit/s]" ] } ], "source": [ - "print(reddit_graph)" + "reddit_graph = Graph.load_from_pandas(edges_df=df,src=\"SOURCE_SUBREDDIT\",dst=\"TARGET_SUBREDDIT\",time=\"TIMESTAMP\",props=[\"number_of_unique_words\", \"average_word_length\", \"number_of_unique_stopwords\", \"number_of_sentences\", \"automated_readability_index\", \"positive_sentiment\", \"negative_sentiment\", \"compound_sentiment\"])\n" ] }, { "cell_type": "code", - "execution_count": 8, + "execution_count": 41, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ - "property names: ['post_label', 'post_id', 'word_count', 'long_words', 'sentences', 'readability', 'positive_sentiment', 'negative_sentiment', 'compound_sentiment']\n", + "property names: ['number_of_unique_words', 'average_word_length', 'number_of_unique_stopwords', 'number_of_sentences', 'automated_readability_index', 'positive_sentiment', 'negative_sentiment', 'compound_sentiment']\n", "sentiment history: [(1404952792000, 
0.2732), (1414676601000, 0.2344), (1418639874000, 0.0), (1420030124000, -0.2481), (1426362695000, 0.0), (1427198700000, -0.2023), (1427894452000, 0.0), (1429187302000, 0.5562), (1429644527000, 0.296), (1431911341000, -0.3595), (1433653011000, -0.34), (1435258425000, 0.0772), (1439068701000, -0.5574), (1439249314000, 0.0), (1440456620000, 0.4019), (1446586617000, 0.0), (1447125847000, -0.7042), (1447422296000, 0.0387), (1450563607000, 0.8192), (1450658697000, 0.6841), (1450863723000, 0.2732), (1451249771000, -0.4767), (1455119795000, 0.0), (1455295188000, -0.4939), (1456505801000, -0.6908), (1456949833000, 0.0), (1458061181000, 0.3384), (1460498612000, -0.5267), (1461879765000, -0.6136), (1463741129000, 0.0), (1466862772000, -0.1779), (1471350739000, -0.6808), (1479538764000, 0.0), (1480262620000, 0.25), (1482314435000, 0.6908), (1483690844000, 0.0), (1487778524000, -0.4404), (1488873853000, 0.0), (1488966224000, 0.0), (1489359306000, -0.5789), (1489999301000, -0.2263), (1491144265000, -0.34), (1492064865000, 0.8149), (1492451552000, 0.0)]\n", "Most recent sentiment on 2014-10-30 13:45:00 - 0.2344\n" ] @@ -187,24 +339,24 @@ { "data": { "text/plain": [ - "PathFromVertex(Vertex(name=cancer, properties={_id : cancer}), Vertex(name=soccer, properties={_id : soccer}), Vertex(name=pics, properties={_id : pics}), Vertex(name=funny, properties={_id : funny}), Vertex(name=bitcoin, properties={_id : bitcoin}), Vertex(name=propaganda, properties={_id : propaganda}), Vertex(name=conspiracy, properties={_id : conspiracy}), Vertex(name=askreddit, properties={_id : askreddit}), Vertex(name=trees, properties={_id : trees}), Vertex(name=cricket, properties={_id : cricket}), ...)" + "PyPropHistValueList([[0.2732], [0.6249, 0.7957, 0], [0], [0.1779], [0.2003], [0.34], [0.4215], [-0.3182], [-0.4767], [0.296], ...])" ] }, - "execution_count": 8, + "execution_count": 41, "metadata": {}, "output_type": "execute_result" } ], "source": [ "edge = 
reddit_graph.edge(\"conspiracy\",\"documentaries\")\n", - "print(\"property names:\",edge.property_names())\n", - "print(\"sentiment history:\",edge.property_history(\"compound_sentiment\"))\n", + "print(\"property names:\",edge.properties.keys())\n", + "print(\"sentiment history:\",edge.properties.temporal.get(\"compound_sentiment\").items())\n", "\n", "date=\"2014-10-30 13:45:00\"\n", "edge_perspective = reddit_graph.at(date).edge(\"conspiracy\",\"documentaries\")\n", "print(\"Most recent sentiment on\",date,\"-\",edge_perspective[\"compound_sentiment\"])\n", "\n", - "reddit_graph.vertex(\"conspiracy\").out_neighbours().out_neighbours().out_neighbours()" + "reddit_graph.vertex(\"conspiracy\").out_edges.dst.out_edges.properties.temporal.get(\"compound_sentiment\").values()" ] }, { @@ -216,22 +368,29 @@ }, { "cell_type": "code", - "execution_count": 13, + "execution_count": 42, "metadata": {}, "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "1217it [01:06, 18.30it/s]\n" + ] + }, { "data": { "text/plain": [ "" ] }, - "execution_count": 13, + "execution_count": 42, "metadata": {}, "output_type": "execute_result" }, { "data": { - "image/png": "", + "image/png": "", "text/plain": [ "
" ] @@ -241,14 +400,15 @@ } ], "source": [ + "from tqdm import tqdm\n", "views = reddit_graph.rolling(window=\"1 day\") \n", "\n", "timestamps = []\n", "edge_count = []\n", "\n", - "for view in views:\n", - " timestamps.append(view.latest_date_time())\n", - " edge_count.append(view.num_edges()) \n", + "for view in tqdm(views):\n", + " timestamps.append(view.latest_date_time)\n", + " edge_count.append(view.count_edges()) \n", "\n", "sns.set_context()\n", "ax = plt.gca()\n", @@ -267,22 +427,22 @@ }, { "cell_type": "code", - "execution_count": 15, + "execution_count": 50, "metadata": {}, "outputs": [ { "data": { "text/plain": [ - "" + "" ] }, - "execution_count": 15, + "execution_count": 50, "metadata": {}, "output_type": "execute_result" }, { "data": { - "image/png": "", + "image/png": "", "text/plain": [ "
" ] @@ -299,19 +459,12 @@ "negative_sentiment_in = []\n", "negative_sentiment_out = []\n", "\n", - "def edge_weight(edge,prop_name):\n", - " return sum(list(map(lambda e: e[1],edge.property_history(prop_name)))), len(edge.property_history(prop_name))\n", - "\n", - "def weighted_average_degree(vertex,prop_name,incoming):\n", - " edges = list(vertex.in_edges() if incoming else vertex.out_edges())\n", - " return sum(list(map(lambda e: edge_weight(e,prop_name)[0],edges)))/max(1,sum(list(map(lambda e: edge_weight(e,prop_name)[1],edges))))\n", - "\n", "for vertex in views:\n", - " timestamps.append(vertex.latest_date_time())\n", - " positive_sentiment_in.append(weighted_average_degree(vertex,\"positive_sentiment\",incoming=True))\n", - " positive_sentiment_out.append(weighted_average_degree(vertex,\"positive_sentiment\",incoming=False))\n", - " negative_sentiment_in.append(weighted_average_degree(vertex,\"negative_sentiment\",incoming=True))\n", - " negative_sentiment_out.append(weighted_average_degree(vertex,\"negative_sentiment\",incoming=False)) \n", + " timestamps.append(vertex.latest_date_time)\n", + " positive_sentiment_in.append(vertex.in_edges.properties.temporal.get(\"positive_sentiment\").values().sum().mean())\n", + " positive_sentiment_out.append(vertex.out_edges.properties.temporal.get(\"positive_sentiment\").values().sum().mean())\n", + " negative_sentiment_in.append(vertex.in_edges.properties.temporal.get(\"negative_sentiment\").values().sum().mean())\n", + " negative_sentiment_out.append(vertex.out_edges.properties.temporal.get(\"negative_sentiment\").values().sum().mean())\n", "\n", "sns.set()\n", "sns.set_palette(\"pastel\")\n", @@ -327,6 +480,89 @@ "ax.legend(loc=\"best\")\n" ] }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Running some example algorithms" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Lets get the top 5 subreddits in the graph as per pagerank" + ] + }, + { + "cell_type": "code", 
+ "execution_count": 51, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "The conspiracy subreddit has a pagerank score of 0.0028709357281156145\n", + " Key Value\n", + "1746 askreddit 0.019556\n", + "295 iama 0.015616\n", + "3236 pics 0.009884\n", + "22085 funny 0.009283\n", + "40067 videos 0.006105\n", + "The top five ranked subreddits are [('askreddit', 0.019555592169738754), ('iama', 0.01561587791951029), ('pics', 0.009884204062062652), ('funny', 0.009282589235120708), ('videos', 0.006105153065518092)]\n" + ] + } + ], + "source": [ + "from raphtory import algorithms as algos\n", + "\n", + "#First lets run the algorithm and get our result set\n", + "result_set=algos.pagerank(reddit_graph)\n", + "\n", + "#We can then have a look at the values of specific nodes\n", + "print(\"The conspiracy subreddit has a pagerank score of\",result_set.get('conspiracy'))\n", + "\n", + "#Convert the results to a dataframe\n", + "print(result_set.to_df().sort_values(by='Value',ascending=False).head())\n", + "\n", + "#get the top 5 most import users via the intial top_k function\n", + "print(\"The top five ranked subreddits are \",result_set.top_k(5))\n" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Getting the largest connected component" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "The largest component has 52468 nodes out of a total of 54075\n" + ] + } + ], + "source": [ + "#First lets run the algorithm and group by the component_id\n", + "components=algos.weakly_connected_components(reddit_graph).group_by()\n", + "\n", + "#Map the returned dict so that we have the size of the components instead of the vertex names\n", + "component_sizes = {key: len(value) for key, value in components.items()}\n", + "#Get the component id with the greatest number of nodes\n", + 
"component_with_biggest_size = max(component_sizes,key=component_sizes.get)\n", + "#Get the value of this component\n", + "lcc=component_sizes[component_with_biggest_size]\n", + "print(\"The largest component has\",lcc,\"nodes out of a total of\",reddit_graph.count_vertices())" + ] + }, { "cell_type": "code", "execution_count": null, diff --git a/examples/rust/Cargo.toml b/examples/rust/Cargo.toml index 7a062f7116..99817d23ab 100644 --- a/examples/rust/Cargo.toml +++ b/examples/rust/Cargo.toml @@ -7,8 +7,7 @@ keywords = ["graph", "temporal-graph", "temporal", "examples"] # See more keys and their definitions at https://doc.rust-lang.org/cargo/reference/manifest.html [dependencies] -raphtory = {path = "../../raphtory"} -raphtory-io = {path = "../../raphtory-io"} +raphtory = {path = "../../raphtory", features=["io"]} chrono = "0.4" regex = "1" serde = { version = "1", features = ["derive", "rc"] } @@ -25,9 +24,6 @@ name = "bench" [[bin]] name = "lotr" -[[bin]] -name = "healthcheck" - [[bin]] name = "hulongbay" diff --git a/examples/rust/src/bin/bench/main.rs b/examples/rust/src/bin/bench/main.rs index 2978b92d77..166c08b8fd 100644 --- a/examples/rust/src/bin/bench/main.rs +++ b/examples/rust/src/bin/bench/main.rs @@ -1,13 +1,13 @@ -use itertools::Itertools; -use raphtory::core::utils; -use raphtory::core::Prop; -use raphtory::db::graph::Graph; -use raphtory::db::view_api::*; -use raphtory_io::graph_loader::source::csv_loader::CsvLoader; +use raphtory::{ + algorithms::pagerank::unweighted_page_rank, graph_loader::source::csv_loader::CsvLoader, + prelude::*, +}; use serde::Deserialize; -use std::path::PathBuf; -use std::{env, path::Path, time::Instant}; -use raphtory::algorithms::pagerank::unweighted_page_rank; +use std::{ + env, + path::{Path, PathBuf}, + time::Instant, +}; #[derive(Deserialize, std::fmt::Debug)] pub struct Benchr { @@ -43,40 +43,26 @@ fn main() { println!( "Loaded graph from encoded data files {} with {} vertices, {} edges which took {} seconds", 
encoded_data_dir.to_str().unwrap(), - g.num_vertices(), - g.num_edges(), + g.count_vertices(), + g.count_edges(), now.elapsed().as_secs() ); g } else { - let g = Graph::new(8); + let g = Graph::new(); let now = Instant::now(); - CsvLoader::new(data_dir, ) + CsvLoader::new(data_dir) .set_delimiter("\t") .load_into_graph(&g, |lotr: Benchr, g: &Graph| { - g.add_vertex( - 1, - lotr.src_id.clone(), - &vec![], - ) + g.add_vertex(1, lotr.src_id.clone(), NO_PROPS) .expect("Failed to add vertex"); - g.add_vertex( - 1, - lotr.dst_id.clone(), - &vec![], - ) + g.add_vertex(1, lotr.dst_id.clone(), NO_PROPS) .expect("Failed to add vertex"); - g.add_edge( - 1, - lotr.src_id.clone(), - lotr.dst_id.clone(), - &vec![], - None, - ) + g.add_edge(1, lotr.src_id.clone(), lotr.dst_id.clone(), NO_PROPS, None) .expect("Failed to add edge"); }) .expect("Failed to load graph from CSV data files"); @@ -84,8 +70,8 @@ fn main() { println!( "Loaded graph from CSV data files {} with {} vertices, {} edges which took {} seconds", encoded_data_dir.to_str().unwrap(), - g.num_vertices(), - g.num_edges(), + g.count_vertices(), + g.count_edges(), now.elapsed().as_secs() ); @@ -95,6 +81,6 @@ fn main() { g }; println!("Data loaded\nPageRanking"); - let r = unweighted_page_rank(&graph, 25, Some(8), None,true); + unweighted_page_rank(&graph, 25, Some(8), None, true); println!("Done PR"); } diff --git a/examples/rust/src/bin/btc/main.rs b/examples/rust/src/bin/btc/main.rs index 71cd352a54..339a9fd889 100644 --- a/examples/rust/src/bin/btc/main.rs +++ b/examples/rust/src/bin/btc/main.rs @@ -1,23 +1,21 @@ #![allow(unused_imports)] -use std::collections::HashMap; -use std::marker::PhantomData; -use std::path::{Path, PathBuf}; -use std::thread::JoinHandle; -use std::{env, thread}; +#![allow(dead_code)] use chrono::{DateTime, Utc}; -use raphtory::core::tgraph::TemporalGraph; -use raphtory::core::utils; -use raphtory::core::{Direction, Prop}; -use raphtory_io::graph_loader::source::csv_loader::CsvLoader; +use 
raphtory::{core::utils::hashing, graph_loader::source::csv_loader::CsvLoader, prelude::*}; use regex::Regex; use serde::Deserialize; -use std::fs::File; -use std::io::{prelude::*, BufReader, LineWriter}; -use std::time::Instant; - -use raphtory::db::graph::Graph; -use raphtory::db::view_api::*; +use std::{ + collections::HashMap, + env, + fs::File, + io::{prelude::*, BufReader, LineWriter}, + marker::PhantomData, + path::{Path, PathBuf}, + thread, + thread::JoinHandle, + time::Instant, +}; #[derive(Deserialize, std::fmt::Debug)] pub struct Sent { @@ -56,7 +54,7 @@ fn main() { panic!("Missing data dir = {}", data_dir.to_str().unwrap()) } - let test_v = utils::calculate_hash(&"139eeGkMGR6F9EuJQ3qYoXebfkBbNAsLtV:btc"); + let test_v = hashing::calculate_hash(&"139eeGkMGR6F9EuJQ3qYoXebfkBbNAsLtV:btc"); // If data_dir/graphdb.bincode exists, use bincode to load the graph from binary encoded data files // otherwise load the graph from csv data files @@ -70,22 +68,22 @@ fn main() { println!( "Loaded graph from path {} with {} vertices, {} edges, took {} seconds", encoded_data_dir.to_str().unwrap(), - g.num_vertices(), - g.num_edges(), + g.count_vertices(), + g.count_edges(), now.elapsed().as_secs() ); g } else { - let g = Graph::new(16); + let g = Graph::new(); let now = Instant::now(); CsvLoader::new(data_dir) .with_filter(Regex::new(r".+(sent|received)").unwrap()) .load_into_graph(&g, |sent: Sent, g: &Graph| { - let src = utils::calculate_hash(&sent.addr); - let dst = utils::calculate_hash(&sent.txn); + let src = hashing::calculate_hash(&sent.addr); + let dst = hashing::calculate_hash(&sent.txn); let time = sent.time.timestamp(); if src == test_v || dst == test_v { @@ -96,18 +94,18 @@ fn main() { time, src, dst, - &vec![("amount".to_string(), Prop::U64(sent.amount_btc))], + [("amount".to_string(), Prop::U64(sent.amount_btc))], None, ) - .unwrap() + .unwrap(); }) .expect("Failed to load graph from CSV data files"); println!( "Loaded graph from CSV data files {} with {} 
vertices, {} edges which took {} seconds", encoded_data_dir.to_str().unwrap(), - g.num_vertices(), - g.num_edges(), + g.count_vertices(), + g.count_edges(), now.elapsed().as_secs() ); @@ -117,8 +115,8 @@ fn main() { g }; - assert_eq!(graph.num_vertices(), 9132396); - assert_eq!(graph.num_edges(), 5087223); + assert_eq!(graph.count_vertices(), 9132396); + assert_eq!(graph.count_edges(), 5087223); let windowed_graph = graph.window(0, i64::MAX); diff --git a/examples/rust/src/bin/crypto/main.rs b/examples/rust/src/bin/crypto/main.rs index c5d35fc7a6..fb635a2d10 100644 --- a/examples/rust/src/bin/crypto/main.rs +++ b/examples/rust/src/bin/crypto/main.rs @@ -1,27 +1,12 @@ -use chrono::NaiveDateTime; use itertools::Itertools; -use raphtory::algorithms::generic_taint::generic_taint; -use raphtory::algorithms::pagerank::unweighted_page_rank; -use raphtory::core::time::TryIntoTime; -use raphtory::db::view_api::internal::GraphViewInternalOps; -use raphtory::db::view_api::layer::LayerOps; -use raphtory::db::view_api::time::WindowSet; -use raphtory::db::view_api::*; -use raphtory_io::graph_loader::example::stable_coins::stable_coin_graph; -use serde::Deserialize; -use std::env; -use std::time::Instant; - -#[derive(Deserialize, std::fmt::Debug)] -pub struct StableCoin { - block_number: String, - transaction_index: u32, - from_address: String, - to_address: String, - time_stamp: i64, - contract_address: String, - value: f64, -} +use raphtory::{ + algorithms::{ + pagerank::unweighted_page_rank, temporal_reachability::temporally_reachable_nodes, + }, + db::api::view::*, + graph_loader::example::stable_coins::stable_coin_graph, +}; +use std::{env, time::Instant}; fn main() { let args: Vec = env::args().collect(); @@ -32,13 +17,13 @@ fn main() { Some(args.get(1).unwrap().to_string()) }; - let g = stable_coin_graph(data_dir,true, 1); + let g = stable_coin_graph(data_dir, true); - assert_eq!(g.num_vertices(), 1523333); - assert_eq!(g.num_edges(), 2814155); + 
assert_eq!(g.count_vertices(), 1523333); + assert_eq!(g.count_edges(), 2814155); assert_eq!( - g.get_unique_layers().into_iter().sorted().collect_vec(), + g.unique_layers().into_iter().sorted().collect_vec(), vec!["Dai", "LUNC", "USD", "USDP", "USDT", "USTC"] ); @@ -49,35 +34,22 @@ fn main() { let now = Instant::now(); - let _ = unweighted_page_rank( - &g, - 20, - None, - None, - true, - ); + let _ = unweighted_page_rank(&g, 20, None, None, true); println!("Time taken: {} secs", now.elapsed().as_secs()); let now = Instant::now(); - let _ = unweighted_page_rank( - &g.layer("USDT") - .unwrap(), - 20, - None, - None, - true - ); + let _ = unweighted_page_rank(&g.layer("USDT").unwrap(), 20, None, None, true); println!("Time taken: {} secs", now.elapsed().as_secs()); println!("Generic taint"); let now = Instant::now(); - let _ = generic_taint( + let _ = temporally_reachable_nodes( &g.layer("USDT").unwrap(), None, 20, 1651105815, vec!["0xd30b438df65f4f788563b2b3611bd6059bff4ad9"], - vec![], + None, ); println!("Time taken: {} secs", now.elapsed().as_secs()); } diff --git a/examples/rust/src/bin/healthcheck/main.rs b/examples/rust/src/bin/healthcheck/main.rs deleted file mode 100644 index c143017ec6..0000000000 --- a/examples/rust/src/bin/healthcheck/main.rs +++ /dev/null @@ -1,208 +0,0 @@ -fn main() {} - -#[cfg(test)] -mod test { - use std::{ - fmt::Debug, - path::{Path, PathBuf}, - }; - - use itertools::Itertools; - use raphtory::algorithms::connected_components::weakly_connected_components; - use raphtory::core::Direction; - use raphtory::db::{ - graph::Graph, - view_api::*, - view_api::{internal::GraphViewInternalOps, GraphViewOps}, - }; - use raphtory_io::graph_loader::source::csv_loader::CsvLoader; - use serde::de::DeserializeOwned; - - trait TestEdge { - fn src(&self) -> u64; - fn dst(&self) -> u64; - fn t(&self) -> i64; - } - - fn load(g1: &Graph, gn: &Graph, p: PathBuf) { - CsvLoader::new(p) - .set_delimiter(" ") - .load_into_graph(&(g1, gn), |pair: REC, (g1, 
gn)| { - g1.add_edge(pair.t(), pair.src(), pair.dst(), &vec![], None); - gn.add_edge(pair.t(), pair.src(), pair.dst(), &vec![], None); - }) - .expect("Failed to load graph from CSV files"); - } - - fn test_graph_sanity(p: P, n_parts: usize) - where - P: Into, - { - let path: PathBuf = p.into(); - let g1 = Graph::new(1); - let gn = Graph::new(n_parts); - - load::(&g1, &gn, path); - - fn check_graphs(g1: &G, gn: &G, n_parts: usize) { - assert_eq!(g1.num_vertices(), gn.num_vertices()); - // NON-TEMPORAL TESTS HERE! - - let mut expect_1 = g1.vertices().id().collect::>(); - let mut expect_n = gn.vertices().id().collect::>(); - - expect_1.sort(); - expect_n.sort(); - - assert_eq!(expect_1, expect_n, "Graphs are not equal {n_parts}"); - - for v_ref in g1.vertices().id() { - let v1 = g1.vertex(v_ref).unwrap().id(); - let vn = gn.vertex(v_ref).unwrap().id(); - assert_eq!(v1, vn, "Graphs are not equal {n_parts}"); - - let v_id = v1; - let v1 = g1.vertex(v_id).unwrap(); - let vn = gn.vertex(v_id).unwrap(); - let mut expect_1 = v1.neighbours().id().collect_vec(); - let mut expect_n = vn.neighbours().id().collect_vec(); - expect_1.sort(); - expect_n.sort(); - assert_eq!(expect_1, expect_n, "Graphs are not equal {n_parts}"); - - let mut expect_1 = v1.in_neighbours().id().collect_vec(); - let mut expect_n = vn.in_neighbours().id().collect_vec(); - expect_1.sort(); - expect_n.sort(); - assert_eq!(expect_1, expect_n, "Graphs are not equal {n_parts}"); - - let mut expect_1 = v1.out_neighbours().id().collect_vec(); - let mut expect_n = vn.out_neighbours().id().collect_vec(); - expect_1.sort(); - expect_n.sort(); - assert_eq!(expect_1, expect_n, "Graphs are not equal {n_parts}"); - - // now we test degrees - let expect_1 = v1.degree(); - let expect_n = vn.degree(); - assert_eq!(expect_1, expect_n, "Graphs are not equal {n_parts}"); - - let expect_1 = v1.in_degree(); - let expect_n = vn.in_degree(); - assert_eq!(expect_1, expect_n, "Graphs are not equal {n_parts}"); - - let expect_1 = 
v1.out_degree(); - let expect_n = vn.out_degree(); - assert_eq!(expect_1, expect_n, "Graphs are not equal {n_parts}"); - } - } - - check_graphs(&g1, &gn, n_parts); - - // TEMPORAL TESTS HERE! - let t_start = 0; - let t_end = 100; - let g1_w = g1.window(t_start, t_end); - let gn_w = gn.window(t_start, t_end); - - check_graphs(&g1_w, &gn_w, n_parts); - } - - #[derive(serde::Deserialize, Debug)] - struct Pair { - src: u64, - dst: u64, - t: i64, - } - - impl TestEdge for Pair { - fn src(&self) -> u64 { - self.src - } - - fn dst(&self) -> u64 { - self.dst - } - - fn t(&self) -> i64 { - self.t - } - } - - #[test] - fn load_graph_from_cargo_path() { - let csv_path: PathBuf = [env!("CARGO_MANIFEST_DIR"), "../../resource/", "test2.csv"] - .iter() - .collect(); - - let p = Path::new(&csv_path); - assert!(p.exists()); - - for n_parts in 1..33 { - test_graph_sanity::<&Path, Pair>(p, n_parts); - } - } - - #[derive(serde::Deserialize, Debug)] - struct PairNoTime { - src: u64, - dst: u64, - } - - impl TestEdge for PairNoTime { - fn src(&self) -> u64 { - self.src - } - - fn dst(&self) -> u64 { - self.dst - } - - fn t(&self) -> i64 { - 1 - } - } - - #[test] - fn connected_components() { - let csv_path: PathBuf = [env!("CARGO_MANIFEST_DIR"), "../../resource/", "test3.csv"] - .iter() - .collect(); - - let p = Path::new(&csv_path); - assert!(p.exists()); - let window = -100..100; - - for n_parts in 2..3 { - let g1 = Graph::new(1); - let gn = Graph::new(n_parts); - load::(&g1, &gn, csv_path.clone()); - - let iter_count = 50; - let cc1 = weakly_connected_components(&g1, iter_count, None); - let ccn = weakly_connected_components(&gn, iter_count, None); - - // get LCC - let counts = cc1.iter().counts_by(|(_, cc)| cc); - let max_1 = counts - .into_iter() - .sorted_by(|l, r| l.1.cmp(&r.1)) - .rev() - .take(1) - .next(); - - // get LCC - let counts = ccn.iter().counts_by(|(_, cc)| cc); - let max_n = counts - .into_iter() - .sorted_by(|l, r| l.1.cmp(&r.1)) - .rev() - .take(1) - .next(); - - 
assert_eq!(max_1, Some((&6, 1039))); - assert_eq!(max_1, max_n); - println!("{:?}", max_1); - } - } -} diff --git a/examples/rust/src/bin/hulongbay/main.rs b/examples/rust/src/bin/hulongbay/main.rs index cfce358570..a80ffab8e0 100644 --- a/examples/rust/src/bin/hulongbay/main.rs +++ b/examples/rust/src/bin/hulongbay/main.rs @@ -1,25 +1,22 @@ // #![allow(unused_imports)] -use std::env; -use std::error::Error; -use std::fmt::{Debug, Display, Formatter}; -use std::path::Path; - +#![allow(dead_code)] use itertools::Itertools; use raphtory::{ algorithms::{ - connected_components::weakly_connected_components, - motifs::three_node_temporal_motifs::{ - global_temporal_three_node_motif, global_temporal_three_node_motif_from_local, - temporal_three_node_motif, - }, - triangle_count::triangle_count, + connected_components::weakly_connected_components, triangle_count::triangle_count, }, graph_loader::source::csv_loader::CsvLoader, - prelude::{AdditionOps, EdgeListOps, Graph, GraphViewOps, Prop, TimeOps, VertexViewOps}, + prelude::*, }; use regex::Regex; use serde::Deserialize; -use std::time::Instant; +use std::{ + env, + error::Error, + fmt::{Debug, Display, Formatter}, + path::Path, + time::Instant, +}; #[derive(Deserialize, Debug)] pub struct Edge { @@ -67,14 +64,14 @@ pub fn loader(data_dir: &Path) -> Result> { println!( "Loaded graph from path {} with {} vertices, {} edges, took {} seconds", encoded_data_dir.display(), - g.num_vertices(), - g.num_edges(), + g.count_vertices(), + g.count_edges(), now.elapsed().as_secs() ); Ok(g) } else { - let g = Graph::new(16); + let g = Graph::new(); let now = Instant::now(); @@ -89,17 +86,17 @@ pub fn loader(data_dir: &Path) -> Result> { time, src, dst, - &vec![("amount".to_owned(), Prop::U64(sent.amount_usd))], + [("amount".to_owned(), Prop::U64(sent.amount_usd))], None, ) - .unwrap() + .unwrap(); })?; println!( "Loaded graph from CSV data files {} with {} vertices, {} edges which took {} seconds", encoded_data_dir.display(), - 
g.num_vertices(), - g.num_edges(), + g.count_vertices(), + g.count_edges(), now.elapsed().as_secs() ); @@ -113,10 +110,6 @@ fn try_main() -> Result<(), Box> { let data_dir = Path::new(args.get(1).ok_or(MissingArgumentError)?); let graph = loader(data_dir)?; - - let min_time = graph.start().ok_or(GraphEmptyError)?; - let max_time = graph.end().ok_or(GraphEmptyError)?; - let mid_time = (min_time + max_time) / 2; let now = Instant::now(); let motifs = global_temporal_three_node_motif( @@ -181,6 +174,13 @@ fn try_main() -> Result<(), Box> { // now.elapsed().as_secs() // ); + let now = Instant::now(); + let num_windowed_edges2 = window.count_edges(); + println!( + "Window num_edges returned {} in {} seconds", + num_windowed_edges2, + now.elapsed().as_secs() + ); // let now = Instant::now(); // let num_windowed_edges2 = window.num_edges(); // println!( @@ -210,39 +210,18 @@ fn try_main_bm() -> Result<(), Box> { println!("graph time range: {}-{}", earliest_time, latest_time); let now = Instant::now(); - let num_edges2 = graph.num_edges(); + let num_edges2 = graph.count_edges(); println!( "num_edges returned {} in {} milliseconds", num_edges2, now.elapsed().as_millis() ); - println!("\n Immutable graph metrics:"); - - let graph = graph.freeze(); - let now = Instant::now(); - let num_edges: usize = graph - .vertices() - .map(|v| graph.degree(v, Direction::OUT)) - .sum(); - + let num_exploded_edges = graph.edges().explode().count(); println!( - "Counting edges by summing degrees returned {} in {} milliseconds", - num_edges, - now.elapsed().as_millis() - ); - - let earliest_time = graph.earliest_time().ok_or(GraphEmptyError)?; - let latest_time = graph.latest_time().ok_or(GraphEmptyError)?; - - println!("graph time range: {}-{}", earliest_time, latest_time); - - let now = Instant::now(); - let num_edges2 = graph.num_edges(); - println!( - "num_edges returned {} in {} milliseconds", - num_edges2, + "counted {} exploded edges in {} milliseconds", + num_exploded_edges, 
now.elapsed().as_millis() ); diff --git a/examples/rust/src/bin/lotr/main.rs b/examples/rust/src/bin/lotr/main.rs index ef9cfd8c4f..f89412cf16 100644 --- a/examples/rust/src/bin/lotr/main.rs +++ b/examples/rust/src/bin/lotr/main.rs @@ -1,13 +1,14 @@ use itertools::Itertools; -use raphtory::algorithms::generic_taint::generic_taint; -use raphtory::core::utils; -use raphtory::core::Prop; -use raphtory::db::graph::Graph; -use raphtory::db::view_api::*; -use raphtory_io::graph_loader::source::csv_loader::CsvLoader; +use raphtory::{ + algorithms::temporal_reachability::temporally_reachable_nodes, core::utils::hashing, + graph_loader::source::csv_loader::CsvLoader, prelude::*, +}; use serde::Deserialize; -use std::path::PathBuf; -use std::{env, path::Path, time::Instant}; +use std::{ + env, + path::{Path, PathBuf}, + time::Instant, +}; #[derive(Deserialize, std::fmt::Debug)] pub struct Lotr { @@ -43,14 +44,14 @@ fn main() { println!( "Loaded graph from encoded data files {} with {} vertices, {} edges which took {} seconds", encoded_data_dir.to_str().unwrap(), - g.num_vertices(), - g.num_edges(), + g.count_vertices(), + g.count_edges(), now.elapsed().as_secs() ); g } else { - let g = Graph::new(2); + let g = Graph::new(); let now = Instant::now(); CsvLoader::new(data_dir) @@ -58,14 +59,14 @@ fn main() { g.add_vertex( lotr.time, lotr.src_id.clone(), - &vec![("type".to_string(), Prop::Str("Character".to_string()))], + [("type", Prop::str("Character"))], ) .expect("Failed to add vertex"); g.add_vertex( lotr.time, lotr.dst_id.clone(), - &vec![("type".to_string(), Prop::Str("Character".to_string()))], + [("type", Prop::str("Character"))], ) .expect("Failed to add vertex"); @@ -73,10 +74,7 @@ fn main() { lotr.time, lotr.src_id.clone(), lotr.dst_id.clone(), - &vec![( - "type".to_string(), - Prop::Str("Character Co-occurrence".to_string()), - )], + [("type", Prop::str("Character Co-occurrence"))], None, ) .expect("Failed to add edge"); @@ -86,8 +84,8 @@ fn main() { println!( 
"Loaded graph from CSV data files {} with {} vertices, {} edges which took {} seconds", encoded_data_dir.to_str().unwrap(), - g.num_vertices(), - g.num_edges(), + g.count_vertices(), + g.count_edges(), now.elapsed().as_secs() ); @@ -97,18 +95,18 @@ fn main() { g }; - assert_eq!(graph.num_vertices(), 139); - assert_eq!(graph.num_edges(), 701); + assert_eq!(graph.count_vertices(), 139); + assert_eq!(graph.count_edges(), 701); - let gandalf = utils::calculate_hash(&"Gandalf"); + let gandalf = hashing::calculate_hash(&"Gandalf"); assert_eq!(gandalf, 2760374808085341115); assert!(graph.has_vertex(gandalf)); assert_eq!(graph.vertex(gandalf).unwrap().name(), "Gandalf"); - let r = generic_taint(&graph, None, 20, 31930, vec!["Gandalf"], vec![]); + let r = temporally_reachable_nodes(&graph, None, 20, 31930, vec!["Gandalf"], None); assert_eq!( - r.keys().sorted().collect_vec(), + r.result.keys().sorted().collect_vec(), vec!["Gandalf", "Saruman", "Wormtongue"] ) } diff --git a/examples/rust/src/bin/pokec/main.rs b/examples/rust/src/bin/pokec/main.rs index c42adc0656..1d3cd55023 100644 --- a/examples/rust/src/bin/pokec/main.rs +++ b/examples/rust/src/bin/pokec/main.rs @@ -1,12 +1,16 @@ -use std::{time::Instant, env, path::Path}; - use raphtory::{ - algorithms::pagerank::unweighted_page_rank, - db::{graph::Graph, view_api::GraphViewOps}, + algorithms::{ + connected_components::weakly_connected_components, pagerank::unweighted_page_rank, + }, + db::{ + api::{mutation::AdditionOps, view::GraphViewOps}, + graph::graph::Graph, + }, + graph_loader::source::csv_loader::CsvLoader, + prelude::NO_PROPS, }; -use raphtory_io::graph_loader::source::csv_loader::CsvLoader; use serde::Deserialize; -use raphtory::algorithms::connected_components::weakly_connected_components; +use std::{env, path::Path, time::Instant}; #[derive(Deserialize, std::fmt::Debug)] struct Edge { @@ -15,52 +19,49 @@ struct Edge { } fn main() { - let shards = 2; - let now = Instant::now(); let args: Vec = 
env::args().collect(); - //let data_dir = Path::new(args.get(1).expect("No data directory provided")); - let data_dir = Path::new("/tmp/soc-pokec-relationships.txt"); + let data_dir = Path::new(args.get(1).expect("No data directory provided")); let g = if std::path::Path::new("/tmp/pokec").exists() { Graph::load_from_file("/tmp/pokec").unwrap() - } - else{ - let g = Graph::new(shards); + } else { + let g = Graph::new(); CsvLoader::new(data_dir) .set_delimiter("\t") .set_header(false) .load_into_graph(&g, |e: Edge, g| { - g.add_edge(0, e.src, e.dst, &vec![], None) + g.add_edge(0, e.src, e.dst, NO_PROPS, None) .expect("Failed to add edge"); }) .expect("Failed to load graph from encoded data files"); - g.save_to_file("/tmp/pokec"); + g.save_to_file("/tmp/pokec") + .expect("Failed to save graph to file"); g }; - println!( "Loaded graph from encoded data files {} with {} vertices, {} edges which took {} seconds", - "/tmp/soc-pokec-relationships.txt", - g.num_vertices(), - g.num_edges(), + data_dir.to_str().unwrap(), + g.count_vertices(), + g.count_edges(), now.elapsed().as_secs() ); - let frozen = g.freeze(); - let now = Instant::now(); - unweighted_page_rank(&frozen, 100, None , Some(0.00000001), true); + unweighted_page_rank(&g, 100, None, Some(0.00000001), true); println!("PageRank took {} millis", now.elapsed().as_millis()); let now = Instant::now(); - weakly_connected_components(&frozen, 100, None); + weakly_connected_components(&g, 100, None); - println!("Connected Components took {} millis", now.elapsed().as_millis()); + println!( + "Connected Components took {} millis", + now.elapsed().as_millis() + ); } diff --git a/js-raphtory/Cargo.toml b/js-raphtory/Cargo.toml index 62041cb5af..5d2b6f8aed 100644 --- a/js-raphtory/Cargo.toml +++ b/js-raphtory/Cargo.toml @@ -20,6 +20,8 @@ default = ["console_error_panic_hook"] [dependencies] wasm-bindgen = "0.2.63" +serde = { version = "1.0", features = ["derive"] } +serde-wasm-bindgen = "0.5.0" js-sys = "0.3" chrono = "0.4" 
raphtory = { path = "../raphtory" } diff --git a/js-raphtory/src/graph/edge.rs b/js-raphtory/src/graph/edge.rs index bd2c22731f..d368d7456c 100644 --- a/js-raphtory/src/graph/edge.rs +++ b/js-raphtory/src/graph/edge.rs @@ -1,13 +1,27 @@ -use raphtory::db::edge::EdgeView; -use raphtory::db::view_api::*; -use wasm_bindgen::prelude::*; - use super::Graph; -use crate::graph::{misc::JsProp, vertex::Vertex}; +use crate::graph::{misc::JsProp, vertex::Vertex, UnderGraph}; +use raphtory::db::{ + api::view::*, + graph::{edge::EdgeView, graph::Graph as TGraph}, +}; +use std::sync::Arc; +use wasm_bindgen::prelude::*; #[wasm_bindgen] pub struct Edge(pub(crate) EdgeView); +impl From> for Edge { + fn from(value: EdgeView) -> Self { + let graph = value.graph; + let eref = value.edge; + let js_graph = Graph(UnderGraph::TGraph(Arc::new(graph))); + Edge(EdgeView { + graph: js_graph, + edge: eref, + }) + } +} + #[wasm_bindgen] impl Edge { #[wasm_bindgen(js_name = source)] @@ -22,16 +36,17 @@ impl Edge { #[wasm_bindgen(js_name = properties)] pub fn properties(&self) -> js_sys::Map { + let t_props = self.0.properties(); let obj = js_sys::Map::new(); - for (k, v) in self.0.properties(true) { - obj.set(&k.into(), &JsProp(v).into()); + for (k, v) in t_props.iter() { + obj.set(&k.to_string().into(), &JsProp(v).into()); } obj } #[wasm_bindgen(js_name = getProperty)] pub fn get_property(&self, name: String) -> JsValue { - if let Some(prop) = self.0.property(name, true).map(JsProp) { + if let Some(prop) = self.0.properties().get(&name).map(JsProp) { prop.into() } else { JsValue::NULL diff --git a/js-raphtory/src/graph/graph_view_impl.rs b/js-raphtory/src/graph/graph_view_impl.rs index 42cbfe92e8..ca6e794334 100644 --- a/js-raphtory/src/graph/graph_view_impl.rs +++ b/js-raphtory/src/graph/graph_view_impl.rs @@ -1,14 +1,15 @@ -use raphtory::db::view_api::internal::{GraphViewInternalOps, WrappedGraph}; - use super::{Graph, UnderGraph}; +use raphtory::db::api::view::internal::{Base, 
BoxableGraphView, InheritViewOps}; -impl WrappedGraph for Graph { - type Internal = dyn GraphViewInternalOps + Send + Sync + 'static; +impl Base for Graph { + type Base = dyn BoxableGraphView + Send + Sync + 'static; - fn as_graph(&self) -> &(dyn GraphViewInternalOps + Send + Sync + 'static) { + fn base(&self) -> &(dyn BoxableGraphView + Send + Sync + 'static) { match &self.0 { UnderGraph::TGraph(g) => g.as_ref(), UnderGraph::WindowedGraph(g) => g.as_ref(), } } } + +impl InheritViewOps for Graph {} diff --git a/js-raphtory/src/graph/misc.rs b/js-raphtory/src/graph/misc.rs index 5290467cc3..29a57f2e33 100644 --- a/js-raphtory/src/graph/misc.rs +++ b/js-raphtory/src/graph/misc.rs @@ -1,10 +1,9 @@ -use std::ops::Deref; -use std::sync::Arc; - use crate::graph::{Graph, UnderGraph}; use chrono::{Datelike, Timelike}; use js_sys::Array; -use raphtory::core::{tgraph_shard::errors::GraphError, Prop}; +use raphtory::core::{utils::errors::GraphError, Prop}; +use serde::{Deserialize, Serialize}; +use std::{ops::Deref, sync::Arc}; use wasm_bindgen::{prelude::wasm_bindgen, JsValue}; #[wasm_bindgen] @@ -13,13 +12,16 @@ pub struct JSError(pub(crate) GraphError); pub(crate) struct JsObjectEntry(pub(crate) JsValue); +#[derive(Serialize, Deserialize)] #[repr(transparent)] pub(crate) struct JsProp(pub(crate) Prop); -impl Into for JsProp { - fn into(self) -> JsValue { - match self.0 { - raphtory::core::Prop::Str(v) => v.into(), +impl From for JsValue { + fn from(value: JsProp) -> JsValue { + match value.0 { + raphtory::core::Prop::U8(v) => v.into(), + raphtory::core::Prop::U16(v) => v.into(), + raphtory::core::Prop::Str(v) => v.to_string().into(), raphtory::core::Prop::I32(v) => v.into(), raphtory::core::Prop::I64(v) => v.into(), raphtory::core::Prop::U32(v) => v.into(), @@ -40,6 +42,14 @@ impl Into for JsProp { .into() } Prop::Graph(v) => Graph(UnderGraph::TGraph(Arc::new(v))).into(), + Prop::List(v) => { + let v: Array = v.iter().map(|v| JsValue::from(JsProp(v.clone()))).collect(); + 
v.into() + } + Prop::Map(v) => { + let v = v.deref().clone(); + serde_wasm_bindgen::to_value(&v).unwrap() + } } } } @@ -58,6 +68,6 @@ impl From for Option<(String, Prop)> { let key = arr.at(0).as_string().unwrap(); let value = arr.at(1).as_string().unwrap(); - Some((key, Prop::Str(value))) + Some((key, Prop::str(value))) } } diff --git a/js-raphtory/src/graph/mod.rs b/js-raphtory/src/graph/mod.rs index e49ccdf13e..65bec2841c 100644 --- a/js-raphtory/src/graph/mod.rs +++ b/js-raphtory/src/graph/mod.rs @@ -1,27 +1,29 @@ +#![allow(dead_code)] #[cfg(feature = "console_error_panic_hook")] extern crate console_error_panic_hook; use core::panic; -use std::convert::TryFrom; -use std::sync::Arc; - use js_sys::Object; -use raphtory::core::tgraph_shard::errors::GraphError; -use raphtory::core::Prop; -use raphtory::db::graph::Graph as TGraph; -use raphtory::db::graph_window::WindowedGraph; -use raphtory::db::view_api::internal::GraphViewInternalOps; -use raphtory::db::view_api::GraphViewOps; -use raphtory::db::view_api::TimeOps; -use wasm_bindgen::prelude::*; -use wasm_bindgen::JsCast; - -use crate::graph::misc::JSError; -use crate::graph::misc::JsObjectEntry; -use crate::graph::vertex::JsVertex; -use crate::graph::vertex::Vertex; -use crate::log; -use crate::utils::set_panic_hook; +use raphtory::{ + core::utils::errors::GraphError, + db::{ + api::view::{internal::BoxableGraphView, GraphViewOps, TimeOps}, + graph::{graph::Graph as TGraph, views::window_graph::WindowedGraph}, + }, + prelude::*, +}; +use std::{convert::TryFrom, sync::Arc}; +use wasm_bindgen::{prelude::*, JsCast}; + +use crate::{ + graph::{ + edge::Edge, + misc::{JSError, JsObjectEntry}, + vertex::{JsVertex, Vertex}, + }, + log, + utils::set_panic_hook, +}; mod edge; mod graph_view_impl; @@ -48,7 +50,7 @@ impl UnderGraph { } // a bit heavy but might work - pub fn graph(&self) -> Box> { + pub fn graph(&self) -> Box> { match self { UnderGraph::TGraph(g) => Box::new(g.clone()), UnderGraph::WindowedGraph(g) => 
Box::new(g.clone()), @@ -61,7 +63,7 @@ impl Graph { #[wasm_bindgen(constructor)] pub fn new() -> Self { set_panic_hook(); - Graph(UnderGraph::TGraph(Arc::new(TGraph::new(1)))) + Graph(UnderGraph::TGraph(Arc::new(TGraph::new()))) } #[wasm_bindgen(js_name = window)] @@ -95,9 +97,9 @@ impl Graph { } #[wasm_bindgen(js_name = addVertex)] - pub fn add_vertex_js(&self, t: i64, id: JsValue, js_props: Object) -> Result<(), JSError> { + pub fn add_vertex_js(&self, t: i64, id: JsValue, js_props: Object) -> Result { let rust_props = if js_props.is_string() { - vec![("name".to_string(), Prop::Str(js_props.as_string().unwrap()))] + vec![("name".to_string(), Prop::str(js_props.as_string().unwrap()))] } else if js_props.is_object() { Object::entries(&js_props) .iter() @@ -113,11 +115,13 @@ impl Graph { match JsVertex::try_from(id)? { JsVertex::Str(vertex) => self .mutable_graph() - .add_vertex(t, vertex, &rust_props) + .add_vertex(t, vertex, rust_props) + .map(|v| v.into()) .map_err(JSError), JsVertex::Number(vertex) => self .mutable_graph() - .add_vertex(t, vertex, &rust_props) + .add_vertex(t, vertex, rust_props) + .map(|v| v.into()) .map_err(JSError), } } @@ -129,7 +133,7 @@ impl Graph { src: JsValue, dst: JsValue, js_props: Object, - ) -> Result<(), JSError> { + ) -> Result { js_props.dyn_ref::().map(|bigint| { log(&format!("bigint: {:?}", bigint)); }); @@ -151,12 +155,14 @@ impl Graph { match (JsVertex::try_from(src)?, JsVertex::try_from(dst)?) 
{ (JsVertex::Str(src), JsVertex::Str(dst)) => self .mutable_graph() - .add_edge(t, src, dst, &props, None) - .map_err(JSError), + .add_edge(t, src, dst, props, None) + .map_err(JSError) + .map(|e| e.into()), (JsVertex::Number(src), JsVertex::Number(dst)) => self .mutable_graph() - .add_edge(t, src, dst, &props, None) - .map_err(JSError), + .add_edge(t, src, dst, props, None) + .map_err(JSError) + .map(|e| e.into()), _ => Err(JSError(GraphError::VertexIdNotStringOrNumber)), } } diff --git a/js-raphtory/src/graph/vertex.rs b/js-raphtory/src/graph/vertex.rs index a6881db01f..932d13cde6 100644 --- a/js-raphtory/src/graph/vertex.rs +++ b/js-raphtory/src/graph/vertex.rs @@ -1,18 +1,27 @@ -use std::convert::TryFrom; - +use super::{misc::JSError, Graph}; +use crate::graph::{edge::Edge, misc::JsProp, UnderGraph}; use raphtory::{ - core::tgraph_shard::errors::GraphError, - db::{vertex::VertexView, view_api::VertexViewOps}, + core::utils::errors::GraphError, + db::{ + api::view::VertexViewOps, + graph::{graph::Graph as TGraph, vertex::VertexView}, + }, }; +use std::{convert::TryFrom, sync::Arc}; use wasm_bindgen::prelude::*; -use crate::graph::{edge::Edge, misc::JsProp}; - -use super::{misc::JSError, Graph}; - #[wasm_bindgen] pub struct Vertex(pub(crate) VertexView); +impl From> for Vertex { + fn from(value: VertexView) -> Self { + let vid = value.vertex; + let graph = value.graph; + let js_graph = Graph(UnderGraph::TGraph(Arc::new(graph))); + Vertex(VertexView::new_internal(js_graph, vid)) + } +} + #[wasm_bindgen] impl Vertex { #[wasm_bindgen(js_name = id)] @@ -90,19 +99,19 @@ impl Vertex { #[wasm_bindgen(js_name = properties)] pub fn properties(&self) -> js_sys::Map { let obj = js_sys::Map::new(); - for (k, v) in self.0.properties(true) { - obj.set(&k.into(), &JsProp(v).into()); + for (k, v) in self.0.properties() { + obj.set(&k.to_string().into(), &JsProp(v).into()); } obj } #[wasm_bindgen(js_name = getProperty)] pub fn get_property(&self, name: String) -> JsValue { - if 
let Some(prop) = self.0.property(name, true).map(JsProp) { - prop.into() - } else { - JsValue::NULL - } + self.0 + .properties() + .get(&name) + .map(|v| JsProp(v).into()) + .unwrap_or(JsValue::NULL) } } diff --git a/paper/joss-raphtory.bib b/paper/joss-raphtory.bib index 152299de89..ac98224a00 100644 --- a/paper/joss-raphtory.bib +++ b/paper/joss-raphtory.bib @@ -6,7 +6,8 @@ @article{gauvin2022randomized number={4}, pages={763--830}, year={2022}, - publisher={SIAM} + publisher={SIAM}, + doi = {10.1137/19M1242252} } @article{bovet2021centralities, @@ -21,7 +22,8 @@ @inproceedings{tang2010analysing author={Tang, John and Musolesi, Mirco and Mascolo, Cecilia and Latora, Vito and Nicosia, Vincenzo}, booktitle={Proceedings of the 3rd Workshop on Social Network Systems}, pages={1--6}, - year={2010} + year={2010}, + doi={10.1145/1852658.1852661} } @article{goh2008burstiness, @@ -32,7 +34,8 @@ @article{goh2008burstiness number={4}, pages={48002}, year={2008}, - publisher={IOP Publishing} + publisher={IOP Publishing}, + doi = {10.1209/0295-5075/81/48002} } @article{pfitzner2013betweenness, title={Betweenness preference: Quantifying correlations in the topological dynamics of temporal networks}, @@ -42,7 +45,8 @@ @article{pfitzner2013betweenness number={19}, pages={198701}, year={2013}, - publisher={APS} + publisher={APS}, + doi = {10.1103/physrevlett.110.198701} } @article{steer2020raphtory, @@ -52,7 +56,8 @@ @article{steer2020raphtory volume={102}, pages={453--464}, year={2020}, - publisher={Elsevier} + publisher={Elsevier}, + doi = {10.1016/j.future.2019.08.022}, } @article{yousaf2023non, @@ -69,7 +74,8 @@ @article{badie2023reticula volume={21}, pages={101301}, year={2023}, - publisher={Elsevier} + publisher={Elsevier}, + doi = {10.1016/j.softx.2022.101301}, } @inproceedings{hackl2021analysis, @@ -77,7 +83,8 @@ @inproceedings{hackl2021analysis author={Hackl, J{\"u}rgen and Scholtes, Ingo and Petrovi{\'c}, Luka V and Perri, Vincenzo and Verginer, Luca and Gote, 
Christoph}, booktitle={Companion Proceedings of the Web Conference 2021}, pages={530--532}, - year={2021} + year={2021}, + doi = {10.1145/3442442.3452052} } @article{csardi2006igraph, @@ -87,7 +94,8 @@ @article{csardi2006igraph volume={1695}, number={5}, pages={1--9}, - year={2006} + year={2006}, + doi = {10.5281/zenodo.7682609} } @article{zhang2015dynamic, @@ -102,6 +110,7 @@ @article{peixoto2014graph author={Peixoto, Tiago P}, journal={figshare}, year={2014} + doi = {10.6084/m9.figshare.1164194.v14} } @techreport{hagberg2008exploring, @@ -119,7 +128,8 @@ @article{starnini2012random number={5}, pages={056115}, year={2012}, - publisher={APS} + publisher={APS}, + doi = {10.1103/PhysRevE.85.056115} } @article{delvenne2010stability, @@ -130,7 +140,8 @@ @article{delvenne2010stability number={29}, pages={12755--12760}, year={2010}, - publisher={National Acad Sciences} + publisher={National Acad Sciences}, + doi = {10.1073/pnas.0903215107} } @@ -138,14 +149,16 @@ @book{langville2006google title={Google's PageRank and beyond: The science of search engine rankings}, author={Langville, Amy N and Meyer, Carl D}, year={2006}, - publisher={Princeton university press} + publisher={Princeton university press}, + doi = {10.1063/1.2711640}, } @inproceedings{qiu2018network, title={Network embedding as matrix factorization: Unifying deepwalk, line, pte, and node2vec}, author={Qiu, Jiezhong and Dong, Yuxiao and Ma, Hao and Li, Jian and Wang, Kuansan and Tang, Jie}, booktitle={Proceedings of the eleventh ACM international conference on web search and data mining}, pages={459--467}, - year={2018} + year={2018}, + doi = {10.1145/3159652.3159706} } @article{karsai2012universal, @@ -156,7 +169,8 @@ @article{karsai2012universal number={1}, pages={397}, year={2012}, - publisher={Nature Publishing Group UK London} + publisher={Nature Publishing Group UK London}, + doi = {10.1038/srep00397}, } @article{donnat2018tracking, @@ -167,7 +181,8 @@ @article{donnat2018tracking number={2}, 
pages={971--1012}, year={2018}, - publisher={JSTOR} + publisher={JSTOR}, + doi = {10.1214/18-aoas1176} } @article{malmgren2008poissonian, title={A Poissonian explanation for heavy tails in e-mail communication}, @@ -177,7 +192,8 @@ @article{malmgren2008poissonian number={47}, pages={18153--18158}, year={2008}, - publisher={National Acad Sciences} + publisher={National Acad Sciences}, + doi = {10.1073/pnas.0800332105} } @article{lambiotte2019networks, @@ -188,14 +204,16 @@ @article{lambiotte2019networks number={4}, pages={313--320}, year={2019}, - publisher={Nature Publishing Group UK London} + publisher={Nature Publishing Group UK London}, + doi = {10.1038/s41567-019-0459-y} } @book{newman2018networks, title={Networks}, author={Newman, Mark}, year={2018}, - publisher={Oxford University Press} + publisher={Oxford University Press}, + doi = {10.1093/oso/9780198805090.001.0001} } @article{holme2012temporal, @@ -205,14 +223,16 @@ @article{holme2012temporal volume={519}, number={3}, pages={97--125}, - year={2012} + year={2012}, + doi = {10.1007/978-3-642-36461-7} } @book{masuda2016guide, title={A guide to temporal networks}, author={Masuda, Naoki and Lambiotte, Renaud}, year={2016}, - publisher={World Scientific} + publisher={World Scientific}, + doi = {10.1142/q0033} } @article{arnold2021moving, @@ -220,7 +240,8 @@ @article{arnold2021moving author={Arnold, Naomi A and Steer, Benjamin and Hafnaoui, Imane and Parada G, Hugo A and Mondrag{\'o}n, Raul J and Cuadrado, F{\'e}lix and Clegg, Richard G}, journal={Proceedings of the ACM on Human-Computer Interaction}, number={CSCW}, - year={2021} + year={2021}, + doi = {10.1145/3479591} } @inproceedings{paranjape2017motifs, @@ -228,14 +249,16 @@ @inproceedings{paranjape2017motifs author={Paranjape, Ashwin and Benson, Austin R and Leskovec, Jure}, booktitle={Proceedings of the tenth ACM international conference on web search and data mining}, pages={601--610}, - year={2017} + year={2017}, + doi = {10.1145/3018661.3018731} } 
@inproceedings{Chronograph, author = {Erb, Benjamin and Mei\ss{}ner, Dominik and Pietron, Jakob and Kargl, Frank}, title = {Chronograph: A Distributed Processing Platform for Online and Batch Computations on Event-Sourced Graphs}, year = {2017}, - booktitle = {Proceedings of the 11th ACM International Conference on Distributed and Event-Based Systems} + booktitle = {Proceedings of the 11th ACM International Conference on Distributed and Event-Based Systems}, + doi = {10.1145/3093742.3093913} } @misc{RecallGraph, @@ -268,5 +291,6 @@ @article{lucas2023inferring volume={3}, number={2}, year={2023}, - publisher={Elsevier} + publisher={Elsevier}, + doi = {10.1101/2021.03.26.437187} } \ No newline at end of file diff --git a/py-raphtory/.gitignore b/py-raphtory/.gitignore deleted file mode 100644 index af3ca5ef1c..0000000000 --- a/py-raphtory/.gitignore +++ /dev/null @@ -1,72 +0,0 @@ -/target - -# Byte-compiled / optimized / DLL files -__pycache__/ -.pytest_cache/ -*.py[cod] - -# C extensions -*.so - -# Distribution / packaging -.Python -.venv/ -env/ -bin/ -build/ -develop-eggs/ -dist/ -eggs/ -lib/ -lib64/ -parts/ -sdist/ -var/ -include/ -man/ -venv/ -*.egg-info/ -.installed.cfg -*.egg - -# Installer logs -pip-log.txt -pip-delete-this-directory.txt -pip-selfcheck.json - -# Unit test / coverage reports -htmlcov/ -.tox/ -.coverage -.cache -nosetests.xml -coverage.xml - -# Translations -*.mo - -# Mr Developer -.mr.developer.cfg -.project -.pydevproject - -# Rope -.ropeproject - -# Django stuff: -*.log -*.pot - -.DS_Store - -# Sphinx documentation -docs/_build/ - -# PyCharm -.idea/ - -# VSCode -.vscode/ - -# Pyenv -.python-version \ No newline at end of file diff --git a/py-raphtory/Cargo.toml b/py-raphtory/Cargo.toml deleted file mode 100644 index e418cc1d40..0000000000 --- a/py-raphtory/Cargo.toml +++ /dev/null @@ -1,36 +0,0 @@ -[package] -name = "py-raphtory" -description = "Raphtory python bindings allowing custom rust algorithms compatible with the python client" 
-version.workspace = true -edition.workspace = true -rust-version.workspace = true -keywords.workspace = true -authors.workspace = true -documentation.workspace = true -repository.workspace = true -license.workspace = true -readme.workspace = true -homepage.workspace = true -doc = false -# See more keys and their definitions at https://doc.rust-lang.org/cargo/reference/manifest.html - -[dependencies] -pyo3 = {version="0.18.1", features=["multiple-pymethods", "chrono"]} -raphtory = {path = "../raphtory", version = "0.4.0" } -raphtory-io = {path = "../raphtory-io", version = "0.4.0" } -rustc-hash = "1.1.0" -parking_lot = { version = "0.12" , features = ["serde"] } -flume = "0.10" -futures = {version = "0.3", features = ["thread-pool"] } -replace_with = "0.1" -itertools="0.10" -csv = "1.1.6" -flate2 = "1.0" -regex = "1" -serde = { version = "1", features = ["derive", "rc"] } -rayon = "1" -chrono = "0.4" -bincode = "1" -display-error-chain = "0.1.1" -num = "0.4.0" -tokio = { version = "1.27.0", features = ["full"] } diff --git a/py-raphtory/src/algorithms.rs b/py-raphtory/src/algorithms.rs deleted file mode 100644 index cff6db0c62..0000000000 --- a/py-raphtory/src/algorithms.rs +++ /dev/null @@ -1,241 +0,0 @@ -/// Implementations of various graph algorithms that can be run on a graph. 
-/// -/// To run an algorithm simply import the module and call the function with the graph as the argument -/// -use crate::graph_view::PyGraphView; -use std::collections::HashMap; - -use crate::utils; -use crate::utils::{extract_input_vertex, InputVertexBox}; -use pyo3::prelude::*; -use raphtory::algorithms::connected_components; -use raphtory::algorithms::degree::{ - average_degree as average_degree_rs, max_in_degree as max_in_degree_rs, - max_out_degree as max_out_degree_rs, min_in_degree as min_in_degree_rs, - min_out_degree as min_out_degree_rs, -}; -use raphtory::algorithms::directed_graph_density::directed_graph_density as directed_graph_density_rs; -use raphtory::algorithms::generic_taint::generic_taint as generic_taint_rs; -use raphtory::algorithms::local_clustering_coefficient::local_clustering_coefficient as local_clustering_coefficient_rs; -use raphtory::algorithms::local_triangle_count::local_triangle_count as local_triangle_count_rs; -use raphtory::algorithms::motifs::three_node_local::global_temporal_three_node_motif as global_temporal_three_node_motif_rs; -use raphtory::algorithms::motifs::three_node_local::global_temporal_three_node_motif_from_local as global_temporal_three_node_motif_from_local_rs; -use raphtory::algorithms::motifs::three_node_local::temporal_three_node_motif as temporal_three_node_motif_rs; -use raphtory::algorithms::pagerank::unweighted_page_rank; -use raphtory::algorithms::reciprocity::{ - all_local_reciprocity as all_local_reciprocity_rs, global_reciprocity as global_reciprocity_rs, -}; - -/// Local triangle count - calculates the number of triangles (a cycle of length 3) for a node. -/// It measures the local clustering of a graph. -/// -/// This is useful for understanding the level of connectivity and the likelihood of information -/// or influence spreading through a network. 
-/// -/// For example, in a social network, the local triangle count of a user's profile can reveal the -/// number of mutual friends they have and the level of interconnectivity between those friends. -/// A high local triangle count for a user indicates that they are part of a tightly-knit group -/// of people, which can be useful for targeted advertising or identifying key influencers -/// within a network. -/// -/// Local triangle count can also be used in other domains such as biology, where it can be used -/// to analyze protein interaction networks, or in transportation networks, where it can be used -/// to identify critical junctions or potential traffic bottlenecks. -/// -#[pyfunction] -pub fn local_triangle_count(g: &PyGraphView, v: &PyAny) -> PyResult> { - let v = utils::extract_vertex_ref(v)?; - Ok(local_triangle_count_rs(&g.graph, v)) -} - -#[pyfunction] -pub fn weakly_connected_components( - g: &PyGraphView, - iter_count: usize, -) -> PyResult> { - Ok(connected_components::weakly_connected_components( - &g.graph, iter_count, None, - )) -} - -#[pyfunction] -pub fn pagerank( - g: &PyGraphView, - iter_count: usize, - max_diff: Option, -) -> PyResult> { - Ok(unweighted_page_rank(&g.graph, iter_count, None, max_diff, true)) -} - -#[pyfunction] -pub fn generic_taint( - g: &PyGraphView, - iter_count: usize, - start_time: i64, - infected_nodes: Vec<&PyAny>, - stop_nodes: Vec<&PyAny>, -) -> Result>, PyErr> { - let infected_nodes: PyResult> = infected_nodes - .into_iter() - .map(|v| extract_input_vertex(v)) - .collect(); - let stop_nodes: PyResult> = stop_nodes - .into_iter() - .map(|v| extract_input_vertex(v)) - .collect(); - - Ok(generic_taint_rs( - &g.graph, - None, - iter_count, - start_time, - infected_nodes?, - stop_nodes?, - )) -} - -/// Local Clustering coefficient - measures the degree to which nodes in a graph tend to cluster together. 
-/// -/// It is calculated by dividing the number of triangles (sets of three nodes that are all -/// connected to each other) in the graph by the total number of possible triangles. -/// The resulting value is a number between 0 and 1 that represents the density of -/// clustering in the graph. -/// -/// A high clustering coefficient indicates that nodes tend to be -/// connected to nodes that are themselves connected to each other, while a low clustering -/// coefficient indicates that nodes tend to be connected to nodes that are not connected -/// to each other. -/// -/// In a social network of a particular community, we can compute the clustering -/// coefficient of each node to get an idea of how strongly connected and cohesive -/// that node's neighborhood is. -/// -/// A high clustering coefficient for a node in a social network indicates that the -/// node's neighbors tend to be strongly connected with each other, forming a tightly-knit -/// group or community. In contrast, a low clustering coefficient for a node indicates that -/// its neighbors are relatively less connected with each other, suggesting a more fragmented -/// or diverse community. -#[pyfunction] -pub fn local_clustering_coefficient(g: &PyGraphView, v: &PyAny) -> PyResult> { - let v = utils::extract_vertex_ref(v)?; - Ok(local_clustering_coefficient_rs(&g.graph, v)) -} - -/// Graph density - measures how dense or sparse a graph is. -/// -/// It is defined as the ratio of the number of edges in the graph to the total number of possible -/// edges. A dense graph has a high edge-to-vertex ratio, while a sparse graph has a low -/// edge-to-vertex ratio. -/// -/// For example in social network analysis, a dense graph may indicate a highly interconnected -/// community, while a sparse graph may indicate more isolated individuals. -#[pyfunction] -pub fn directed_graph_density(g: &PyGraphView) -> f32 { - directed_graph_density_rs(&g.graph) -} - -/// The average degree of all vertices in the graph. 
-#[pyfunction] -pub fn average_degree(g: &PyGraphView) -> f64 { - average_degree_rs(&g.graph) -} - -/// The maximum out degree of any vertex in the graph. -#[pyfunction] -pub fn max_out_degree(g: &PyGraphView) -> usize { - max_out_degree_rs(&g.graph) -} - -/// The maximum in degree of any vertex in the graph. -#[pyfunction] -pub fn max_in_degree(g: &PyGraphView) -> usize { - max_in_degree_rs(&g.graph) -} - -/// The minimum out degree of any vertex in the graph. -#[pyfunction] -pub fn min_out_degree(g: &PyGraphView) -> usize { - min_out_degree_rs(&g.graph) -} - -/// The minimum in degree of any vertex in the graph. -#[pyfunction] -pub fn min_in_degree(g: &PyGraphView) -> usize { - min_in_degree_rs(&g.graph) -} - -/// Reciprocity - measure of the symmetry of relationships in a graph, the global reciprocity of -/// the entire graph. -/// This calculates the number of reciprocal connections (edges that go in both directions) in a -/// graph and normalizes it by the total number of edges. -/// -/// In a social network context, reciprocity measures the likelihood that if person A is linked -/// to person B, then person B is linked to person A. This algorithm can be used to determine the -/// level of symmetry or balance in a social network. It can also reveal the power dynamics in a -/// group or community. For example, if one person has many connections that are not reciprocated, -/// it could indicate that this person has more power or influence in the network than others. -/// -/// In a business context, reciprocity can be used to study customer behavior. For instance, in a -/// transactional network, if a customer tends to make a purchase from a seller and then the seller -/// makes a purchase from the same customer, it can indicate a strong reciprocal relationship -/// between them. On the other hand, if the seller does not make a purchase from the same customer, -/// it could imply a less reciprocal or more one-sided relationship. 
-#[pyfunction] -pub fn global_reciprocity(g: &PyGraphView) -> f64 { - global_reciprocity_rs(&g.graph, None) -} - -/// Reciprocity - measure of the symmetry of relationships in a graph. -/// the reciprocity of every vertex in the graph as a tuple of vector id and the reciprocity -/// This calculates the number of reciprocal connections (edges that go in both directions) in a -/// graph and normalizes it by the total number of edges. -/// -/// In a social network context, reciprocity measures the likelihood that if person A is linked -/// to person B, then person B is linked to person A. This algorithm can be used to determine the -/// level of symmetry or balance in a social network. It can also reveal the power dynamics in a -/// group or community. For example, if one person has many connections that are not reciprocated, -/// it could indicate that this person has more power or influence in the network than others. -/// -/// In a business context, reciprocity can be used to study customer behavior. For instance, in a -/// transactional network, if a customer tends to make a purchase from a seller and then the seller -/// makes a purchase from the same customer, it can indicate a strong reciprocal relationship -/// between them. On the other hand, if the seller does not make a purchase from the same customer, -/// it could imply a less reciprocal or more one-sided relationship. -/// -#[pyfunction] -pub fn all_local_reciprocity(g: &PyGraphView) -> HashMap { - all_local_reciprocity_rs(&g.graph, None) -} - -/// Computes the number of both open and closed triplets within a graph -/// -/// An open triplet, is one where a node has two neighbors, but no edge between them. -/// A closed triplet is one where a node has two neighbors, and an edge between them. -#[pyfunction] -pub fn triplet_count(g: &PyGraphView) -> usize { - raphtory::algorithms::triplet_count::triplet_count(&g.graph, None) -} - -/// Computes the global clustering coefficient of a graph. 
The global clustering coefficient is -/// defined as the number of triangles in the graph divided by the number of triplets in the graph. -#[pyfunction] -pub fn global_clustering_coefficient(g: &PyGraphView) -> f64 { - raphtory::algorithms::clustering_coefficient::clustering_coefficient(&g.graph) -} - -#[pyfunction] -pub fn temporal_three_node_motif(g: &PyGraphView, delta: i64) -> HashMap> { - temporal_three_node_motif_rs(&g.graph, None, delta) -} - -#[pyfunction] -pub fn global_temporal_three_node_motif(g: &PyGraphView, delta: i64) -> Vec { - global_temporal_three_node_motif_rs(&g.graph, None, delta) -} - -#[pyfunction] -pub fn global_temporal_three_node_motif_from_local( - counts: HashMap>, -) -> Vec { - global_temporal_three_node_motif_from_local_rs(counts) -} diff --git a/py-raphtory/src/dynamic.rs b/py-raphtory/src/dynamic.rs deleted file mode 100644 index a3dc3945ff..0000000000 --- a/py-raphtory/src/dynamic.rs +++ /dev/null @@ -1,44 +0,0 @@ -use raphtory::db::graph::Graph; -use raphtory::db::graph_layer::LayeredGraph; -use raphtory::db::graph_window::WindowedGraph; -use raphtory::db::view_api::internal::{GraphViewInternalOps, WrappedGraph}; -use raphtory::db::view_api::GraphViewOps; -use std::sync::Arc; - -#[derive(Clone)] -pub struct DynamicGraph(Arc); - -pub trait IntoDynamic { - fn into_dynamic(self) -> DynamicGraph; -} - -impl IntoDynamic for Graph { - fn into_dynamic(self) -> DynamicGraph { - DynamicGraph(self.as_arc()) - } -} - -impl IntoDynamic for WindowedGraph { - fn into_dynamic(self) -> DynamicGraph { - DynamicGraph(Arc::new(self)) - } -} - -impl IntoDynamic for LayeredGraph { - fn into_dynamic(self) -> DynamicGraph { - DynamicGraph(Arc::new(self)) - } -} - -impl IntoDynamic for DynamicGraph { - fn into_dynamic(self) -> DynamicGraph { - self - } -} - -impl WrappedGraph for DynamicGraph { - type Internal = dyn GraphViewInternalOps + Send + Sync + 'static; - fn as_graph(&self) -> &(dyn GraphViewInternalOps + Send + Sync + 'static) { - &*self.0 - } -} 
diff --git a/py-raphtory/src/edge.rs b/py-raphtory/src/edge.rs deleted file mode 100644 index 3a7c466273..0000000000 --- a/py-raphtory/src/edge.rs +++ /dev/null @@ -1,549 +0,0 @@ -//! The edge module contains the PyEdge class, which is used to represent edges in the graph and -//! provides access to the edge's properties and vertices. -//! -//! The PyEdge class also provides access to the perspective APIs, which allow the user to view the -//! edge as it existed at a particular point in time, or as it existed over a particular time range. -//! -use crate::dynamic::{DynamicGraph, IntoDynamic}; -use crate::types::repr::{iterator_repr, Repr}; -use crate::utils::*; -use crate::vertex::{PyVertex, PyVertexIterable}; -use crate::wrappers::iterators::{OptionI64Iterable, OptionPropIterable}; -use crate::wrappers::prop::Prop; -use chrono::NaiveDateTime; -use itertools::Itertools; -use pyo3::prelude::*; -use pyo3::{pyclass, pymethods, PyAny, PyRef, PyRefMut, PyResult}; -use raphtory::db::edge::EdgeView; -use raphtory::db::view_api::*; -use std::collections::HashMap; -use std::sync::Arc; - -/// PyEdge is a Python class that represents an edge in the graph. -/// An edge is a directed connection between two vertices. -#[pyclass(name = "Edge")] -pub struct PyEdge { - pub(crate) edge: EdgeView, -} - -impl From> for PyEdge { - fn from(value: EdgeView) -> Self { - Self { - edge: EdgeView { - graph: value.graph.clone().into_dynamic(), - edge: value.edge, - }, - } - } -} - -impl IntoPyObject for EdgeView { - fn into_py_object(self) -> PyObject { - let py_version: PyEdge = self.into(); - Python::with_gil(|py| py_version.into_py(py)) - } -} - -/// PyEdge is a Python class that represents an edge in the graph. -/// An edge is a directed connection between two vertices. -#[pymethods] -impl PyEdge { - pub fn __getitem__(&self, name: String) -> Option { - self.property(name, Some(true)) - } - - /// Returns the value of the property with the given name. 
- /// If the property is not found, None is returned. - /// If the property is found, the value of the property is returned. - /// - /// Arguments: - /// name (str): The name of the property to retrieve. - /// - /// Returns: - /// The value of the property with the given name. - #[pyo3(signature = (name, include_static = true))] - pub fn property(&self, name: String, include_static: Option) -> Option { - let include_static = include_static.unwrap_or(true); - self.edge - .property(name, include_static) - .map(|prop| prop.into()) - } - - /// Returns the value of the property with the given name all times. - /// If the property is not found, None is returned. - /// If the property is found, the value of the property is returned. - /// - /// Arguments: - /// name (str): The name of the property to retrieve. - /// - /// Returns: - /// The value of the property with the given name. - #[pyo3(signature = (name))] - pub fn property_history(&self, name: String) -> Vec<(i64, Prop)> { - self.edge - .property_history(name) - .into_iter() - .map(|(k, v)| (k, v.into())) - .collect() - } - - /// Returns a list of timestamps of when an edge is added or change to an edge is made. - /// - /// Returns: - /// A list of timestamps. - /// - - pub fn history(&self) -> Vec { - self.edge.history() - } - - /// Returns a dictionary of all properties on the edge. - /// - /// Arguments: - /// include_static (bool): Whether to include static properties in the result. - /// - /// Returns: - /// A dictionary of all properties on the edge. - #[pyo3(signature = (include_static = true))] - pub fn properties(&self, include_static: Option) -> HashMap { - let include_static = include_static.unwrap_or(true); - self.edge - .properties(include_static) - .into_iter() - .map(|(k, v)| (k, v.into())) - .collect() - } - - /// Returns a dictionary of all properties on the edge at all times. - /// - /// Returns: - /// A dictionary of all properties on the edge at all times. 
- pub fn property_histories(&self) -> HashMap> { - self.edge - .property_histories() - .into_iter() - .map(|(k, v)| (k, v.into_iter().map(|(t, p)| (t, p.into())).collect())) - .collect() - } - - /// Returns a list of all property names on the edge. - /// - /// Arguments: - /// include_static (bool): Whether to include static properties in the result. - /// - /// Returns: - /// A list of all property names on the edge. - #[pyo3(signature = (include_static = true))] - pub fn property_names(&self, include_static: Option) -> Vec { - let include_static = include_static.unwrap_or(true); - self.edge.property_names(include_static) - } - - /// Check if a property exists with the given name. - /// - /// Arguments: - /// name (str): The name of the property to check. - /// include_static (bool): Whether to include static properties in the result. - /// - /// Returns: - /// True if a property exists with the given name, False otherwise. - #[pyo3(signature = (name, include_static = true))] - pub fn has_property(&self, name: String, include_static: Option) -> bool { - let include_static = include_static.unwrap_or(true); - self.edge.has_property(name, include_static) - } - - /// Check if a static property exists with the given name. - /// - /// Arguments: - /// name (str): The name of the property to check. - /// - /// Returns: - /// True if a static property exists with the given name, False otherwise. - pub fn has_static_property(&self, name: String) -> bool { - self.edge.has_static_property(name) - } - - pub fn static_property(&self, name: String) -> Option { - self.edge.static_property(name).map(|prop| prop.into()) - } - - /// Get the source vertex of the Edge. - /// - /// Returns: - /// The source vertex of the Edge. - fn src(&self) -> PyVertex { - self.edge.src().into() - } - - /// Get the destination vertex of the Edge. - /// - /// Returns: - /// The destination vertex of the Edge. 
- fn dst(&self) -> PyVertex { - self.edge.dst().into() - } - - //****** Perspective APIS ******// - - /// Get the start time of the Edge. - /// - /// Returns: - /// The start time of the Edge. - pub fn start(&self) -> Option { - self.edge.start() - } - - /// Get the start datetime of the Edge. - /// - /// Returns: - /// the start datetime of the Edge. - pub fn start_date_time(&self) -> Option { - let start_time = self.edge.start()?; - Some(NaiveDateTime::from_timestamp_millis(start_time).unwrap()) - } - - /// Get the end time of the Edge. - /// - /// Returns: - /// The end time of the Edge. - pub fn end(&self) -> Option { - self.edge.end() - } - - /// Get the end datetime of the Edge. - /// - /// Returns: - /// The end datetime of the Edge - pub fn end_date_time(&self) -> Option { - let end_time = self.edge.end()?; - Some(NaiveDateTime::from_timestamp_millis(end_time).unwrap()) - } - - /// Get the duration of the Edge. - /// - /// Arguments: - /// step (int): The step size to use when calculating the duration. - /// - /// Returns: - /// A set of windows containing edges that fall in the time period - #[pyo3(signature = (step))] - fn expanding(&self, step: &PyAny) -> PyResult { - expanding_impl(&self.edge, step) - } - - /// Get a set of Edge windows for a given window size, step, start time - /// and end time using rolling window. - /// A rolling window is a window that moves forward by `step` size at each iteration. - /// - /// Arguments: - /// window (int): The size of the window. - /// step (int): The step size to use when calculating the duration. - /// start (int): The start time to use when calculating the duration. - /// end (int): The end time to use when calculating the duration. 
- /// - /// Returns: - /// A set of windows containing edges that fall in the time period - fn rolling(&self, window: &PyAny, step: Option<&PyAny>) -> PyResult { - rolling_impl(&self.edge, window, step) - } - - /// Get a new Edge with the properties of this Edge within the specified time window. - /// - /// Arguments: - /// t_start (int): The start time of the window. - /// t_end (int): The end time of the window. - /// - /// Returns: - /// A new Edge with the properties of this Edge within the specified time window. - #[pyo3(signature = (t_start = None, t_end = None))] - pub fn window(&self, t_start: Option<&PyAny>, t_end: Option<&PyAny>) -> PyResult { - window_impl(&self.edge, t_start, t_end).map(|e| e.into()) - } - - /// Get a new Edge with the properties of this Edge at a specified time. - /// - /// Arguments: - /// end (int): The time to get the properties at. - /// - /// Returns: - /// A new Edge with the properties of this Edge at a specified time. - #[pyo3(signature = (end))] - pub fn at(&self, end: &PyAny) -> PyResult { - at_impl(&self.edge, end).map(|e| e.into()) - } - - /// Explodes an Edge into a list of PyEdges. This is useful when you want to iterate over - /// the properties of an Edge at every single point in time. This will return a seperate edge - /// each time a property had been changed. - /// - /// Returns: - /// A list of PyEdges - pub fn explode(&self) -> PyEdges { - let edge = self.edge.clone(); - (move || edge.explode()).into() - } - - /// Gets the earliest time of an edge. - /// - /// Returns: - /// (int) The earliest time of an edge - pub fn earliest_time(&self) -> Option { - self.edge.earliest_time() - } - - /// Gets of earliest datetime of an edge. - /// - /// Returns: - /// the earliest datetime of an edge - pub fn earliest_date_time(&self) -> Option { - Some(NaiveDateTime::from_timestamp_millis(self.edge.earliest_time()?).unwrap()) - } - - /// Gets the latest time of an edge. 
- /// - /// Returns: - /// (int) The latest time of an edge - pub fn latest_time(&self) -> Option { - self.edge.latest_time() - } - - /// Gets of latest datetime of an edge. - /// - /// Returns: - /// the latest datetime of an edge - pub fn latest_date_time(&self) -> Option { - let latest_time = self.edge.latest_time()?; - Some(NaiveDateTime::from_timestamp_millis(latest_time).unwrap()) - } - - /// Gets the time of an exploded edge. - /// - /// Returns: - /// (int) The time of an exploded edge - pub fn time(&self) -> Option { - self.edge.time() - } - - /// Gets the name of the layer this edge belongs to - /// - /// Returns: - /// (str) The name of the layer - pub fn layer_name(&self) -> String { - self.edge.layer_name() - } - - /// Gets the datetime of an exploded edge. - /// - /// Returns: - /// (datetime) the datetime of an exploded edge - pub fn date_time(&self) -> Option { - let date_time = self.edge.time()?; - Some(NaiveDateTime::from_timestamp_millis(date_time).unwrap()) - } - - /// Displays the Edge as a string. 
- pub fn __repr__(&self) -> String { - self.repr() - } -} - -impl Repr for PyEdge { - fn repr(&self) -> String { - let properties = &self - .properties(Some(true)) - .iter() - .map(|(k, v)| k.to_string() + " : " + &v.to_string()) - .join(", "); - - let source = self.edge.src().name(); - let target = self.edge.dst().name(); - let earliest_time = self.edge.earliest_time(); - let latest_time = self.edge.latest_time(); - if properties.is_empty() { - format!( - "Edge(source={}, target={}, earliest_time={}, latest_time={})", - source.trim_matches('"'), - target.trim_matches('"'), - earliest_time.unwrap_or(0), - latest_time.unwrap_or(0), - ) - } else { - let property_string: String = "{".to_string() + &properties + "}"; - format!( - "Edge(source={}, target={}, earliest_time={}, latest_time={}, properties={})", - source.trim_matches('"'), - target.trim_matches('"'), - earliest_time.unwrap_or(0), - latest_time.unwrap_or(0), - property_string - ) - } - } -} - -py_iterator!(PyEdgeIter, EdgeView, PyEdge, "EdgeIter"); - -/// A list of edges that can be iterated over. 
-#[pyclass(name = "Edges")] -pub struct PyEdges { - builder: Arc BoxedIter> + Send + Sync + 'static>, -} - -impl PyEdges { - /// an iterable that can be used in rust - fn iter(&self) -> BoxedIter> { - (self.builder)() - } - - /// returns an iterable used in python - fn py_iter(&self) -> BoxedIter { - Box::new(self.iter().map(|e| e.into())) - } -} - -#[pymethods] -impl PyEdges { - fn __iter__(&self) -> PyEdgeIter { - PyEdgeIter { - iter: Box::new(self.py_iter()), - } - } - - fn __len__(&self) -> usize { - self.iter().count() - } - - fn src(&self) -> PyVertexIterable { - let builder = self.builder.clone(); - (move || builder().src()).into() - } - - fn dst(&self) -> PyVertexIterable { - let builder = self.builder.clone(); - (move || builder().dst()).into() - } - - /// Returns all edges as a list - fn collect(&self) -> Vec { - self.py_iter().collect() - } - - /// Returns the first edge - fn first(&self) -> Option { - self.py_iter().next() - } - - /// Returns the number of edges - fn count(&self) -> usize { - self.py_iter().count() - } - - /// Explodes the edges into a list of edges. This is useful when you want to iterate over - /// the properties of an Edge at every single point in time. This will return a seperate edge - /// each time a property had been changed. - fn explode(&self) -> PyEdges { - let builder = self.builder.clone(); - (move || { - let iter: BoxedIter> = - Box::new(builder().flat_map(|e| e.explode())); - iter - }) - .into() - } - - /// Returns the earliest time of the edges. - fn earliest_time(&self) -> OptionI64Iterable { - let edges: Arc< - dyn Fn() -> Box> + Send> + Send + Sync, - > = self.builder.clone(); - (move || edges().earliest_time()).into() - } - - /// Returns the latest time of the edges. 
- fn latest_time(&self) -> OptionI64Iterable { - let edges: Arc< - dyn Fn() -> Box> + Send> + Send + Sync, - > = self.builder.clone(); - (move || edges().latest_time()).into() - } - - fn property(&self, name: String, include_static: Option) -> OptionPropIterable { - let edges: Arc< - dyn Fn() -> Box> + Send> + Send + Sync, - > = self.builder.clone(); - (move || edges().property(name.clone(), include_static.unwrap_or(true))).into() - } - - fn __repr__(&self) -> String { - self.repr() - } -} - -impl Repr for PyEdges { - fn repr(&self) -> String { - format!("Edges({})", iterator_repr(self.__iter__().into_iter())) - } -} - -impl BoxedIter> + Send + Sync + 'static> From for PyEdges { - fn from(value: F) -> Self { - Self { - builder: Arc::new(value), - } - } -} - -py_iterator!( - PyNestedEdgeIter, - BoxedIter>, - PyEdgeIter, - "NestedEdgeIter" -); - -#[pyclass(name = "NestedEdges")] -pub struct PyNestedEdges { - builder: Arc BoxedIter>> + Send + Sync + 'static>, -} - -impl PyNestedEdges { - fn iter(&self) -> BoxedIter>> { - (self.builder)() - } -} - -#[pymethods] -impl PyNestedEdges { - fn __iter__(&self) -> PyNestedEdgeIter { - self.iter().into() - } - - fn collect(&self) -> Vec> { - self.iter() - .map(|e| e.map(|ee| ee.into()).collect()) - .collect() - } - - fn explode(&self) -> PyNestedEdges { - let builder = self.builder.clone(); - (move || { - let iter: BoxedIter>> = Box::new(builder().map(|e| { - let inner_box: BoxedIter> = - Box::new(e.flat_map(|e| e.explode())); - inner_box - })); - iter - }) - .into() - } -} - -impl BoxedIter>> + Send + Sync + 'static> From - for PyNestedEdges -{ - fn from(value: F) -> Self { - Self { - builder: Arc::new(value), - } - } -} diff --git a/py-raphtory/src/graph.rs b/py-raphtory/src/graph.rs deleted file mode 100644 index 765b12dbe6..0000000000 --- a/py-raphtory/src/graph.rs +++ /dev/null @@ -1,225 +0,0 @@ -//! Defines the `Graph` struct, which represents a raphtory graph in memory. -//! -//! 
This is the base class used to create a temporal graph, add vertices and edges, -//! create windows, and query the graph with a variety of algorithms. -//! It is a wrapper around a set of shards, which are the actual graph data structures. -//! In Python, this class wraps around the rust graph. - -use crate::graph_view::PyGraphView; -use crate::utils::{adapt_result, extract_input_vertex, extract_into_time, InputVertexBox}; -use crate::wrappers::prop::Prop; -use itertools::Itertools; -use pyo3::exceptions::PyException; -use pyo3::prelude::*; -use raphtory::core as dbc; -use raphtory::db::graph::Graph; -use std::collections::HashMap; -use std::fmt::{Debug, Formatter}; -use std::path::{Display, Path, PathBuf}; - -/// A temporal graph. -#[derive(Clone)] -#[pyclass(name="Graph", extends=PyGraphView)] -pub struct PyGraph { - pub(crate) graph: Graph, -} - -impl Debug for PyGraph { - fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result { - write!(f, "{}", self.graph) - } -} - -impl From for PyGraph { - fn from(value: Graph) -> Self { - Self { graph: value } - } -} - -impl PyGraph { - pub fn py_from_db_graph(db_graph: Graph) -> PyResult> { - Python::with_gil(|py| { - Py::new( - py, - (PyGraph::from(db_graph.clone()), PyGraphView::from(db_graph)), - ) - }) - } -} - -/// A temporal graph. -#[pymethods] -impl PyGraph { - #[new] - #[pyo3(signature = (nr_shards=1))] - pub fn py_new(nr_shards: usize) -> (Self, PyGraphView) { - let graph = Graph::new(nr_shards); - ( - Self { - graph: graph.clone(), - }, - PyGraphView::from(graph), - ) - } - - /// Adds a new vertex with the given id and properties to the graph. - /// - /// Arguments: - /// timestamp (int, str, or datetime(utc)): The timestamp of the vertex. - /// id (str or int): The id of the vertex. - /// properties (dict): The properties of the vertex. 
- /// - /// Returns: - /// None - #[pyo3(signature = (timestamp, id, properties=None))] - pub fn add_vertex( - &self, - timestamp: &PyAny, - id: &PyAny, - properties: Option>, - ) -> PyResult<()> { - let time = extract_into_time(timestamp)?; - let v = Self::extract_id(id)?; - let result = self - .graph - .add_vertex(time, v, &Self::transform_props(properties)); - adapt_result(result) - } - - /// Adds properties to an existing vertex. - /// - /// Arguments: - /// id (str or int): The id of the vertex. - /// properties (dict): The properties of the vertex. - /// - /// Returns: - /// None - pub fn add_vertex_properties( - &self, - id: &PyAny, - properties: HashMap, - ) -> PyResult<()> { - let v = Self::extract_id(id)?; - let result = self - .graph - .add_vertex_properties(v, &Self::transform_props(Some(properties))); - adapt_result(result) - } - - /// Adds a new edge with the given source and destination vertices and properties to the graph. - /// - /// Arguments: - /// timestamp (int): The timestamp of the edge. - /// src (str or int): The id of the source vertex. - /// dst (str or int): The id of the destination vertex. - /// properties (dict): The properties of the edge, as a dict of string and properties - /// layer (str): The layer of the edge. - /// - /// Returns: - /// None - #[pyo3(signature = (timestamp, src, dst, properties=None, layer=None))] - pub fn add_edge( - &self, - timestamp: &PyAny, - src: &PyAny, - dst: &PyAny, - properties: Option>, - layer: Option<&str>, - ) -> PyResult<()> { - let time = extract_into_time(timestamp)?; - let src = Self::extract_id(src)?; - let dst = Self::extract_id(dst)?; - adapt_result( - self.graph - .add_edge(time, src, dst, &Self::transform_props(properties), layer), - ) - } - - /// Adds properties to an existing edge. - /// - /// Arguments: - /// src (str or int): The id of the source vertex. - /// dst (str or int): The id of the destination vertex. 
- /// properties (dict): The properties of the edge, as a dict of string and properties - /// layer (str): The layer of the edge. - /// - /// Returns: - /// None - #[pyo3(signature = (src, dst, properties, layer=None))] - pub fn add_edge_properties( - &self, - src: &PyAny, - dst: &PyAny, - properties: HashMap, - layer: Option<&str>, - ) -> PyResult<()> { - let src = Self::extract_id(src)?; - let dst = Self::extract_id(dst)?; - let result = self.graph.add_edge_properties( - src, - dst, - &Self::transform_props(Some(properties)), - layer, - ); - adapt_result(result) - } - - //****** Saving And Loading ******// - - // Alternative constructors are tricky, see: https://gist.github.com/redshiftzero/648e4feeff3843ffd9924f13625f839c - - /// Loads a graph from the given path. - /// - /// Arguments: - /// path (str): The path to the graph. - /// - /// Returns: - /// Graph: The loaded graph. - #[staticmethod] - pub fn load_from_file(path: String) -> PyResult> { - let file_path: PathBuf = [env!("CARGO_MANIFEST_DIR"), &path].iter().collect(); - - match Graph::load_from_file(file_path) { - Ok(g) => Self::py_from_db_graph(g), - Err(e) => Err(PyException::new_err(format!( - "Failed to load graph from the files. Reason: {}", - e - ))), - } - } - - /// Saves the graph to the given path. - /// - /// Arguments: - /// path (str): The path to the graph. - /// - /// Returns: - /// None - pub fn save_to_file(&self, path: String) -> PyResult<()> { - match self.graph.save_to_file(Path::new(&path)) { - Ok(()) => Ok(()), - Err(e) => Err(PyException::new_err(format!( - "Failed to save graph to the files. Reason: {}", - e - ))), - } - } -} - -impl PyGraph { - fn transform_props(props: Option>) -> Vec<(String, dbc::Prop)> { - props - .unwrap_or_default() - .into_iter() - .map(|(key, value)| (key, value.into())) - .collect_vec() - } - - /// Extracts the id from the given python vertex - /// - /// Arguments: - /// id (str or int): The id of the vertex. 
- pub(crate) fn extract_id(id: &PyAny) -> PyResult { - extract_input_vertex(id) - } -} diff --git a/py-raphtory/src/graph_view.rs b/py-raphtory/src/graph_view.rs deleted file mode 100644 index f7edf95fab..0000000000 --- a/py-raphtory/src/graph_view.rs +++ /dev/null @@ -1,302 +0,0 @@ -//! The API for querying a view of the graph in a read-only state -use crate::dynamic::{DynamicGraph, IntoDynamic}; -use crate::edge::{PyEdge, PyEdges}; -use crate::types::repr::Repr; -use crate::utils::{ - at_impl, expanding_impl, extract_vertex_ref, rolling_impl, window_impl, IntoPyObject, - PyWindowSet, -}; -use crate::vertex::{PyVertex, PyVertices}; -use chrono::prelude::*; -use pyo3::prelude::*; -use raphtory::db::view_api::layer::LayerOps; -use raphtory::db::view_api::*; -use raphtory::*; - -/// Graph view is a read-only version of a graph at a certain point in time. -#[pyclass(name = "GraphView", frozen, subclass)] -pub struct PyGraphView { - pub graph: DynamicGraph, -} - -/// Graph view is a read-only version of a graph at a certain point in time. 
-impl From for PyGraphView { - fn from(value: G) -> Self { - PyGraphView { - graph: value.into_dynamic(), - } - } -} - -impl IntoPyObject for G { - fn into_py_object(self) -> PyObject { - let py_version: PyGraphView = self.into(); - Python::with_gil(|py| py_version.into_py(py)) - } -} - -/// The API for querying a view of the graph in a read-only state -#[pymethods] -impl PyGraphView { - pub fn get_unique_layers(&self) -> Vec { - self.graph.get_unique_layers() - } - - //****** Metrics APIs ******// - - /// Timestamp of earliest activity in the graph - /// - /// Returns: - /// the timestamp of the earliest activity in the graph - pub fn earliest_time(&self) -> Option { - self.graph.earliest_time() - } - - /// DateTime of earliest activity in the graph - /// - /// Returns: - /// the datetime of the earliest activity in the graph - pub fn earliest_date_time(&self) -> Option { - let earliest_time = self.graph.earliest_time()?; - Some(NaiveDateTime::from_timestamp_millis(earliest_time).unwrap()) - } - - /// Timestamp of latest activity in the graph - /// - /// Returns: - /// the timestamp of the latest activity in the graph - pub fn latest_time(&self) -> Option { - self.graph.latest_time() - } - - /// DateTime of latest activity in the graph - /// - /// Returns: - /// the datetime of the latest activity in the graph - pub fn latest_date_time(&self) -> Option { - let latest_time = self.graph.latest_time()?; - Some(NaiveDateTime::from_timestamp_millis(latest_time).unwrap()) - } - - /// Number of edges in the graph - /// - /// Returns: - /// the number of edges in the graph - pub fn num_edges(&self) -> usize { - self.graph.num_edges() - } - - /// Number of vertices in the graph - /// - /// Returns: - /// the number of vertices in the graph - pub fn num_vertices(&self) -> usize { - self.graph.num_vertices() - } - - /// Returns true if the graph contains the specified vertex - /// - /// Arguments: - /// id (str or int): the vertex id - /// - /// Returns: - /// true if the 
graph contains the specified vertex, false otherwise - pub fn has_vertex(&self, id: &PyAny) -> PyResult { - let v = extract_vertex_ref(id)?; - Ok(self.graph.has_vertex(v)) - } - - /// Returns true if the graph contains the specified edge - /// - /// Arguments: - /// src (str or int): the source vertex id - /// dst (str or int): the destination vertex id - /// layer (str): the edge layer (optional) - /// - /// Returns: - /// true if the graph contains the specified edge, false otherwise - #[pyo3(signature = (src, dst, layer=None))] - pub fn has_edge(&self, src: &PyAny, dst: &PyAny, layer: Option<&str>) -> PyResult { - let src = extract_vertex_ref(src)?; - let dst = extract_vertex_ref(dst)?; - Ok(self.graph.has_edge(src, dst, layer)) - } - - //****** Getter APIs ******// - - /// Gets the vertex with the specified id - /// - /// Arguments: - /// id (str or int): the vertex id - /// - /// Returns: - /// the vertex with the specified id, or None if the vertex does not exist - pub fn vertex(&self, id: &PyAny) -> PyResult> { - let v = extract_vertex_ref(id)?; - Ok(self.graph.vertex(v).map(|v| v.into())) - } - - /// Gets the vertices in the graph - /// - /// Returns: - /// the vertices in the graph - #[getter] - pub fn vertices(&self) -> PyVertices { - self.graph.vertices().into() - } - - /// Gets the edge with the specified source and destination vertices - /// - /// Arguments: - /// src (str or int): the source vertex id - /// dst (str or int): the destination vertex id - /// layer (str): the edge layer (optional) - /// - /// Returns: - /// the edge with the specified source and destination vertices, or None if the edge does not exist - #[pyo3(signature = (src, dst, layer=None))] - pub fn edge(&self, src: &PyAny, dst: &PyAny, layer: Option<&str>) -> PyResult> { - let src = extract_vertex_ref(src)?; - let dst = extract_vertex_ref(dst)?; - Ok(self.graph.edge(src, dst, layer).map(|we| we.into())) - } - - /// Gets all edges in the graph - /// - /// Returns: - /// the edges 
in the graph - pub fn edges(&self) -> PyEdges { - let clone = self.graph.clone(); - (move || clone.edges()).into() - } - - //****** Perspective APIS ******// - - /// Returns the default start time for perspectives over the view - /// - /// Returns: - /// the default start time for perspectives over the view - pub fn start(&self) -> Option { - self.graph.start() - } - - /// Returns the default start datetime for perspectives over the view - /// - /// Returns: - /// the default start datetime for perspectives over the view - pub fn start_date_time(&self) -> Option { - let start_time = self.graph.start()?; - Some(NaiveDateTime::from_timestamp_millis(start_time).unwrap()) - } - - /// Returns the default end time for perspectives over the view - /// - /// Returns: - /// the default end time for perspectives over the view - pub fn end(&self) -> Option { - self.graph.end() - } - - #[doc = window_size_doc_string!()] - pub fn window_size(&self) -> Option { - self.graph.window_size() - } - - /// Returns the default end datetime for perspectives over the view - /// - /// Returns: - /// the default end datetime for perspectives over the view - pub fn end_date_time(&self) -> Option { - let end_time = self.graph.end()?; - Some(NaiveDateTime::from_timestamp_millis(end_time).unwrap()) - } - - /// Creates a `WindowSet` with the given `step` size and optional `start` and `end` times, - /// using an expanding window. - /// - /// An expanding window is a window that grows by `step` size at each iteration. 
- /// - /// Arguments: - /// step (int) : the size of the window - /// start (int): the start time of the window (optional) - /// end (int): the end time of the window (optional) - /// - /// Returns: - /// A `WindowSet` with the given `step` size and optional `start` and `end` times, - #[pyo3(signature = (step))] - fn expanding(&self, step: &PyAny) -> PyResult { - expanding_impl(&self.graph, step) - } - - /// Creates a `WindowSet` with the given `window` size and optional `step`, `start` and `end` times, - /// using a rolling window. - /// - /// A rolling window is a window that moves forward by `step` size at each iteration. - /// - /// Arguments: - /// window (int): the size of the window - /// step (int): the size of the step (optional) - /// start (int): the start time of the window (optional) - /// end: the end time of the window (optional) - /// - /// Returns: - /// a `WindowSet` with the given `window` size and optional `step`, `start` and `end` times, - fn rolling(&self, window: &PyAny, step: Option<&PyAny>) -> PyResult { - rolling_impl(&self.graph, window, step) - } - - /// Create a view including all events between `t_start` (inclusive) and `t_end` (exclusive) - /// - /// Arguments: - /// start (int): the start time of the window (optional) - /// end (int): the end time of the window (optional) - /// - /// Returns: - /// a view including all events between `t_start` (inclusive) and `t_end` (exclusive) - #[pyo3(signature = (start=None, end=None))] - pub fn window(&self, start: Option<&PyAny>, end: Option<&PyAny>) -> PyResult { - window_impl(&self.graph, start, end).map(|g| g.into()) - } - - /// Create a view including all events until `end` (inclusive) - /// - /// Arguments: - /// end (int) : the end time of the window - /// - /// Returns: - /// a view including all events until `end` (inclusive) - #[pyo3(signature = (end))] - pub fn at(&self, end: &PyAny) -> PyResult { - at_impl(&self.graph, end).map(|g| g.into()) - } - - #[doc = 
default_layer_doc_string!()] - pub fn default_layer(&self) -> PyGraphView { - self.graph.default_layer().into() - } - - #[doc = layer_doc_string!()] - #[pyo3(signature = (name))] - pub fn layer(&self, name: &str) -> Option { - self.graph.layer(name).map(|layer| layer.into()) - } - - /// Displays the graph - pub fn __repr__(&self) -> String { - self.repr() - } -} - -impl Repr for PyGraphView { - fn repr(&self) -> String { - let num_edges = self.graph.num_edges(); - let num_vertices = self.graph.num_vertices(); - let earliest_time = self.graph.earliest_time().unwrap_or_default(); - let latest_time = self.graph.latest_time().unwrap_or_default(); - - format!( - "Graph(number_of_edges={:?}, number_of_vertices={:?}, earliest_time={:?}, latest_time={:?})", - num_edges, num_vertices, earliest_time, latest_time - ) - } -} diff --git a/py-raphtory/src/lib.rs b/py-raphtory/src/lib.rs deleted file mode 100644 index b99c9e6218..0000000000 --- a/py-raphtory/src/lib.rs +++ /dev/null @@ -1,16 +0,0 @@ -extern crate core; - -#[macro_use] -mod macros; - -pub mod algorithms; -pub mod dynamic; -pub mod edge; -pub mod graph; -pub mod graph_gen; -pub mod graph_loader; -pub mod graph_view; -pub mod types; -pub mod utils; -pub mod vertex; -pub mod wrappers; diff --git a/py-raphtory/src/macros/iter.rs b/py-raphtory/src/macros/iter.rs deleted file mode 100644 index d1fe39a32a..0000000000 --- a/py-raphtory/src/macros/iter.rs +++ /dev/null @@ -1,69 +0,0 @@ -// Internal macro for generating the iterator struct (with or without name) -macro_rules! _py_iterator_struct { - ($name:ident, $pyitem:ty) => { - #[pyclass] - pub struct $name { - iter: Box + Send>, - } - }; - ($name:ident, $pyname:literal, $pyitem:ty) => { - #[pyclass(name=$pyname)] - pub struct $name { - iter: Box + Send>, - } - }; -} - -// internal macro for adding methods to iterators -macro_rules! 
_py_iterator_methods { - ($name:ident, $item:ty, $pyitem:ty) => { - #[pymethods] - impl $name { - fn __iter__(slf: PyRef<'_, Self>) -> PyRef<'_, Self> { - slf - } - fn __next__(mut slf: PyRefMut<'_, Self>) -> Option<$pyitem> { - slf.iter.next() - } - } - - impl From + Send>> for $name { - fn from(value: Box + Send>) -> Self { - let iter = Box::new(value.map(|v| v.into())); - Self { iter } - } - } - - impl IntoIterator for $name { - type Item = $pyitem; - type IntoIter = Box + Send>; - - fn into_iter(self) -> Self::IntoIter { - self.iter - } - } - }; -} - -/// Construct a python Iterator struct -/// -/// # Arguments -/// -/// * `name` - The identifier for the new struct -/// * `item` - The type of `Item` for the wrapped iterator -/// * `pyitem` - The type of the python wrapper for `Item` (optional if `item` implements `IntoPy`) -/// * `pyname` - The python-side name for the iterator (optional, defaults to `name`) -macro_rules! py_iterator { - ($name:ident, $item:ty) => { - _py_iterator_struct!($name, $item); - _py_iterator_methods!($name, $item, $item); - }; - ($name:ident, $item:ty, $pyitem:ty) => { - _py_iterator_struct!($name, $pyitem); - _py_iterator_methods!($name, $item, $pyitem); - }; - ($name:ident, $item:ty, $pyitem:ty, $pyname:literal) => { - _py_iterator_struct!($name, $pyname, $pyitem); - _py_iterator_methods!($name, $item, $pyitem); - }; -} diff --git a/py-raphtory/src/macros/iterable.rs b/py-raphtory/src/macros/iterable.rs deleted file mode 100644 index f99e61acaa..0000000000 --- a/py-raphtory/src/macros/iterable.rs +++ /dev/null @@ -1,178 +0,0 @@ -// internal macro for sum and mean methods -macro_rules! 
_py_numeric_methods { - ($name:ident, $item:ty, $pyitem:ty) => { - #[pymethods] - impl $name { - pub fn sum(&self) -> $pyitem { - let v: $item = self.iter().sum(); - v.into() - } - - pub fn mean(&self) -> f64 { - use $crate::wrappers::iterators::MeanExt; - self.iter().mean() - } - } - }; -} - -// Internal macro defining max and min on ordered iterables -macro_rules! _py_ord_max_min_methods { - ($name:ident, $pyitem:ty) => { - #[pymethods] - impl $name { - pub fn max(&self) -> Option<$pyitem> { - self.iter().max().map(|v| v.into()) - } - - pub fn min(&self) -> Option<$pyitem> { - self.iter().min().map(|v| v.into()) - } - } - }; -} - -// Internal macro defining max and min on float iterables -macro_rules! _py_float_max_min_methods { - ($name:ident, $pyitem:ty) => { - #[pymethods] - impl $name { - pub fn max(&self) -> Option<$pyitem> { - self.iter().max_by(|a, b| a.total_cmp(b)).map(|v| v.into()) - } - pub fn min(&self) -> Option<$pyitem> { - self.iter().min_by(|a, b| a.total_cmp(b)).map(|v| v.into()) - } - } - }; -} - -// Internal macro for methods supported by all iterables (also used by nested iterables) -macro_rules! _py_iterable_base_methods { - ($name:ident, $iter:ty) => { - #[pymethods] - impl $name { - pub fn __iter__(&self) -> $iter { - self.iter().into() - } - - pub fn __len__(&self) -> usize { - self.iter().count() - } - - pub fn __repr__(&self) -> String { - self.repr() - } - } - }; -} - -// internal macro for the collect method (as it is different for nested iterables) -macro_rules! 
_py_iterable_collect_method { - ($name:ident, $pyitem:ty) => { - #[pymethods] - impl $name { - pub fn collect(&self) -> Vec<$pyitem> { - self.iter().map(|v| v.into()).collect() - } - } - }; -} - -/// Construct a python Iterable struct which wraps a closure that returns an iterator -/// -/// Has methods `__iter__`, `__len__`, `__repr__`, `collect` -/// -/// # Arguments -/// -/// * `name` - The identifier for the new struct -/// * `item` - The type of `Item` for the wrapped iterator builder -/// * `pyitem` - The type of the python wrapper for `Item` (optional if `item` implements `IntoPy`, need Into<`pyitem`> to be implemented for `item`) -/// * `pyiter` - The python iterator wrapper that should be returned when calling `__iter__` (needs to have the same `item` and `pyitem`) -macro_rules! py_iterable { - ($name:ident, $item:ty, $pyiter:ty) => { - py_iterable!($name, $item, $item, $pyiter); - }; - ($name:ident, $item:ty, $pyitem:ty, $pyiter:ty) => { - #[pyclass] - pub struct $name($crate::types::iterable::Iterable<$item, $pyitem>); - - impl std::ops::Deref for $name { - type Target = $crate::types::iterable::Iterable<$item, $pyitem>; - - fn deref(&self) -> &Self::Target { - &self.0 - } - } - - impl BoxedIter<$item> + Send + Sync + 'static> From for $name { - fn from(value: F) -> Self { - Self($crate::types::iterable::Iterable::new( - stringify!($name).to_string(), - value, - )) - } - } - _py_iterable_base_methods!($name, $pyiter); - _py_iterable_collect_method!($name, $pyitem); - }; -} - -/// Construct a python Iterable struct which wraps a closure that returns an iterator of ordered values -/// -/// additionally adds the `min` and `max` methods to those created by `py_iterable` -/// # Arguments -/// -/// * `name` - The identifier for the new struct -/// * `item` - The type of `Item` for the wrapped iterator builder -/// * `pyitem` - The type of the python wrapper for `Item` (optional if `item` implements `IntoPy`, need Into<`pyitem`> to be implemented for `item`) 
-/// * `pyiter` - The python iterator wrapper that should be returned when calling `__iter__` (needs to have the same `item` and `pyitem`) -macro_rules! py_ordered_iterable { - ($name:ident, $item:ty, $iter:ty) => { - py_ordered_iterable!($name, $item, $item, $iter); - }; - ($name:ident, $item:ty, $pyitem:ty, $iter:ty) => { - py_iterable!($name, $item, $pyitem, $iter); - _py_ord_max_min_methods!($name, $pyitem); - }; -} - -/// Construct a python Iterable struct which wraps a closure that returns an iterator of ordered and summable values -/// -/// additionally adds the `mean` and `sum` methods to those created by `py_ordered_iterable` -/// # Arguments -/// -/// * `name` - The identifier for the new struct -/// * `item` - The type of `Item` for the wrapped iterator builder -/// * `pyitem` - The type of the python wrapper for `Item` (optional if `item` implements `IntoPy`, need Into<`pyitem`> to be implemented for `item`) -/// * `pyiter` - The python iterator wrapper that should be returned when calling `__iter__` (needs to have the same `item` and `pyitem`) -macro_rules! py_numeric_iterable { - ($name:ident, $item:ty, $iter:ty) => { - py_numeric_iterable!($name, $item, $item, $iter); - }; - ($name:ident, $item:ty, $pyitem:ty, $iter:ty) => { - py_ordered_iterable!($name, $item, $pyitem, $iter); - _py_numeric_methods!($name, $item, $pyitem); - }; -} - -/// Construct a python Iterable struct which wraps a closure that returns an iterator of float values -/// -/// This acts the same as `py_numeric_iterable` but with special implementations of `max` and `min` for floats. 
-/// -/// # Arguments -/// -/// * `name` - The identifier for the new struct -/// * `item` - The type of `Item` for the wrapped iterator builder -/// * `pyitem` - The type of the python wrapper for `Item` (optional if `item` implements `IntoPy`, need Into<`pyitem`> to be implemented for `item`) -/// * `pyiter` - The python iterator wrapper that should be returned when calling `__iter__` (needs to have the same `item` and `pyitem`) -macro_rules! py_float_iterable { - ($name:ident, $item:ty, $iter:ty) => { - py_float_iterable!($name, $item, $item, $iter); - }; - ($name:ident, $item:ty, $pyitem:ty, $iter:ty) => { - py_iterable!($name, $item, $pyitem, $iter); - _py_numeric_methods!($name, $item, $pyitem); - _py_float_max_min_methods!($name, $pyitem); - }; -} diff --git a/py-raphtory/src/macros/mod.rs b/py-raphtory/src/macros/mod.rs deleted file mode 100644 index 7b041b8b41..0000000000 --- a/py-raphtory/src/macros/mod.rs +++ /dev/null @@ -1,6 +0,0 @@ -#[macro_use] -mod iter; -#[macro_use] -mod iterable; -#[macro_use] -mod nested_iterable; diff --git a/py-raphtory/src/perspective.rs b/py-raphtory/src/perspective.rs deleted file mode 100644 index 89da73496c..0000000000 --- a/py-raphtory/src/perspective.rs +++ /dev/null @@ -1,113 +0,0 @@ -//! This module defines the `PyPerspective` struct and the `PyPerspectiveSet` iterator. -//! -//! `PyPerspective` is a simple struct representing a time range from `start` to `end`. -//! The start time is inclusive and the end time is exclusive. -//! -//! `PyPerspectiveSet` is an iterator over a range of time periods (`Perspective`s). -//! It can be used to generate rolling or expanding perspectives based on a `step` size and an optional `window` size. -//! -//! These perpectives are used when querying the graph to determine the time bounds. -use pyo3::{pyclass, pymethods}; -use raphtory::db::perspective; -use raphtory::db::perspective::PerspectiveSet; -use std::i64; - -/// A struct representing a time range from `start` to `end`. 
-/// -/// The start time is inclusive and the end time is exclusive. -#[derive(Clone)] -#[pyclass(name = "Perspective")] -pub struct PyPerspective { - pub start: Option, - pub end: Option, -} - -/// Representing a time range from `start` to `end` for a graph -#[pymethods] -impl PyPerspective { - /// Creates a new `Perspective` with the given `start` and `end` times. - /// Arguments: - /// start (int): The start time of the perspective. If None, the perspective will start at the beginning of the graph. - /// end (int): The end time of the perspective. If None, the perspective will end at the end of the graph. - /// - /// Returns: - /// Perspective: A new perspective with the given start and end times. - #[new] - #[pyo3(signature = (start=None, end=None))] - fn new(start: Option, end: Option) -> Self { - PyPerspective { start, end } - } - - /// Creates an `PyPerspectiveSet` with the given `step` size and optional `start` and `end` times, - /// using an expanding window. - /// - /// An expanding window is a window that grows by `step` size at each iteration. - /// - /// Arguments: - /// step (int): The size of the step to take at each iteration. - /// start (int): The start time of the perspective. If None, the perspective will start at the beginning of the graph. (optional) - /// end (int): The end time of the perspective. If None, the perspective will end at the end of the graph. (optional) - /// - /// Returns: - /// PyPerspectiveSet: An iterator over a range of time periods (`Perspective`s). - #[staticmethod] - #[pyo3(signature = (step, start=None, end=None))] - fn expanding(step: u64, start: Option, end: Option) -> PyPerspectiveSet { - PyPerspectiveSet { - ps: perspective::Perspective::expanding(step, start, end), - } - } - - /// Creates an `PerspectiveSet` with the given `window` size and optional `step`, `start` and `end` times, - /// using a rolling window. - /// - /// A rolling window is a window that moves forward by `step` size at each iteration. 
- /// If `step` is not provided, it defaults to the `window` size. - /// - /// Arguments: - /// window (int): The size of the window to use at each iteration. - /// step (int): The size of the step to take at each iteration. (optional) - /// start (int): The start time of the perspective. If None, the perspective will start at the beginning of the graph. (optional) - /// end (int): The end time of the perspective. If None, the perspective will end at the end of the graph. (optional) - /// - /// Returns: - /// PyPerspectiveSet: An iterator over a range of time periods (`Perspective`s). - #[staticmethod] - #[pyo3(signature = (window, step=None, start=None, end=None))] - fn rolling( - window: u64, - step: Option, - start: Option, - end: Option, - ) -> PyPerspectiveSet { - PyPerspectiveSet { - ps: perspective::Perspective::rolling(window, step, start, end), - } - } -} - -impl From for PyPerspective { - fn from(value: perspective::Perspective) -> Self { - PyPerspective { - start: value.start, - end: value.end, - } - } -} - -impl From for perspective::Perspective { - fn from(value: PyPerspective) -> Self { - perspective::Perspective { - start: value.start, - end: value.end, - } - } -} - -/// A PerspectiveSet represents a set of windows on a timeline, -/// defined by a start, end, step, and window size. 
-#[pyclass(name = "PerspectiveSet")] -#[derive(Clone)] -pub struct PyPerspectiveSet { - pub(crate) ps: PerspectiveSet, -} diff --git a/py-raphtory/src/types/iterable.rs b/py-raphtory/src/types/iterable.rs deleted file mode 100644 index 3cb803b3b2..0000000000 --- a/py-raphtory/src/types/iterable.rs +++ /dev/null @@ -1,68 +0,0 @@ -use crate::types::repr::{iterator_repr, Repr}; -use pyo3::{IntoPy, PyObject}; -use raphtory::db::view_api::BoxedIter; -use std::marker::PhantomData; -use std::sync::Arc; - -pub struct Iterable + From + Repr> { - pub name: String, - pub builder: Arc BoxedIter + Send + Sync + 'static>, - pytype: PhantomData, -} - -impl + From + Repr> Iterable { - pub fn iter(&self) -> BoxedIter { - (self.builder)() - } - pub fn py_iter(&self) -> BoxedIter { - Box::new(self.iter().map(|i| i.into())) - } - pub fn new BoxedIter + Send + Sync + 'static>(name: String, builder: F) -> Self { - Self { - name, - builder: Arc::new(builder), - pytype: Default::default(), - } - } -} - -impl + From + Repr> Repr for Iterable { - fn repr(&self) -> String { - format!("{}([{}])", self.name, iterator_repr(self.py_iter())) - } -} - -pub struct NestedIterable + From + Repr> { - pub name: String, - pub builder: Arc BoxedIter> + Send + Sync + 'static>, - pytype: PhantomData, -} - -impl + From + Repr> NestedIterable { - pub fn iter(&self) -> BoxedIter> { - (self.builder)() - } - pub fn new BoxedIter> + Send + Sync + 'static>( - name: String, - builder: F, - ) -> Self { - Self { - name, - builder: Arc::new(builder), - pytype: Default::default(), - } - } -} - -impl + From + Repr> Repr for NestedIterable { - fn repr(&self) -> String { - format!( - "{}([{}])", - self.name, - iterator_repr( - self.iter() - .map(|it| format!("[{}]", iterator_repr(it.map(|i| PyI::from(i))))) - ) - ) - } -} diff --git a/py-raphtory/src/types/mod.rs b/py-raphtory/src/types/mod.rs deleted file mode 100644 index 21288e8fdc..0000000000 --- a/py-raphtory/src/types/mod.rs +++ /dev/null @@ -1,2 +0,0 @@ -pub mod 
iterable; -pub mod repr; diff --git a/py-raphtory/src/wrappers/iterators.rs b/py-raphtory/src/wrappers/iterators.rs deleted file mode 100644 index 4364ddf8cb..0000000000 --- a/py-raphtory/src/wrappers/iterators.rs +++ /dev/null @@ -1,163 +0,0 @@ -use crate::types::repr::Repr; -use crate::wrappers::prop::{PropHistories, PropHistory, PropValue, Props}; -use num::cast::AsPrimitive; -use pyo3::prelude::*; -use raphtory::core as db_c; -use raphtory::db::view_api::BoxedIter; -use std::collections::HashMap; -use std::i64; -use std::iter::Sum; -use std::ops::Deref; - -pub(crate) trait MeanExt: Iterator -where - V: AsPrimitive + Sum, -{ - fn mean(self) -> f64 - where - Self: Sized, - { - let mut count: usize = 0; - let sum: V = self.inspect(|_| count += 1).sum(); - - if count > 0 { - sum.as_() / (count as f64) - } else { - 0.0 - } - } -} - -impl, V: AsPrimitive + Sum> MeanExt for I {} - -py_iterator!(Float64Iter, f64); -py_float_iterable!(Float64Iterable, f64, Float64Iter); - -py_iterator!(U64Iter, u64); -py_numeric_iterable!(U64Iterable, u64, U64Iter); -py_iterator!(NestedU64Iter, BoxedIter, U64Iter); -py_nested_numeric_iterable!( - NestedU64Iterable, - u64, - NestedU64Iter, - U64Iterable, - OptionU64Iterable -); - -py_iterator!(OptionU64Iter, Option); -py_iterable!(OptionU64Iterable, Option, Option, OptionU64Iter); -_py_ord_max_min_methods!(OptionU64Iterable, Option); - -py_iterator!(I64Iter, i64); -py_numeric_iterable!(I64Iterable, i64, I64Iter); -py_iterator!(NestedI64Iter, BoxedIter, I64Iter); -py_nested_numeric_iterable!( - NestedI64Iterable, - i64, - NestedI64Iter, - I64Iterable, - OptionI64Iterable -); - -py_iterator!(OptionI64Iter, Option); -py_iterable!(OptionI64Iterable, Option, OptionI64Iter); -_py_ord_max_min_methods!(OptionI64Iterable, Option); -py_iterator!(OptionOptionI64Iter, Option>); -py_iterable!( - OptionOptionI64Iterable, - Option>, - OptionOptionI64Iter -); -_py_ord_max_min_methods!(OptionOptionI64Iterable, Option>); - 
-py_iterator!(NestedOptionI64Iter, BoxedIter>, OptionI64Iter); -py_nested_ordered_iterable!( - NestedOptionI64Iterable, - Option, - NestedOptionI64Iter, - OptionOptionI64Iterable -); - -py_iterator!(UsizeIter, usize); -py_numeric_iterable!(UsizeIterable, usize, UsizeIter); -py_iterator!(OptionUsizeIter, Option); -py_ordered_iterable!(OptionUsizeIterable, Option, OptionUsizeIter); -py_iterator!(NestedUsizeIter, BoxedIter, UsizeIter); -py_nested_numeric_iterable!( - NestedUsizeIterable, - usize, - NestedUsizeIter, - UsizeIterable, - OptionUsizeIterable -); - -py_iterator!(BoolIter, bool); -py_iterable!(BoolIterable, bool, BoolIter); -py_iterator!(NestedBoolIter, BoxedIter, BoolIter); -py_nested_iterable!(NestedBoolIterable, bool, NestedBoolIter); - -py_iterator!(StringIter, String); -py_iterable!(StringIterable, String, StringIter); -py_iterator!(NestedStringIter, BoxedIter, StringIter); -py_nested_iterable!(NestedStringIterable, String, NestedStringIter); - -py_iterator!(StringVecIter, Vec); -py_iterable!(StringVecIterable, Vec, StringVecIter); -py_iterator!(NestedStringVecIter, BoxedIter>, StringVecIter); -py_nested_iterable!(NestedStringVecIterable, Vec, NestedStringVecIter); - -py_iterator!(OptionPropIter, Option, PropValue); -py_iterable!( - OptionPropIterable, - Option, - PropValue, - OptionPropIter -); -py_iterator!( - NestedOptionPropIter, - BoxedIter>, - OptionPropIter -); -py_nested_iterable!( - NestedOptionPropIterable, - Option, - PropValue, - NestedOptionPropIter -); - -py_iterator!(PropHistoryIter, Vec<(i64, db_c::Prop)>, PropHistory); -py_iterable!( - PropHistoryIterable, - Vec<(i64, db_c::Prop)>, - PropHistory, - PropHistoryIter -); -py_iterator!( - NestedPropHistoryIter, - BoxedIter>, - PropHistoryIter -); -py_nested_iterable!( - NestedPropHistoryIterable, - Vec<(i64, db_c::Prop)>, - PropHistory, - NestedPropHistoryIter -); - -py_iterator!(PropsIter, HashMap, Props); -py_iterable!(PropsIterable, HashMap, Props, PropsIter); -py_iterator!( - 
NestedPropsIter, - BoxedIter>, - PropsIter -); -py_nested_iterable!(NestedPropsIterable, HashMap, Props, NestedPropsIter); - -py_iterator!(PropHistoriesIter, HashMap>, PropHistories); -py_iterable!(PropHistoriesIterable, HashMap>, PropHistories, PropHistoriesIter); -py_iterator!( - NestedPropHistoriesIter, - BoxedIter>>, - PropHistoriesIter -); -py_nested_iterable!(NestedPropHistoriesIterable, HashMap>, PropHistories, NestedPropHistoriesIter); diff --git a/py-raphtory/src/wrappers/prop.rs b/py-raphtory/src/wrappers/prop.rs deleted file mode 100644 index c3307db1d9..0000000000 --- a/py-raphtory/src/wrappers/prop.rs +++ /dev/null @@ -1,190 +0,0 @@ -use crate::graph::PyGraph; -use crate::graph_view::PyGraphView; -use crate::types::repr::Repr; -use chrono::NaiveDateTime; -use pyo3::{FromPyObject, IntoPy, PyAny, PyObject, PyResult, Python}; -use raphtory::core as db_c; -use raphtory::db; -use std::collections::HashMap; -use std::{fmt, i64}; - -#[repr(transparent)] -#[derive(Debug, Clone)] -pub struct PGraph(db::graph::Graph); - -impl IntoPy for PGraph { - fn into_py(self, py: Python<'_>) -> PyObject { - PyGraph::py_from_db_graph(self.0).unwrap().into_py(py) - } -} - -impl<'source> FromPyObject<'source> for PGraph { - fn extract(ob: &'source PyAny) -> PyResult { - let res: PyGraph = ob.extract()?; - Ok(PGraph(res.graph)) - } -} - -#[derive(FromPyObject, Debug, Clone)] -pub enum Prop { - Str(String), - Bool(bool), - I64(i64), - U64(u64), - F64(f64), - DTime(NaiveDateTime), - Graph(PGraph), -} - -impl fmt::Display for Prop { - fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result { - match self { - Prop::Str(value) => write!(f, "{}", value), - Prop::Bool(value) => write!(f, "{}", value), - Prop::I64(value) => write!(f, "{}", value), - Prop::U64(value) => write!(f, "{}", value), - Prop::F64(value) => write!(f, "{}", value), - Prop::DTime(value) => write!(f, "{}", value), - Prop::Graph(value) => write!(f, "{}", value.0), - } - } -} - -impl IntoPy for Prop { - fn into_py(self, 
py: Python<'_>) -> PyObject { - match self { - Prop::Str(s) => s.into_py(py), - Prop::Bool(bool) => bool.into_py(py), - Prop::I64(i64) => i64.into_py(py), - Prop::U64(u64) => u64.into_py(py), - Prop::F64(f64) => f64.into_py(py), - Prop::DTime(dtime) => dtime.into_py(py), - Prop::Graph(g) => g.into_py(py), // Need to find a better way - } - } -} - -impl From for db_c::Prop { - fn from(prop: Prop) -> db_c::Prop { - match prop { - Prop::Str(string) => db_c::Prop::Str(string), - Prop::Bool(bool) => db_c::Prop::Bool(bool), - Prop::I64(i64) => db_c::Prop::I64(i64), - Prop::U64(u64) => db_c::Prop::U64(u64), - Prop::F64(f64) => db_c::Prop::F64(f64), - Prop::DTime(dtime) => db_c::Prop::DTime(dtime), - Prop::Graph(g) => db_c::Prop::Graph(g.0), - } - } -} - -impl From for Prop { - fn from(prop: db_c::Prop) -> Prop { - match prop { - db_c::Prop::Str(string) => Prop::Str(string), - db_c::Prop::Bool(bool) => Prop::Bool(bool), - db_c::Prop::I32(i32) => Prop::I64(i32 as i64), - db_c::Prop::I64(i64) => Prop::I64(i64), - db_c::Prop::U32(u32) => Prop::U64(u32 as u64), - db_c::Prop::U64(u64) => Prop::U64(u64), - db_c::Prop::F64(f64) => Prop::F64(f64), - db_c::Prop::F32(f32) => Prop::F64(f32 as f64), - db_c::Prop::DTime(dtime) => Prop::DTime(dtime), - db_c::Prop::Graph(g) => Prop::Graph(PGraph(g)), - } - } -} - -impl Repr for Prop { - fn repr(&self) -> String { - match &self { - Prop::Str(v) => v.repr(), - Prop::Bool(v) => v.repr(), - Prop::I64(v) => v.repr(), - Prop::U64(v) => v.repr(), - Prop::F64(v) => v.repr(), - Prop::DTime(v) => v.repr(), - Prop::Graph(g) => g.0.to_string(), - } - } -} - -pub struct PropValue(Option); - -impl From> for PropValue { - fn from(value: Option) -> Self { - Self(value.map(|v| v.into())) - } -} - -impl IntoPy for PropValue { - fn into_py(self, py: Python<'_>) -> PyObject { - self.0.into_py(py) - } -} - -impl Repr for PropValue { - fn repr(&self) -> String { - self.0.repr() - } -} - -pub struct Props(HashMap); - -impl Repr for Props { - fn repr(&self) -> 
String { - self.0.repr() - } -} - -impl From> for Props { - fn from(value: HashMap) -> Self { - Self(value.into_iter().map(|(k, v)| (k, v.into())).collect()) - } -} - -impl IntoPy for Props { - fn into_py(self, py: Python<'_>) -> PyObject { - self.0.into_py(py) - } -} - -pub struct PropHistory(Vec<(i64, Prop)>); - -impl Repr for PropHistory { - fn repr(&self) -> String { - self.0.repr() - } -} - -impl From> for PropHistory { - fn from(value: Vec<(i64, db_c::Prop)>) -> Self { - Self(value.into_iter().map(|(t, v)| (t, v.into())).collect()) - } -} - -impl IntoPy for PropHistory { - fn into_py(self, py: Python<'_>) -> PyObject { - self.0.into_py(py) - } -} - -pub struct PropHistories(HashMap); - -impl Repr for PropHistories { - fn repr(&self) -> String { - self.0.repr() - } -} - -impl From>> for PropHistories { - fn from(value: HashMap>) -> Self { - Self(value.into_iter().map(|(k, h)| (k, h.into())).collect()) - } -} - -impl IntoPy for PropHistories { - fn into_py(self, py: Python<'_>) -> PyObject { - self.0.into_py(py) - } -} diff --git a/python/Cargo.toml b/python/Cargo.toml index adbe1cbbcb..afd2fb1612 100644 --- a/python/Cargo.toml +++ b/python/Cargo.toml @@ -18,13 +18,16 @@ name = "raphtory" crate-type = ["cdylib"] [dependencies] -pyo3 = {version="0.18.1", features=["multiple-pymethods", "chrono"]} -py-raphtory = {path = "../py-raphtory", version = "0.4.0" } +pyo3 = {version= "0.19.2", features=["multiple-pymethods", "chrono"]} +pyo3-asyncio = { version = "0.19.0", features = ["tokio-runtime"] } +raphtory_core = {path = "../raphtory", version = "0.5.7", features=["python"], package="raphtory" } +raphtory-graphql = {path = "../raphtory-graphql", version = "0.5.7" } openssl = { version = "0.10", features = ["vendored"] } # DO NOT REMOVE IT BREAKS PYTHON RELEASE + [features] extension-module = ["pyo3/extension-module"] default = ["extension-module"] [build-dependencies] -pyo3-build-config = "0.18.1" +pyo3-build-config = "0.19.2" diff --git a/python/pyproject.toml 
b/python/pyproject.toml index 2d09eba682..d336f4dc1a 100644 --- a/python/pyproject.toml +++ b/python/pyproject.toml @@ -4,16 +4,19 @@ build-backend = "maturin" [project] name = "raphtory" -requires-python = ">=3.7" +requires-python = ">=3.8" classifiers = [ "Programming Language :: Rust", "Programming Language :: Python :: Implementation :: CPython", "Programming Language :: Python :: Implementation :: PyPy", ] dependencies = [ - "pandas >= 1.3.3", "pyvis >= 0.3.2", "networkx >= 2.6.3", + "pandas >= 2.0.3", + "pyarrow >= 12.0.1", + "requests >= 2.31.0", + "gql[all] == 3.4.1" ] @@ -26,7 +29,7 @@ slack = "https://join.slack.com/t/raphtory/shared_invite/zt-xbebws9j-VgPIFRleJFJ youtube = "https://www.youtube.com/@pometry8546/videos" [project.optional-dependencies] -vis = ["pyvis >= 0.3.2", "networkx >= 2.6.3", "matplotlib >= 3.4.3", "seaborn >= 0.11.2"] +export = ["pyvis >= 0.3.2", "networkx >= 2.6.3", "matplotlib >= 3.4.3", "seaborn >= 0.11.2"] [tool.maturin] features = ["pyo3/extension-module"] diff --git a/python/python/raphtory/__init__.py b/python/python/raphtory/__init__.py index cd5307a257..a55a080cac 100644 --- a/python/python/raphtory/__init__.py +++ b/python/python/raphtory/__init__.py @@ -1,9 +1,11 @@ import sys from .raphtory import * + sys.modules["raphtory.algorithms"] = algorithms sys.modules["raphtory.graph_gen"] = graph_gen sys.modules["raphtory.graph_loader"] = graph_loader - +# sys.modules["raphtory.vectors"] = vectors # TODO: re-enable +# sys.modules["raphtory.graphql"] = graphql from .nullmodels import * @@ -13,4 +15,4 @@ algorithms.__doc__ = "Algorithmic functions that can be run on Raphtory graphs" graph_gen.__doc__ = "Generate Raphtory graphs from attachment models" -graph_loader.__doc__ = "Load and save Raphtory graphs from/to file(s)" \ No newline at end of file +graph_loader.__doc__ = "Load and save Raphtory graphs from/to file(s)" diff --git a/python/python/raphtory/export.py b/python/python/raphtory/export.py new file mode 100644 index 
0000000000..c643d65fd5 --- /dev/null +++ b/python/python/raphtory/export.py @@ -0,0 +1,271 @@ +""" +Generate a visualisation using matplotlib or pyvis from Raphtory graphs. +""" +from pyvis.network import Network +import networkx as nx +import pandas as pd + + +def to_pyvis( + graph, + explode_edges=False, + edge_color="#000000", + shape=None, + node_image=None, + edge_weight=None, + edge_label=None, + colour_nodes_by_type=False, + type_property="type", + notebook=True, + **kwargs, +): + r"""Draw a graph with Pyvis. + + .. note:: + + Pyvis is a required dependency. + If you intend to use this function make sure that + you install Pyvis with ``pip install pyvis`` + + :param graph: A Raphtory graph. + :param explode_edges: A boolean that is set to True if you want to explode the edges in the graph. By default this is set to False. + :param str edge_color: A string defining the colour of the edges in the graph. By default ``#000000`` (black) is set. + :param str shape: An optional string defining what the node looks like. + There are two types of nodes. One type has the label inside of it and the other type has the label underneath it. + The types with the label inside of it are: ellipse, circle, database, box, text. + The ones with the label outside of it are: image, circularImage, diamond, dot, star, triangle, triangleDown, square and icon. + By default ``"dot"`` is set. + :param str node_image: An optional string defining the url of a custom node image. By default an image of a circle is set. + :param str edge_weight: An optional string defining the name of the property where edge weight is set on your Raphtory graph. By default ``1`` is set. + :param str edge_label: An optional string defining the name of the property where edge label is set on your Raphtory graph. By default, an empty string as the label is set. + :param bool notebook: A boolean that is set to True if using jupyter notebook. By default this is set to True. 
+ :param kwargs: Additional keyword arguments that are passed to the pyvis Network class. + + :returns: A pyvis network + + For Example: + + .. jupyter-execute:: + + from raphtory import Graph + from raphtory import export + + g = Graph() + g.add_vertex(1, src, properties={"image": "image.png"}) + g.add_edge(1, 1, 2, {"title": "edge", "weight": 1}) + g.add_edge(1, 2, 1, {"title": "edge", "weight": 3}) + + export.to_pyvis(graph=g, edge_color="#FF0000", edge_weight= "weight", shape="image", node_image="image", edge_label="title") + + """ + visGraph = Network(notebook=notebook, **kwargs) + if colour_nodes_by_type: + groups = { + value: index + 1 + for index, value in enumerate( + set(graph.vertices.properties.get(type_property)) + ) + } + + for v in graph.vertices: + image = ( + v.properties.get(node_image) + if node_image != None + else "https://cdn-icons-png.flaticon.com/512/7584/7584620.png" + ) + shape = shape if shape is not None else "dot" + if colour_nodes_by_type: + visGraph.add_node( + v.id, + label=v.name, + shape=shape, + image=image, + group=groups[v.properties.get(type_property)], + ) + else: + visGraph.add_node(v.id, label=v.name, shape=shape, image=image) + + edges = graph.edges().explode() if explode_edges else graph.edges().explode_layers() + for e in edges: + weight = e.properties.get(edge_weight) if edge_weight is not None else 1 + if weight is None: + weight = 1 + label = e.properties.get(edge_label) if edge_label is not None else "" + if label is None: + label = "" + visGraph.add_edge( + e.src.id, + e.dst.id, + value=weight, + color=edge_color, + title=label, + arrowStrikethrough=False, + ) + + return visGraph + + +def to_networkx( + graph, + explode_edges=False, + include_vertex_properties=True, + include_edge_properties=True, + include_update_history=True, + include_property_histories=True, +): + r"""Returns a graph with NetworkX. + .. note:: + + Network X is a required dependency. 
+ If you intend to use this function make sure that + you install Network X with ``pip install networkx`` + + :param Graph graph: A Raphtory graph. + :param bool explode_edges: A boolean that is set to True if you want to explode the edges in the graph. By default this is set to False. + :param bool include_vertex_properties: A boolean that is set to True if you want to include the vertex properties in the graph. By default this is set to True. + :param bool include_edge_properties: A boolean that is set to True if you want to include the edge properties in the graph. By default this is set to True. + :param bool include_update_history: A boolean that is set to True if you want to include the update histories in the graph. By default this is set to True. + :param bool include_property_histories: A boolean that is set to True if you want to include the histories in the graph. By default this is set to True. + + :returns: A Networkx MultiDiGraph. + """ + + networkXGraph = nx.MultiDiGraph() + + vertex_tuples = [] + for v in graph.vertices: + properties = {} + if include_vertex_properties: + if include_property_histories: + properties.update(v.properties.constant.as_dict()) + properties.update(v.properties.temporal.histories()) + else: + properties = v.properties.as_dict() + if include_update_history: + properties.update({"update_history": v.history()}) + vertex_tuples.append((v.name, properties)) + networkXGraph.add_nodes_from(vertex_tuples) + + edge_tuples = [] + edges = graph.edges().explode() if explode_edges else graph.edges().explode_layers() + for e in edges: + properties = {} + src = e.src.name + dst = e.dst.name + if include_edge_properties: + if include_property_histories: + properties.update(e.properties.constant.as_dict()) + properties.update(e.properties.temporal.histories()) + else: + properties = e.properties.as_dict() + layer = e.layer_name + if layer is not None: + properties.update({"layer": layer}) + if include_update_history: + if explode_edges: + 
properties.update({"update_history": e.time}) + else: + properties.update({"update_history": e.history()}) + edge_tuples.append((src, dst, properties)) + + networkXGraph.add_edges_from(edge_tuples) + + return networkXGraph + + +def to_edge_df( + graph, + explode_edges=False, + include_edge_properties=True, + include_update_history=True, + include_property_histories=True, +): + r"""Returns an edge list pandas dataframe for the given graph. + .. note:: + + Pandas is a required dependency. + If you intend to use this function make sure that + you install pandas with ``pip install pandas`` + + :param Graph graph: A Raphtory graph. + :param bool explode_edges: A boolean that is set to True if you want to explode the edges in the graph. By default this is set to False. + :param bool include_edge_properties: A boolean that is set to True if you want to include the edge properties in the graph. By default this is set to True. + :param bool include_update_history: A boolean that is set to True if you want to include the update histories in the graph. By default this is set to True. + :param bool include_property_histories: A boolean that is set to True if you want to include the histories in the graph. By default this is set to True. + + :returns: A pandas dataframe. 
+ """ + edge_tuples = [] + + columns = ["src", "dst", "layer"] + if include_edge_properties: + columns.append("properties") + if include_update_history: + columns.append("update_history") + + edges = graph.edges().explode() if explode_edges else graph.edges().explode_layers() + for e in edges: + tuple = [e.src.name, e.dst.name, e.layer_name] + if include_edge_properties: + properties = {} + if include_property_histories: + properties.update(e.properties.constant.as_dict()) + properties.update(e.properties.temporal.histories()) + else: + properties = e.properties.as_dict() + tuple.append(properties) + + if include_update_history: + if explode_edges: + tuple.append(e.time) + else: + tuple.append(e.history()) + + edge_tuples.append(tuple) + + return pd.DataFrame(edge_tuples, columns=columns) + + +def to_vertex_df( + graph, + include_vertex_properties=True, + include_update_history=True, + include_property_histories=True, +): + r"""Returns an vertex list pandas dataframe for the given graph. + + .. note:: + + Pandas is a required dependency. + If you intend to use this function make sure that + you install pandas with ``pip install pandas`` + + :param Graph graph: A Raphtory graph. + :param bool include_vertex_properties: A boolean that is set to True if you want to include the vertex properties in the graph. By default this is set to True. + :param bool include_update_history: A boolean that is set to True if you want to include the update histories in the graph. By default this is set to True. + :param bool include_property_histories: A boolean that is set to True if you want to include the histories in the graph. By default this is set to True. + + :returns: A pandas dataframe. 
+ + """ + vertex_tuples = [] + columns = ["id"] + if include_vertex_properties: + columns.append("properties") + if include_update_history: + columns.append("update_history") + + for v in graph.vertices: + tuple = [v.name] + if include_vertex_properties: + properties = {} + if include_property_histories: + properties.update(v.properties.constant.as_dict()) + properties.update(v.properties.temporal.histories()) + else: + properties = v.properties.as_dict() + tuple.append(properties) + if include_update_history: + tuple.append(v.history()) + vertex_tuples.append(tuple) + return pd.DataFrame(vertex_tuples, columns=columns) diff --git a/python/python/raphtory/graphqlclient.py b/python/python/raphtory/graphqlclient.py new file mode 100644 index 0000000000..7bc130bfcf --- /dev/null +++ b/python/python/raphtory/graphqlclient.py @@ -0,0 +1,128 @@ +from gql import Client, gql +from gql.transport.requests import RequestsHTTPTransport +import raphtory +from raphtory import internal_graphql + + +class RaphtoryGraphQLClient: + """ + A client for handling GraphQL operations in the context of Raphtory. + """ + + def __init__(self, url: str): + """ + Initialize a GraphQL Client Connection. + + Args: + url (str): URL to a server with the port appended to the URL. + + Note: + This constructor creates a GraphQL client connection to the given URL. + """ + transport = RequestsHTTPTransport(url=url, use_json=True) + self.client = Client(transport=transport, fetch_schema_from_transport=True) + # Below attempts to connect to the server with the url + # self.client.connect_sync() + + def query(self, query: str, variables: dict = {}): + """ + Execute a GraphQL query. + + Args: + query (str): The GraphQL query string. + variables (dict, optional): Variables for the query. Defaults to an empty dictionary. + + Returns: + dict: Result of the query. 
+ """ + query = gql(query) + return self.client.execute(query, variables) + + def load_graphs_from_path(self, path: str) -> dict: + """ + Load graphs from a directory of bincode files. + + Args: + path (str): Directory containing bincode files. + + Returns: + dict: Result after executing the mutation. + + Note: + Existing graphs with the same name are overwritten. + """ + mutation_q = gql( + """ + mutation LoadGraphsFromPath($path: String!) { + loadGraphsFromPath(path: $path) + } + """ + ) + result = self.client.execute(mutation_q, variable_values={"path": path}) + if len(result["loadGraphsFromPath"]): + print("Loaded %i graph(s)" % len(result["loadGraphsFromPath"])) + return result + else: + print("Could not find a graph to load") + return result + + def load_new_graphs_from_path(self, path: str) -> dict: + """ + Load new graphs from a directory of bincode files. + + Args: + path (str): Directory containing bincode files. + + Returns: + dict: Result after executing the mutation. + + Note: + Existing graphs will not be overwritten. + """ + mutation_q = gql( + """ + mutation LoadNewGraphsFromPath($path: String!) { + loadNewGraphsFromPath(path: $path) + } + """ + ) + result = self.client.execute(mutation_q, variable_values={"path": path}) + + if len(result["loadNewGraphsFromPath"]): + print("Loaded %i graph(s)" % len(result["loadNewGraphsFromPath"])) + return result + else: + print("Could not find a graph to load") + return result + + def send_graph(self, name: str, graph: raphtory.Graph): + """ + Upload a graph to the GraphQL Server. + + Args: + name (str): Name of the graph. + graph (raphtory.Graph): Graph object to be uploaded. + + Returns: + dict: Result after executing the mutation. + + Raises: + Exception: If there's an error sending the graph. + """ + encoded_graph = internal_graphql.encode_graph(graph) + + mutation_q = gql( + """ + mutation SendGraph($name: String!, $graph: String!) 
{ + sendGraph(name: $name, graph: $graph) + } + """ + ) + result = self.client.execute( + mutation_q, variable_values={"name": name, "graph": encoded_graph} + ) + if "sendGraph" in result: + print("Sent graph %s to GraphlQL Server" % len(result["sendGraph"])) + return result + else: + raise Exception("Error Sending Graph %s" % result) diff --git a/python/python/raphtory/graphqlserver.py b/python/python/raphtory/graphqlserver.py new file mode 100644 index 0000000000..360feafa4e --- /dev/null +++ b/python/python/raphtory/graphqlserver.py @@ -0,0 +1,103 @@ +""" +This module contains helper functions and classes for working with the GraphQL server for Raphtory. +Calling the run_server function will start the GraphQL server. If run in the background, this will return a +GraphQLServer object that can be used to run queries. +""" + +from raphtory import internal_graphql +import asyncio +import threading +import requests +import time +from raphtory import graphqlclient + + +class GraphQLServer: + """ + A helper class that can be used to query the Raphtory GraphQL server. + """ + + def __init__(self, port): + self.port = port + + def query(self, query): + """ + Runs a GraphQL query on the server. + + :param query(str): The GraphQL query to run. + + :raises Exception: If the query fails to run. + + :return: Returns the json-encoded content of a response, if any. + + """ + r = requests.post("http://localhost:" + str(self.port), json={"query": query}) + if r.status_code == 200: + return r.json() + else: + raise Exception(f"Query failed to run with a {r.status_code}.") + + def wait_for_online(self): + """ + Waits for the server to be online. This is called automatically when run_server is called. 
+ """ + while True: + try: + r = requests.get("http://localhost:" + str(self.port)) + if r.status_code == 200: + return True + except: + pass + time.sleep(1) + + +async def _from_map_and_directory(graphs, graph_dir, port): + await internal_graphql.from_map_and_directory(graphs, graph_dir, port) + + +async def _from_directory(graph_dir, port): + await internal_graphql.from_directory(graph_dir, port) + + +async def _from_map(graphs, port): + await internal_graphql.from_map(graphs, port) + + +def _run(func, daemon, port): + if daemon: + + def _run_in_background(): + asyncio.run(func) + + threading.Thread(target=_run_in_background, daemon=True).start() + server = GraphQLServer(port) + server.wait_for_online() + return graphqlclient.RaphtoryGraphQLClient("http://localhost:" + str(port)) + else: + loop = asyncio.get_event_loop() + loop.run_until_complete(func) + loop.close() + + +def run_server(graphs=None, graph_dir=None, port=1736, daemon=False): + """ + Runs the Raphtory GraphQL server. + + Args: + graphs (dict, optional): A dictionary of graphs to load into the server. Default is None. + graph_dir (str, optional): The directory to load graphs from. Default is None. + port (int, optional): The port to run the server on. Default is 1736. + daemon (bool, optional): Whether to run the server in the background. Default is False. + + Returns: + GraphQLServer: A GraphQLServer object that can be used to query the server. (Only if daemon is True) + """ + + if graph_dir is not None and graphs is not None: + return _run(_from_map_and_directory(graphs, graph_dir, port), daemon, port) + elif graph_dir is not None: + return _run(_from_directory(graph_dir, port), daemon, port) + elif graphs is not None: + return _run(_from_map(graphs, port), daemon, port) + else: + print("No graphs or graph directory specified. 
Exiting.") diff --git a/python/python/raphtory/nullmodels.py b/python/python/raphtory/nullmodels.py index fa5fc0923e..46b026a0dd 100644 --- a/python/python/raphtory/nullmodels.py +++ b/python/python/raphtory/nullmodels.py @@ -1,15 +1,36 @@ """ -Generate null models for a graph. +Generate randomised reference models for a temporal graph edgelist """ import pandas as pd -def shuffle_column(graph_df:pd.DataFrame, col_number=None, col_name=None, inplace=False): + +def shuffle_column( + graph_df: pd.DataFrame, col_number=None, col_name=None, inplace=False +): """ - returns a dataframe with a given column shuffled + Returns an edgelist with a given column shuffled. Exactly one of col_number or col_name should be specified. + + Args: + graph_df (pd.DataFrame): The input DataFrame representing the timestamped edgelist. + col_number (int, optional): The column number to shuffle. Default is None. + col_name (str, optional): The column name to shuffle. Default is None. + inplace (bool, optional): If True, shuffles the column in-place. Otherwise, creates a copy of the DataFrame. Default is False. + + Returns: + pd.DataFrame: The shuffled DataFrame with the specified column. + + Raises: + AssertionError: If neither col_number nor col_name is provided. + AssertionError: If both col_number and col_name are provided. + """ - assert col_number is not None or col_name is not None, f"No column number or name provided." - assert not (col_name is not None and col_number is not None), f"Cannot have both a column number and a column name." + assert ( + col_number is not None or col_name is not None + ), f"No column number or name provided." + assert not ( + col_name is not None and col_number is not None + ), f"Cannot have both a column number and a column name." 
if inplace: df = graph_df @@ -19,21 +40,45 @@ def shuffle_column(graph_df:pd.DataFrame, col_number=None, col_name=None, inplac no_events = len(df) if col_number is not None: - col = df[[col_number]].sample(n=no_events) - col.reset_index(inplace=True,drop=True) - df[[col_number]] = col + col = df[df.columns[col_number]].sample(n=no_events) + col.reset_index(inplace=True, drop=True) + df[df.columns[col_number]] = col if col_name is not None: col = df[col_name].sample(n=no_events) - col.reset_index(inplace=True,drop=True) - + col.reset_index(inplace=True, drop=True) + df[col_name] = col return df -def shuffle_multiple_columns(graph_df:pd.DataFrame, col_numbers:list=None, col_names:list=None, inplace=False): + +def shuffle_multiple_columns( + graph_df: pd.DataFrame, + col_numbers: list = None, + col_names: list = None, + inplace=False, +): """ - returns a dataframe with a given columns shuffled. + Returns an edgelist with given columns shuffled. Exactly one of col_numbers or col_names should be specified. + + Args: + graph_df (pd.DataFrame): The input DataFrame representing the graph. + col_numbers (list, optional): The list of column numbers to shuffle. Default is None. + col_names (list, optional): The list of column names to shuffle. Default is None. + inplace (bool, optional): If True, shuffles the columns in-place. Otherwise, creates a copy of the DataFrame. Default is False. + + Returns: + pd.DataFrame: The shuffled DataFrame with the specified columns. + + Raises: + AssertionError: If neither col_numbers nor col_names are provided. + AssertionError: If both col_numbers and col_names are provided. + """ - assert col_numbers is not None or col_names is not None, f"No column numbers or names provided." - assert not (col_names is not None and col_numbers is not None), f"Cannot have both column numbers and column names." + assert ( + col_numbers is not None or col_names is not None + ), f"No column numbers or names provided." 
+ assert not ( + col_names is not None and col_numbers is not None + ), f"Cannot have both column numbers and column names." if col_numbers is not None: for n in col_numbers: @@ -41,19 +86,38 @@ def shuffle_multiple_columns(graph_df:pd.DataFrame, col_numbers:list=None, col_n if col_names is not None: for name in col_names: df = shuffle_column(graph_df, col_name=name) - return df - -def permuted_timestamps_model(graph_df:pd.DataFrame, time_col:int=None, time_name:str=None, inplace=False, sorted=False): + + +def permuted_timestamps_model( + graph_df: pd.DataFrame, + time_col: int = None, + time_name: str = None, + inplace=False, + sorted=False, +): """ - returns a dataframe with the time column shuffled + Returns a DataFrame with the time column shuffled. + + Args: + graph_df (pd.DataFrame): The input DataFrame representing the graph. + time_col (int, optional): The column number of the time column to shuffle. Default is None. + time_name (str, optional): The column name of the time column to shuffle. Default is None. + inplace (bool, optional): If True, shuffles the time column in-place. Otherwise, creates a copy of the DataFrame. Default is False. + sorted (bool, optional): If True, sorts the DataFrame by the shuffled time column. Default is False. + + Returns: + pd.DataFrame or None: The shuffled DataFrame with the time column, or None if inplace=True. 
+ """ shuffled_df = shuffle_column(graph_df, time_col, time_name, inplace) if sorted: - shuffled_df.sort_values(by=time_name if time_name else shuffled_df.columns[time_col], inplace=True) - + shuffled_df.sort_values( + by=time_name if time_name else shuffled_df.columns[time_col], inplace=True + ) + if inplace: return else: - return shuffled_df \ No newline at end of file + return shuffled_df diff --git a/python/python/raphtory/vis.py b/python/python/raphtory/vis.py deleted file mode 100644 index 4011d8c6c0..0000000000 --- a/python/python/raphtory/vis.py +++ /dev/null @@ -1,153 +0,0 @@ -""" -Generate a visualisation using matplotlib or pyvis from Raphtory graphs. -""" -from pyvis.network import Network -import networkx as nx - -r"""Draw a graph with Pyvis. - -.. note:: - - Pyvis is a required dependency. - If you intend to use this function make sure that - you install Pyvis with ``pip install pyvis`` - -:param graph: A Raphtory graph. -:param str height: A string defining the height of the graph. By default ``800px`` is set. -:param str width: A string defining the width of the graph. By default ``800px`` is set. -:param str bg_color: A string defining the colour of the graph background. It must be a HTML color code. By default ``#white`` (white) is set. -:param str font_color: A string defining the colour of the graph font. By default ``"black"`` is set. -:param str edge_color: A string defining the colour of the edges in the graph. By default ``#000000`` (black) is set. -:param str shape: An optional string defining what the node looks like. - There are two types of nodes. One type has the label inside of it and the other type has the label underneath it. - The types with the label inside of it are: ellipse, circle, database, box, text. - The ones with the label outside of it are: image, circularImage, diamond, dot, star, triangle, triangleDown, square and icon. - By default ``"dot"`` is set. 
-:param str node_image: An optional string defining the url of a custom node image. By default an image of a circle is set. -:param str edge_weight: An optional string defining the name of the property where edge weight is set on your Raphtory graph. By default ``1`` is set. -:param str edge_label: An optional string defining the name of the property where edge label is set on your Raphtory graph. By default, an empty string as the label is set. -:param bool notebook: A boolean that is set to True if using jupyter notebook. By default this is set to True. - - -:returns: A pyvis visualisation in static HTML format that is interactive with toggles menu. -:rtype: IFrame(name, width=self.width, height=self.height) - -For Example: - -.. jupyter-execute:: - - from raphtory import Graph - from raphtory import vis - - g = Graph() - g.add_vertex(1, src, properties={"image": "image.png"}) - g.add_edge(1, 1, 2, {"title": "edge", "weight": 1}) - g.add_edge(1, 2, 1, {"title": "edge", "weight": 3}) - - vis.to_pyvis(graph=g, edge_color="#FF0000", edge_weight= "weight", shape="image", node_image="image", edge_label="title") - -""" - -def to_pyvis( - graph, - height="800px", - width="800px", - bg_color="#white", - font_color="black", - edge_color="#000000", - shape=None, - node_image=None, - edge_weight=None, - edge_label=None, - notebook=True, - ): - """ - Returns a dynamic visualisation in static HTML format from a Raphtory graph. 
- """ - visGraph = Network(height=height, width=width, bgcolor=bg_color, font_color=font_color, notebook=notebook) - - for v in graph.vertices(): - image = v.property(node_image) if node_image != None else "https://cdn-icons-png.flaticon.com/512/7584/7584620.png" - shape = shape if shape != None else "dot" - visGraph.add_node(v.id(), label= v.name(), shape=shape, image=image) - - for e in graph.edges(): - weight = e.property(edge_weight) if edge_weight != None else 1 - label = e.property(edge_label) if edge_label != None else "" - visGraph.add_edge(e.src().id(), e.dst().id(), value=weight, color=edge_color, title=label) - - visGraph.show_buttons(filter_=['physics']) - visGraph.show('nx.html') - return visGraph - -r"""Draw a graph with NetworkX. - -.. note:: - - Network X is a required dependency. - If you intend to use this function make sure that - you install Network X with ``pip install networkx`` - -:param graph: A Raphtory graph. -:param float k: A float defining optimal distance between nodes. If None the distance is set to 1/sqrt(n) where n is the number of nodes. Increase this value to move nodes farther apart. -:param int iterations: An integer defining the maximum number of iterations taken to generate the optimum spring layout. Increasing this number will increase the computational time to generate the layout. By default ``50`` is set. -:param scalar or array node_size: A scalar defining the size of nodes. By default ``300`` is set. -:param color or array of colors node_color: Node color. Can be a single color or a sequence of colors with the same length as nodelist. Color can be string or rgb (or rgba) tuple of floats from 0-1. If numeric values are specified they will be mapped to colors using the cmap and vmin,vmax parameters. See matplotlib.scatter for more details. By default ``"#1f78b4"`` (blue) is set. -:param color or array of colors edge_color: Edge color. Can be a single color or a sequence of colors with the same length as edgelist. 
Color can be string or rgb (or rgba) tuple of floats from 0-1. If numeric values are specified they will be mapped to colors using the edge_cmap and edge_vmin,edge_vmax parameters. By default ``'k'`` (black) is set. -:param bool arrows: If None, directed graphs draw arrowheads with FancyArrowPatch, while undirected graphs draw edges via LineCollection for speed. If True, draw arrowheads with FancyArrowPatches (bendable and stylish). If False, draw edges using LineCollection (linear and fast). - Note: Arrowheads will be the same color as edges. Default is None. -:param str arrow_style: Style of the edges, defaults to ``‘-|>’``. - -:returns: A networkx visualisation that appears in the notebook output. -:rtype: matplotlib.collections.PathCollection and matplotlib.collections.LineCollection or a list of matplotlib.patches.FancyArrowPatch. - `PathCollection` of the nodes. - If ``arrows=True``, a list of FancyArrowPatches is returned. - If ``arrows=False``, a LineCollection is returned. - If ``arrows=None`` (the default), then a LineCollection is returned if - `G` is undirected, otherwise returns a list of FancyArrowPatches. - -For Example: - -.. jupyter-execute:: - - from raphtory import Graph - from raphtory import vis - - g = Graph() - g.add_vertex(1, src, properties={"image": "image.png"}) - g.add_edge(1, 1, 2, {"title": "edge", "weight": 1}) - g.add_edge(1, 2, 1, {"title": "edge", "weight": 3}) - - vis.to_networkx(graph=g, k=0.15, iterations=100, node_size=500, node_color='red', edge_color='blue', arrows=True) - -""" -def to_networkx( - graph, - k=None, - iterations=50, - node_size=300, - node_color='#1f78b4', - edge_color='k', - arrows=None, - arrow_style= "-|>" - ): - """ - Returns a Network X graph visualiation from a Raphtory graph. 
- """ - - networkXGraph = nx.MultiDiGraph() - - networkXGraph.add_nodes_from(list(graph.vertices().id())) - - edges = [] - for e in graph.edges(): - edges.append((e.src().id(), e.dst().id())) - - networkXGraph.add_edges_from(edges) - pos = nx.spring_layout(networkXGraph, k=k, iterations=iterations) - - nx.draw_networkx_nodes(networkXGraph, pos, node_size=node_size, node_color=node_color) - nx.draw_networkx_edges(networkXGraph, pos, edge_color=edge_color, arrows=arrows, arrowstyle=arrow_style) - - - diff --git a/python/src/graphql.rs b/python/src/graphql.rs new file mode 100644 index 0000000000..048cd2050f --- /dev/null +++ b/python/src/graphql.rs @@ -0,0 +1,85 @@ +use pyo3::{exceptions, prelude::*}; +use raphtory_core::{ + db::api::view::internal::MaterializedGraph, + prelude::Graph, + python::{graph::graph::PyGraph, utils::errors::adapt_err_value}, +}; +use raphtory_graphql::{url_decode_graph, url_encode_graph, RaphtoryServer}; +use std::collections::HashMap; + +#[pyfunction] +pub fn from_map( + py: Python, + graphs: HashMap, + port: Option, +) -> PyResult<&PyAny> { + let graphs: HashMap = graphs + .into_iter() + .map(|(key, value)| (key, value.into())) + .collect(); + let server = RaphtoryServer::from_map(graphs); + let port = port.unwrap_or(1736); + pyo3_asyncio::tokio::future_into_py(py, async move { + server + .run_with_port(port) + .await + .map_err(|e| adapt_err_value(&e)) + }) +} + +#[pyfunction] +pub fn from_directory(py: Python, path: String, port: Option) -> PyResult<&PyAny> { + let server = RaphtoryServer::from_directory(path.as_str()); + let port = port.unwrap_or(1736); + pyo3_asyncio::tokio::future_into_py(py, async move { + server + .run_with_port(port) + .await + .map_err(|e| adapt_err_value(&e)) + }) +} + +#[pyfunction] +pub fn from_map_and_directory( + py: Python, + graphs: HashMap, + path: String, + port: Option, +) -> PyResult<&PyAny> { + let graphs: HashMap = graphs + .into_iter() + .map(|(key, value)| (key, value.into())) + .collect(); + let 
port = port.unwrap_or(1736); + let server = RaphtoryServer::from_map_and_directory(graphs, path.as_str()); + pyo3_asyncio::tokio::future_into_py(py, async move { + server + .run_with_port(port) + .await + .map_err(|e| adapt_err_value(&e)) + }) +} + +#[pyfunction] +pub fn encode_graph(graph: MaterializedGraph) -> PyResult { + let result = url_encode_graph(graph); + match result { + Ok(s) => Ok(s), + Err(e) => Err(exceptions::PyValueError::new_err(format!( + "Error encoding: {:?}", + e + ))), + } +} + +#[pyfunction] +pub fn decode_graph(py: Python, encoded_graph: String) -> PyResult { + let result = url_decode_graph(encoded_graph); + match result { + Ok(s) => Ok(s.into_py(py)), + Err(e) => Err(exceptions::PyValueError::new_err(format!( + "Error decoding: {:?}", + e + ))), + } +} diff --git a/python/src/lib.rs b/python/src/lib.rs index 0222eaf018..9dd2e70636 100644 --- a/python/src/lib.rs +++ b/python/src/lib.rs @@ -1,32 +1,53 @@ -extern crate core; +mod graphql; -use py_raphtory::algorithms::*; -use py_raphtory::graph::PyGraph; -use py_raphtory::graph_gen::*; -use py_raphtory::graph_loader::*; +extern crate core; +use graphql::*; use pyo3::prelude::*; -use py_raphtory::edge::{PyEdge, PyEdges}; -use py_raphtory::vertex::{PyVertex, PyVertices}; +use raphtory_core::python::{ + graph::{ + algorithm_result::AlgorithmResultStrU64, + edge::{PyDirection, PyEdge, PyEdges}, + graph::PyGraph, + graph_with_deletions::PyGraphWithDeletions, + properties::{PyConstProperties, PyProperties, PyTemporalProp, PyTemporalProperties}, + vertex::{PyVertex, PyVertices}, + }, + packages::{algorithms::*, graph_gen::*, graph_loader::*}, +}; /// Raphtory graph analytics library #[pymodule] fn raphtory(py: Python<'_>, m: &PyModule) -> PyResult<()> { + //Graph classes m.add_class::()?; + m.add_class::()?; + m.add_class::()?; + m.add_class::()?; + m.add_class::()?; + m.add_class::()?; + m.add_class::()?; + m.add_class::()?; + m.add_class::()?; + m.add_class::()?; + m.add_class::()?; + + //GRAPHQL + 
let graphql_module = PyModule::new(py, "internal_graphql")?; + graphql_module.add_function(wrap_pyfunction!(from_map, graphql_module)?)?; + graphql_module.add_function(wrap_pyfunction!(from_directory, graphql_module)?)?; + graphql_module.add_function(wrap_pyfunction!(from_map_and_directory, graphql_module)?)?; + graphql_module.add_function(wrap_pyfunction!(encode_graph, graphql_module)?)?; + graphql_module.add_function(wrap_pyfunction!(decode_graph, graphql_module)?)?; + m.add_submodule(graphql_module)?; + //ALGORITHMS let algorithm_module = PyModule::new(py, "algorithms")?; algorithm_module.add_function(wrap_pyfunction!(global_reciprocity, algorithm_module)?)?; algorithm_module.add_function(wrap_pyfunction!(all_local_reciprocity, algorithm_module)?)?; + m.add_class::()?; + algorithm_module.add_function(wrap_pyfunction!(triplet_count, algorithm_module)?)?; - algorithm_module.add_function(wrap_pyfunction!( - global_clustering_coefficient, - algorithm_module - )?)?; algorithm_module.add_function(wrap_pyfunction!(local_triangle_count, algorithm_module)?)?; - algorithm_module.add_function(wrap_pyfunction!(generic_taint, algorithm_module)?)?; - algorithm_module.add_function(wrap_pyfunction!( - local_clustering_coefficient, - algorithm_module - )?)?; algorithm_module.add_function(wrap_pyfunction!(average_degree, algorithm_module)?)?; algorithm_module.add_function(wrap_pyfunction!(directed_graph_density, algorithm_module)?)?; algorithm_module.add_function(wrap_pyfunction!(max_out_degree, algorithm_module)?)?; @@ -35,11 +56,20 @@ fn raphtory(py: Python<'_>, m: &PyModule) -> PyResult<()> { algorithm_module.add_function(wrap_pyfunction!(min_in_degree, algorithm_module)?)?; algorithm_module.add_function(wrap_pyfunction!(pagerank, algorithm_module)?)?; algorithm_module.add_function(wrap_pyfunction!( - weakly_connected_components, + global_clustering_coefficient, algorithm_module )?)?; + algorithm_module.add_function(wrap_pyfunction!( - temporal_three_node_motif, + 
temporally_reachable_nodes, + algorithm_module + )?)?; + algorithm_module.add_function(wrap_pyfunction!( + local_clustering_coefficient, + algorithm_module + )?)?; + algorithm_module.add_function(wrap_pyfunction!( + weakly_connected_components, algorithm_module )?)?; algorithm_module.add_function(wrap_pyfunction!( @@ -47,21 +77,30 @@ fn raphtory(py: Python<'_>, m: &PyModule) -> PyResult<()> { algorithm_module )?)?; algorithm_module.add_function(wrap_pyfunction!( - global_temporal_three_node_motif_from_local, + global_temporal_three_node_motif_multi, + algorithm_module + )?)?; + algorithm_module.add_function(wrap_pyfunction!( + local_temporal_three_node_motifs, algorithm_module )?)?; + algorithm_module.add_function(wrap_pyfunction!(hits, algorithm_module)?)?; + algorithm_module.add_function(wrap_pyfunction!(balance, algorithm_module)?)?; m.add_submodule(algorithm_module)?; + + //GRAPH LOADER let graph_loader_module = PyModule::new(py, "graph_loader")?; graph_loader_module.add_function(wrap_pyfunction!(lotr_graph, graph_loader_module)?)?; + graph_loader_module.add_function(wrap_pyfunction!(neo4j_movie_graph, graph_loader_module)?)?; + graph_loader_module.add_function(wrap_pyfunction!(stable_coin_graph, graph_loader_module)?)?; graph_loader_module.add_function(wrap_pyfunction!( reddit_hyperlink_graph, graph_loader_module )?)?; - graph_loader_module.add_function(wrap_pyfunction!(neo4j_movie_graph, graph_loader_module)?)?; - graph_loader_module.add_function(wrap_pyfunction!(stable_coin_graph, graph_loader_module)?)?; m.add_submodule(graph_loader_module)?; + //GRAPH GENERATOR let graph_gen_module = PyModule::new(py, "graph_gen")?; graph_gen_module.add_function(wrap_pyfunction!(random_attachment, graph_gen_module)?)?; graph_gen_module.add_function(wrap_pyfunction!( @@ -70,10 +109,11 @@ fn raphtory(py: Python<'_>, m: &PyModule) -> PyResult<()> { )?)?; m.add_submodule(graph_gen_module)?; - m.add_class::()?; - m.add_class::()?; - m.add_class::()?; - m.add_class::()?; + // 
TODO: re-enable + //VECTORS + // let vectors_module = PyModule::new(py, "vectors")?; + // vectors_module.add_class::()?; + // m.add_submodule(vectors_module)?; Ok(()) } diff --git a/python/tests/data/network_traffic_edges.csv b/python/tests/data/network_traffic_edges.csv new file mode 100644 index 0000000000..aa5cfa1563 --- /dev/null +++ b/python/tests/data/network_traffic_edges.csv @@ -0,0 +1,10 @@ +timestamp,source,destination,data_size_MB,transaction_type,is_encrypted +2023-09-01T08:00:00Z,ServerA,ServerB,5.6,Critical System Request,True +2023-09-01T08:05:00Z,ServerA,ServerC,7.1,File Transfer,False +2023-09-01T08:10:00Z,ServerB,ServerD,3.2,Standard Service Request,True +2023-09-01T08:15:00Z,ServerD,ServerE,8.9,Administrative Command,False +2023-09-01T08:20:00Z,ServerC,ServerA,4.5,Critical System Request,True +2023-09-01T08:25:00Z,ServerE,ServerB,6.2,File Transfer,False +2023-09-01T08:30:00Z,ServerD,ServerC,5.0,Standard Service Request,True +2023-09-01T08:31:00Z,ServerD,ServerC,10.0,Standard Service Request,True +2023-09-01T08:32:00Z,ServerD,ServerC,15.0,Standard Service Request,True diff --git a/python/tests/data/network_traffic_vertices.csv b/python/tests/data/network_traffic_vertices.csv new file mode 100644 index 0000000000..4191ee20b1 --- /dev/null +++ b/python/tests/data/network_traffic_vertices.csv @@ -0,0 +1,8 @@ +timestamp,server_id,server_name,hardware_type,OS_version,primary_function,uptime_days +2023-09-01T08:00:00Z,ServerA,Alpha,Blade Server,Ubuntu 20.04,Database,120 +2023-09-01T08:01:00Z,ServerA,Alpha,Blade Server,Ubuntu 20.04,Database,121 +2023-09-01T08:02:00Z,ServerA,Alpha,Blade Server,Ubuntu 20.04,Database,122 +2023-09-01T08:05:00Z,ServerB,Beta,Rack Server,Red Hat 8.1,Web Server,45 +2023-09-01T08:10:00Z,ServerC,Charlie,Blade Server,Windows Server 2022,File Storage,90 +2023-09-01T08:15:00Z,ServerD,Delta,Tower Server,Ubuntu 20.04,Application Server,60 +2023-09-01T08:20:00Z,ServerE,Echo,Rack Server,Red Hat 8.1,Backup,30 \ No newline at end of file 
diff --git a/python/tests/expected/dataframe_output/edge_df_all.json b/python/tests/expected/dataframe_output/edge_df_all.json new file mode 100644 index 0000000000..aa0fd10414 --- /dev/null +++ b/python/tests/expected/dataframe_output/edge_df_all.json @@ -0,0 +1 @@ +{"src":{"0":"ServerA","1":"ServerA","2":"ServerB","3":"ServerC","4":"ServerD","5":"ServerD","6":"ServerE"},"dst":{"0":"ServerB","1":"ServerC","2":"ServerD","3":"ServerA","4":"ServerC","5":"ServerE","6":"ServerB"},"layer":{"0":"Critical System Request","1":"File Transfer","2":"Standard Service Request","3":"Critical System Request","4":"Standard Service Request","5":"Administrative Command","6":"File Transfer"},"properties":{"0":{"datasource":"data\/network_traffic_edges.csv","is_encrypted":true,"data_size_MB":[[1693555200000,5.6]]},"1":{"is_encrypted":false,"datasource":"data\/network_traffic_edges.csv","data_size_MB":[[1693555500000,7.1]]},"2":{"is_encrypted":true,"datasource":"data\/network_traffic_edges.csv","data_size_MB":[[1693555800000,3.2]]},"3":{"datasource":"data\/network_traffic_edges.csv","is_encrypted":true,"data_size_MB":[[1693556400000,4.5]]},"4":{"datasource":"data\/network_traffic_edges.csv","is_encrypted":true,"data_size_MB":[[1693557000000,5.0],[1693557060000,10.0],[1693557120000,15.0]]},"5":{"datasource":"data\/network_traffic_edges.csv","is_encrypted":false,"data_size_MB":[[1693556100000,8.9]]},"6":{"datasource":"data\/network_traffic_edges.csv","is_encrypted":false,"data_size_MB":[[1693556700000,6.2]]}},"update_history":{"0":[1693555200000],"1":[1693555500000],"2":[1693555800000],"3":[1693556400000],"4":[1693557000000,1693557060000,1693557120000],"5":[1693556100000],"6":[1693556700000]}} \ No newline at end of file diff --git a/python/tests/expected/dataframe_output/edge_df_exploded.json b/python/tests/expected/dataframe_output/edge_df_exploded.json new file mode 100644 index 0000000000..ab848f74f9 --- /dev/null +++ b/python/tests/expected/dataframe_output/edge_df_exploded.json @@ 
-0,0 +1 @@ +{"src":{"0":"ServerA","1":"ServerA","2":"ServerB","3":"ServerC","4":"ServerD","5":"ServerD","6":"ServerD","7":"ServerD","8":"ServerE"},"dst":{"0":"ServerB","1":"ServerC","2":"ServerD","3":"ServerA","4":"ServerC","5":"ServerC","6":"ServerC","7":"ServerE","8":"ServerB"},"layer":{"0":"Critical System Request","1":"File Transfer","2":"Standard Service Request","3":"Critical System Request","4":"Standard Service Request","5":"Standard Service Request","6":"Standard Service Request","7":"Administrative Command","8":"File Transfer"},"properties":{"0":{"datasource":"data\/network_traffic_edges.csv","is_encrypted":true,"data_size_MB":[[1693555200000,5.6]]},"1":{"is_encrypted":false,"datasource":"data\/network_traffic_edges.csv","data_size_MB":[[1693555500000,7.1]]},"2":{"is_encrypted":true,"datasource":"data\/network_traffic_edges.csv","data_size_MB":[[1693555800000,3.2]]},"3":{"datasource":"data\/network_traffic_edges.csv","is_encrypted":true,"data_size_MB":[[1693556400000,4.5]]},"4":{"is_encrypted":true,"datasource":"data\/network_traffic_edges.csv","data_size_MB":[[1693557000000,5.0]]},"5":{"is_encrypted":true,"datasource":"data\/network_traffic_edges.csv","data_size_MB":[[1693557060000,10.0]]},"6":{"is_encrypted":true,"datasource":"data\/network_traffic_edges.csv","data_size_MB":[[1693557120000,15.0]]},"7":{"datasource":"data\/network_traffic_edges.csv","is_encrypted":false,"data_size_MB":[[1693556100000,8.9]]},"8":{"datasource":"data\/network_traffic_edges.csv","is_encrypted":false,"data_size_MB":[[1693556700000,6.2]]}},"update_history":{"0":1693555200000,"1":1693555500000,"2":1693555800000,"3":1693556400000,"4":1693557000000,"5":1693557060000,"6":1693557120000,"7":1693556100000,"8":1693556700000}} \ No newline at end of file diff --git a/python/tests/expected/dataframe_output/edge_df_exploded_no_hist.json b/python/tests/expected/dataframe_output/edge_df_exploded_no_hist.json new file mode 100644 index 0000000000..b56c7b33d4 --- /dev/null +++ 
b/python/tests/expected/dataframe_output/edge_df_exploded_no_hist.json @@ -0,0 +1 @@ +{"src":{"0":"ServerA","1":"ServerA","2":"ServerB","3":"ServerC","4":"ServerD","5":"ServerD","6":"ServerD","7":"ServerD","8":"ServerE"},"dst":{"0":"ServerB","1":"ServerC","2":"ServerD","3":"ServerA","4":"ServerC","5":"ServerC","6":"ServerC","7":"ServerE","8":"ServerB"},"layer":{"0":"Critical System Request","1":"File Transfer","2":"Standard Service Request","3":"Critical System Request","4":"Standard Service Request","5":"Standard Service Request","6":"Standard Service Request","7":"Administrative Command","8":"File Transfer"},"properties":{"0":{"datasource":"data\/network_traffic_edges.csv","is_encrypted":true,"data_size_MB":[[1693555200000,5.6]]},"1":{"is_encrypted":false,"datasource":"data\/network_traffic_edges.csv","data_size_MB":[[1693555500000,7.1]]},"2":{"datasource":"data\/network_traffic_edges.csv","is_encrypted":true,"data_size_MB":[[1693555800000,3.2]]},"3":{"datasource":"data\/network_traffic_edges.csv","is_encrypted":true,"data_size_MB":[[1693556400000,4.5]]},"4":{"is_encrypted":true,"datasource":"data\/network_traffic_edges.csv","data_size_MB":[[1693557000000,5.0]]},"5":{"is_encrypted":true,"datasource":"data\/network_traffic_edges.csv","data_size_MB":[[1693557060000,10.0]]},"6":{"is_encrypted":true,"datasource":"data\/network_traffic_edges.csv","data_size_MB":[[1693557120000,15.0]]},"7":{"datasource":"data\/network_traffic_edges.csv","is_encrypted":false,"data_size_MB":[[1693556100000,8.9]]},"8":{"is_encrypted":false,"datasource":"data\/network_traffic_edges.csv","data_size_MB":[[1693556700000,6.2]]}}} \ No newline at end of file diff --git a/python/tests/expected/dataframe_output/edge_df_exploded_no_prop_hist.json b/python/tests/expected/dataframe_output/edge_df_exploded_no_prop_hist.json new file mode 100644 index 0000000000..c960e1cd30 --- /dev/null +++ b/python/tests/expected/dataframe_output/edge_df_exploded_no_prop_hist.json @@ -0,0 +1 @@ 
+{"src":{"0":"ServerA","1":"ServerA","2":"ServerB","3":"ServerC","4":"ServerD","5":"ServerD","6":"ServerD","7":"ServerD","8":"ServerE"},"dst":{"0":"ServerB","1":"ServerC","2":"ServerD","3":"ServerA","4":"ServerC","5":"ServerC","6":"ServerC","7":"ServerE","8":"ServerB"},"layer":{"0":"Critical System Request","1":"File Transfer","2":"Standard Service Request","3":"Critical System Request","4":"Standard Service Request","5":"Standard Service Request","6":"Standard Service Request","7":"Administrative Command","8":"File Transfer"},"properties":{"0":{"data_size_MB":5.6,"is_encrypted":true,"datasource":"data\/network_traffic_edges.csv"},"1":{"datasource":"data\/network_traffic_edges.csv","is_encrypted":false,"data_size_MB":7.1},"2":{"data_size_MB":3.2,"is_encrypted":true,"datasource":"data\/network_traffic_edges.csv"},"3":{"data_size_MB":4.5,"is_encrypted":true,"datasource":"data\/network_traffic_edges.csv"},"4":{"is_encrypted":true,"data_size_MB":5.0,"datasource":"data\/network_traffic_edges.csv"},"5":{"is_encrypted":true,"data_size_MB":10.0,"datasource":"data\/network_traffic_edges.csv"},"6":{"data_size_MB":15.0,"is_encrypted":true,"datasource":"data\/network_traffic_edges.csv"},"7":{"datasource":"data\/network_traffic_edges.csv","data_size_MB":8.9,"is_encrypted":false},"8":{"data_size_MB":6.2,"is_encrypted":false,"datasource":"data\/network_traffic_edges.csv"}},"update_history":{"0":1693555200000,"1":1693555500000,"2":1693555800000,"3":1693556400000,"4":1693557000000,"5":1693557060000,"6":1693557120000,"7":1693556100000,"8":1693556700000}} \ No newline at end of file diff --git a/python/tests/expected/dataframe_output/edge_df_exploded_no_props.json b/python/tests/expected/dataframe_output/edge_df_exploded_no_props.json new file mode 100644 index 0000000000..3d7debc056 --- /dev/null +++ b/python/tests/expected/dataframe_output/edge_df_exploded_no_props.json @@ -0,0 +1 @@ 
+{"src":{"0":"ServerA","1":"ServerA","2":"ServerB","3":"ServerC","4":"ServerD","5":"ServerD","6":"ServerD","7":"ServerD","8":"ServerE"},"dst":{"0":"ServerB","1":"ServerC","2":"ServerD","3":"ServerA","4":"ServerC","5":"ServerC","6":"ServerC","7":"ServerE","8":"ServerB"},"layer":{"0":"Critical System Request","1":"File Transfer","2":"Standard Service Request","3":"Critical System Request","4":"Standard Service Request","5":"Standard Service Request","6":"Standard Service Request","7":"Administrative Command","8":"File Transfer"},"update_history":{"0":1693555200000,"1":1693555500000,"2":1693555800000,"3":1693556400000,"4":1693557000000,"5":1693557060000,"6":1693557120000,"7":1693556100000,"8":1693556700000}} \ No newline at end of file diff --git a/python/tests/expected/dataframe_output/edge_df_no_hist.json b/python/tests/expected/dataframe_output/edge_df_no_hist.json new file mode 100644 index 0000000000..6c16f9c08a --- /dev/null +++ b/python/tests/expected/dataframe_output/edge_df_no_hist.json @@ -0,0 +1 @@ +{"src":{"0":"ServerA","1":"ServerA","2":"ServerB","3":"ServerC","4":"ServerD","5":"ServerD","6":"ServerE"},"dst":{"0":"ServerB","1":"ServerC","2":"ServerD","3":"ServerA","4":"ServerC","5":"ServerE","6":"ServerB"},"layer":{"0":"Critical System Request","1":"File Transfer","2":"Standard Service Request","3":"Critical System Request","4":"Standard Service Request","5":"Administrative Command","6":"File 
Transfer"},"properties":{"0":{"is_encrypted":true,"datasource":"data\/network_traffic_edges.csv","data_size_MB":[[1693555200000,5.6]]},"1":{"is_encrypted":false,"datasource":"data\/network_traffic_edges.csv","data_size_MB":[[1693555500000,7.1]]},"2":{"is_encrypted":true,"datasource":"data\/network_traffic_edges.csv","data_size_MB":[[1693555800000,3.2]]},"3":{"datasource":"data\/network_traffic_edges.csv","is_encrypted":true,"data_size_MB":[[1693556400000,4.5]]},"4":{"datasource":"data\/network_traffic_edges.csv","is_encrypted":true,"data_size_MB":[[1693557000000,5.0],[1693557060000,10.0],[1693557120000,15.0]]},"5":{"is_encrypted":false,"datasource":"data\/network_traffic_edges.csv","data_size_MB":[[1693556100000,8.9]]},"6":{"datasource":"data\/network_traffic_edges.csv","is_encrypted":false,"data_size_MB":[[1693556700000,6.2]]}}} \ No newline at end of file diff --git a/python/tests/expected/dataframe_output/edge_df_no_prop_hist.json b/python/tests/expected/dataframe_output/edge_df_no_prop_hist.json new file mode 100644 index 0000000000..6aeab277eb --- /dev/null +++ b/python/tests/expected/dataframe_output/edge_df_no_prop_hist.json @@ -0,0 +1 @@ +{"src":{"0":"ServerA","1":"ServerA","2":"ServerB","3":"ServerC","4":"ServerD","5":"ServerD","6":"ServerE"},"dst":{"0":"ServerB","1":"ServerC","2":"ServerD","3":"ServerA","4":"ServerC","5":"ServerE","6":"ServerB"},"layer":{"0":"Critical System Request","1":"File Transfer","2":"Standard Service Request","3":"Critical System Request","4":"Standard Service Request","5":"Administrative Command","6":"File 
Transfer"},"properties":{"0":{"is_encrypted":true,"datasource":"data\/network_traffic_edges.csv","data_size_MB":5.6},"1":{"is_encrypted":false,"datasource":"data\/network_traffic_edges.csv","data_size_MB":7.1},"2":{"is_encrypted":true,"datasource":"data\/network_traffic_edges.csv","data_size_MB":3.2},"3":{"datasource":"data\/network_traffic_edges.csv","data_size_MB":4.5,"is_encrypted":true},"4":{"datasource":"data\/network_traffic_edges.csv","data_size_MB":15.0,"is_encrypted":true},"5":{"datasource":"data\/network_traffic_edges.csv","is_encrypted":false,"data_size_MB":8.9},"6":{"datasource":"data\/network_traffic_edges.csv","is_encrypted":false,"data_size_MB":6.2}},"update_history":{"0":[1693555200000],"1":[1693555500000],"2":[1693555800000],"3":[1693556400000],"4":[1693557000000,1693557060000,1693557120000],"5":[1693556100000],"6":[1693556700000]}} \ No newline at end of file diff --git a/python/tests/expected/dataframe_output/edge_df_no_props.json b/python/tests/expected/dataframe_output/edge_df_no_props.json new file mode 100644 index 0000000000..fd8e7d395f --- /dev/null +++ b/python/tests/expected/dataframe_output/edge_df_no_props.json @@ -0,0 +1 @@ +{"src":{"0":"ServerA","1":"ServerA","2":"ServerB","3":"ServerC","4":"ServerD","5":"ServerD","6":"ServerE"},"dst":{"0":"ServerB","1":"ServerC","2":"ServerD","3":"ServerA","4":"ServerC","5":"ServerE","6":"ServerB"},"layer":{"0":"Critical System Request","1":"File Transfer","2":"Standard Service Request","3":"Critical System Request","4":"Standard Service Request","5":"Administrative Command","6":"File Transfer"},"update_history":{"0":[1693555200000],"1":[1693555500000],"2":[1693555800000],"3":[1693556400000],"4":[1693557000000,1693557060000,1693557120000],"5":[1693556100000],"6":[1693556700000]}} \ No newline at end of file diff --git a/python/tests/expected/dataframe_output/vertex_df_all.json b/python/tests/expected/dataframe_output/vertex_df_all.json new file mode 100644 index 0000000000..f01ebb4df1 --- /dev/null 
+++ b/python/tests/expected/dataframe_output/vertex_df_all.json @@ -0,0 +1 @@ +{"id":{"0":"ServerA","1":"ServerB","2":"ServerC","3":"ServerD","4":"ServerE"},"properties":{"0":{"server_name":"Alpha","hardware_type":"Blade Server","datasource":"data\/network_traffic_edges.csv","primary_function":[[1693555200000,"Database"],[1693555260000,"Database"],[1693555320000,"Database"]],"uptime_days":[[1693555200000,120],[1693555260000,121],[1693555320000,122]],"OS_version":[[1693555200000,"Ubuntu 20.04"],[1693555260000,"Ubuntu 20.04"],[1693555320000,"Ubuntu 20.04"]]},"1":{"datasource":"data\/network_traffic_edges.csv","hardware_type":"Rack Server","server_name":"Beta","uptime_days":[[1693555500000,45]],"OS_version":[[1693555500000,"Red Hat 8.1"]],"primary_function":[[1693555500000,"Web Server"]]},"2":{"server_name":"Charlie","datasource":"data\/network_traffic_edges.csv","hardware_type":"Blade Server","OS_version":[[1693555800000,"Windows Server 2022"]],"primary_function":[[1693555800000,"File Storage"]],"uptime_days":[[1693555800000,90]]},"3":{"datasource":"data\/network_traffic_edges.csv","server_name":"Delta","hardware_type":"Tower Server","uptime_days":[[1693556100000,60]],"OS_version":[[1693556100000,"Ubuntu 20.04"]],"primary_function":[[1693556100000,"Application Server"]]},"4":{"server_name":"Echo","hardware_type":"Rack Server","datasource":"data\/network_traffic_edges.csv","primary_function":[[1693556400000,"Backup"]],"OS_version":[[1693556400000,"Red Hat 8.1"]],"uptime_days":[[1693556400000,30]]}},"update_history":{"0":[1693555200000,1693555260000,1693555320000,1693555500000,1693556400000],"1":[1693555200000,1693555500000,1693555800000,1693556700000],"2":[1693555500000,1693555800000,1693556400000,1693557000000,1693557060000,1693557120000],"3":[1693555800000,1693556100000,1693557000000,1693557060000,1693557120000],"4":[1693556100000,1693556400000,1693556700000]}} \ No newline at end of file diff --git a/python/tests/expected/dataframe_output/vertex_df_no_hist.json 
b/python/tests/expected/dataframe_output/vertex_df_no_hist.json new file mode 100644 index 0000000000..c166f0e4d4 --- /dev/null +++ b/python/tests/expected/dataframe_output/vertex_df_no_hist.json @@ -0,0 +1 @@ +{"id":{"0":"ServerA","1":"ServerB","2":"ServerC","3":"ServerD","4":"ServerE"},"properties":{"0":{"datasource":"data\/network_traffic_edges.csv","server_name":"Alpha","hardware_type":"Blade Server","OS_version":[[1693555200000,"Ubuntu 20.04"],[1693555260000,"Ubuntu 20.04"],[1693555320000,"Ubuntu 20.04"]],"uptime_days":[[1693555200000,120],[1693555260000,121],[1693555320000,122]],"primary_function":[[1693555200000,"Database"],[1693555260000,"Database"],[1693555320000,"Database"]]},"1":{"datasource":"data\/network_traffic_edges.csv","hardware_type":"Rack Server","server_name":"Beta","primary_function":[[1693555500000,"Web Server"]],"uptime_days":[[1693555500000,45]],"OS_version":[[1693555500000,"Red Hat 8.1"]]},"2":{"hardware_type":"Blade Server","server_name":"Charlie","datasource":"data\/network_traffic_edges.csv","uptime_days":[[1693555800000,90]],"OS_version":[[1693555800000,"Windows Server 2022"]],"primary_function":[[1693555800000,"File Storage"]]},"3":{"server_name":"Delta","hardware_type":"Tower Server","datasource":"data\/network_traffic_edges.csv","uptime_days":[[1693556100000,60]],"OS_version":[[1693556100000,"Ubuntu 20.04"]],"primary_function":[[1693556100000,"Application Server"]]},"4":{"datasource":"data\/network_traffic_edges.csv","hardware_type":"Rack Server","server_name":"Echo","uptime_days":[[1693556400000,30]],"OS_version":[[1693556400000,"Red Hat 8.1"]],"primary_function":[[1693556400000,"Backup"]]}}} \ No newline at end of file diff --git a/python/tests/expected/dataframe_output/vertex_df_no_prop_hist.json b/python/tests/expected/dataframe_output/vertex_df_no_prop_hist.json new file mode 100644 index 0000000000..1f072ff239 --- /dev/null +++ b/python/tests/expected/dataframe_output/vertex_df_no_prop_hist.json @@ -0,0 +1 @@ 
+{"id":{"0":"ServerA","1":"ServerB","2":"ServerC","3":"ServerD","4":"ServerE"},"properties":{"0":{"server_name":"Alpha","datasource":"data\/network_traffic_edges.csv","hardware_type":"Blade Server","uptime_days":122,"OS_version":"Ubuntu 20.04","primary_function":"Database"},"1":{"primary_function":"Web Server","server_name":"Beta","OS_version":"Red Hat 8.1","hardware_type":"Rack Server","datasource":"data\/network_traffic_edges.csv","uptime_days":45},"2":{"primary_function":"File Storage","server_name":"Charlie","datasource":"data\/network_traffic_edges.csv","hardware_type":"Blade Server","OS_version":"Windows Server 2022","uptime_days":90},"3":{"primary_function":"Application Server","OS_version":"Ubuntu 20.04","server_name":"Delta","datasource":"data\/network_traffic_edges.csv","uptime_days":60,"hardware_type":"Tower Server"},"4":{"primary_function":"Backup","hardware_type":"Rack Server","OS_version":"Red Hat 8.1","datasource":"data\/network_traffic_edges.csv","uptime_days":30,"server_name":"Echo"}},"update_history":{"0":[1693555200000,1693555260000,1693555320000,1693555500000,1693556400000],"1":[1693555200000,1693555500000,1693555800000,1693556700000],"2":[1693555500000,1693555800000,1693556400000,1693557000000,1693557060000,1693557120000],"3":[1693555800000,1693556100000,1693557000000,1693557060000,1693557120000],"4":[1693556100000,1693556400000,1693556700000]}} \ No newline at end of file diff --git a/python/tests/expected/dataframe_output/vertex_df_no_props.json b/python/tests/expected/dataframe_output/vertex_df_no_props.json new file mode 100644 index 0000000000..d388c1fde7 --- /dev/null +++ b/python/tests/expected/dataframe_output/vertex_df_no_props.json @@ -0,0 +1 @@ 
+{"id":{"0":"ServerA","1":"ServerB","2":"ServerC","3":"ServerD","4":"ServerE"},"update_history":{"0":[1693555200000,1693555260000,1693555320000,1693555500000,1693556400000],"1":[1693555200000,1693555500000,1693555800000,1693556700000],"2":[1693555500000,1693555800000,1693556400000,1693557000000,1693557060000,1693557120000],"3":[1693555800000,1693556100000,1693557000000,1693557060000,1693557120000],"4":[1693556100000,1693556400000,1693556700000]}} \ No newline at end of file diff --git a/python/tests/notebook.ipynb b/python/tests/notebook.ipynb index 2b65c528bb..fe85c71777 100644 --- a/python/tests/notebook.ipynb +++ b/python/tests/notebook.ipynb @@ -2,13 +2,14 @@ "cells": [ { "cell_type": "code", - "execution_count": 9, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ "import pandas as pd\n", "import matplotlib.pyplot as plt\n", - "import seaborn as sns" + "import seaborn as sns\n", + "import tempfile" ] }, { @@ -24,24 +25,13 @@ }, { "cell_type": "code", - "execution_count": 10, + "execution_count": null, "metadata": { "pycharm": { "name": "#%%\n" } }, - "outputs": [ - { - "data": { - "text/plain": [ - "Graph(number_of_edges=0, number_of_vertices=0, earliest_time=0, latest_time=0)" - ] - }, - "execution_count": 10, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "from raphtory import Graph\n", "g = Graph()\n", @@ -69,26 +59,9 @@ }, { "cell_type": "code", - "execution_count": 11, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "True True False\n", - "True False\n", - "1 3\n", - "True True False\n", - "True False\n", - "2 5\n", - "Vertex(name=Ben, properties={_id : Ben})\n", - "Edge(source=Haaroon, target=Hamza, earliest_time=7, latest_time=7, properties={property2 : 9.8, First-Met : 01/01/1990, property1 : 1, property3 : test})\n", - "Graph(number_of_edges=3, number_of_vertices=6, earliest_time=1, latest_time=8)\n", - "True\n" - ] 
- } - ], + "outputs": [], "source": [ "# Basic Addition with integer IDs\n", "g.add_vertex(timestamp=1,id=10)\n", @@ -99,7 +72,7 @@ "# checking edge 1,2 exists and 2,1 doesn't as Raphtory is directed\n", "print(g.has_edge(1,2),g.has_edge(2,1))\n", "# Check the total number of edges and vertices\n", - "print(g.num_edges(),g.num_vertices())\n", + "print(g.count_edges(),g.count_vertices())\n", "\n", "# Adding vertices and edges with String IDs\n", "g.add_vertex(timestamp=5,id=\"Ben\")\n", @@ -108,43 +81,33 @@ "# Performing the same checks as before, but with strings\n", "print(g.has_vertex(id=\"Ben\"), g.has_vertex(id=\"Hamza\"), g.has_vertex(id=\"Dave\"))\n", "print(g.has_edge(src=\"Hamza\",dst=\"Ben\"),g.has_edge(src=\"Ben\",dst=\"Hamza\"))\n", - "print(g.num_edges(),g.num_vertices())\n", + "print(g.count_edges(),g.count_vertices())\n", "\n", "#Add an edge with Temporal Properties which can change over time\n", - "g.add_edge(timestamp=7,src=\"Haaroon\",dst=\"Hamza\",properties={\"property1\": 1, \"property2\": 9.8, \"property3\": \"test\"})\n", + "e = g.add_edge(timestamp=7,src=\"Haaroon\",dst=\"Hamza\",properties={\"property1\": 1, \"property2\": 9.8, \"property3\": \"test\"})\n", "#Add a static property which is immutable\n", - "g.add_edge_properties(src=\"Haaroon\",dst=\"Hamza\",properties={\"First-Met\":\"01/01/1990\"})\n", + "e.add_constant_properties(properties={\"First-Met\":\"01/01/1990\"})\n", "\n", "#Add an vertex with Temporal Properties which can change over time\n", - "g.add_vertex(timestamp=5,id=\"Hamza\",properties= {\"property1\": 5, \"property2\": 12.5, \"property3\": \"test2\"})\n", + "v = g.add_vertex(timestamp=5,id=\"Hamza\",properties= {\"property1\": 5, \"property2\": 12.5, \"property3\": \"test2\"})\n", "#Add a static property which is immutable\n", - "g.add_vertex_properties(id=\"Hamza\",properties={\"Date-of-Birth\":\"01/01/1990\"})\n", + "v.add_constant_properties(properties={\"Date-of-Birth\":\"01/01/1990\"})\n", 
"print(g.vertex(\"Ben\").__repr__())\n", "print(g.edge(\"Haaroon\",\"Hamza\").__repr__())\n", "print(g.__repr__())\n", - "g.save_to_file(\"/tmp/graph\")\n", + "with tempfile.NamedTemporaryFile() as g_path:\n", + " g.save_to_file(g_path.name)\n", "\n", - "loaded_graph = Graph.load_from_file(\"/tmp/graph\")\n", + " loaded_graph = Graph.load_from_file(g_path.name)\n", "\n", - "print(loaded_graph.has_vertex(\"Hamza\"))" + " print(loaded_graph.has_vertex(\"Hamza\"))" ] }, { "cell_type": "code", - "execution_count": 12, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "image/png": "", - "text/plain": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ "from raphtory import graph_loader\n", "\n", @@ -153,47 +116,26 @@ "g.add_vertex(timestamp=0,id=\"Gandalf\",properties={\"Race\":\"Maiar\"})\n", "\n", "#view[\"Gandalf\"][\"Race\"]\n", - "from raphtory import vis\n", + "from raphtory import export\n", "\n", - "vis.to_networkx(view, k=20)" + "export.to_networkx(view)" ] }, { "cell_type": "code", - "execution_count": 13, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "" - ] - }, - "execution_count": 13, - "metadata": {}, - "output_type": "execute_result" - }, - { - "data": { - "image/png": "", - "text/plain": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ "from raphtory import graph_gen\n", "\n", - "g = Graph(4)\n", + "g = Graph()\n", "graph_gen.ba_preferential_attachment(g,vertices_to_add=1000,edges_per_step=10)\n", "view = g.window(0,1000)\n", "\n", "ids = []\n", "degrees = []\n", - "for v in view.vertices():\n", + "for v in view.vertices:\n", " ids.append(v.id)\n", " degrees.append(v.degree())\n", "\n", @@ -205,7 +147,7 @@ }, { "cell_type": "code", - "execution_count": 14, + "execution_count": null, "metadata": { "pycharm": { "name": "#%%\n" @@ -222,30 +164,9 @@ }, { "cell_type": "code", - "execution_count": 15, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "" - ] - }, - "execution_count": 15, - "metadata": {}, - "output_type": "execute_result" - }, - { - "data": { - "image/png": "", - "text/plain": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ "views = g.expanding(100)\n", "\n", @@ -255,10 +176,10 @@ "degree = []\n", "\n", "for view in views:\n", - " timestamps.append(view.latest_time())\n", + " timestamps.append(view.latest_time)\n", " #vertex_count.append(view.num_vertices()) \n", " #edge_count.append(view.num_edges())\n", - " degree.append(view.num_edges()/max(1,view.num_vertices())) \n", + " degree.append(view.count_edges()/max(1,view.count_vertices())) \n", " \n", "sns.set_context()\n", "ax = plt.gca()\n", @@ -270,30 +191,9 @@ }, { "cell_type": "code", - "execution_count": 16, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "" - ] - }, - "execution_count": 16, - "metadata": {}, - "output_type": "execute_result" - }, - { - "data": { - "image/png": "", - "text/plain": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ "views = g.expanding(step=10) \n", "\n", @@ -301,7 +201,7 @@ "degree = []\n", "\n", "for view in views:\n", - " timestamps.append(view.latest_time())\n", + " timestamps.append(view.latest_time)\n", " gandalf = view.vertex(\"Gandalf\")\n", " if(gandalf is not None):\n", " degree.append(gandalf.degree())\n", @@ -320,7 +220,7 @@ ], "metadata": { "kernelspec": { - "display_name": "raphtory", + "display_name": "Python 3 (ipykernel)", "language": "python", "name": "python3" }, @@ -334,7 +234,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.10.9" + "version": "3.11.2" }, "vscode": { "interpreter": { diff --git a/python/tests/test_graph_conversions.py b/python/tests/test_graph_conversions.py new file mode 100644 index 0000000000..b3cdedf581 --- /dev/null +++ b/python/tests/test_graph_conversions.py @@ -0,0 +1,1008 @@ +from raphtory import Graph +from raphtory import export +import pandas as pd +import json +from pathlib import Path + +base_dir = Path(__file__).parent + + +def build_graph(): + edges_df = pd.read_csv(base_dir / "data/network_traffic_edges.csv") + edges_df["timestamp"] = pd.to_datetime(edges_df["timestamp"]).astype( + "datetime64[ms, UTC]" + ) + + vertices_df = pd.read_csv(base_dir / "data/network_traffic_vertices.csv") + vertices_df["timestamp"] = pd.to_datetime(vertices_df["timestamp"]).astype( + "datetime64[ms, UTC]" + ) + + return Graph.load_from_pandas( + edges_df=edges_df, + src="source", + dst="destination", + time="timestamp", + props=["data_size_MB"], + layer_in_df="transaction_type", + const_props=["is_encrypted"], + shared_const_props={"datasource": "data/network_traffic_edges.csv"}, + vertex_df=vertices_df, + vertex_col="server_id", + vertex_time_col="timestamp", + vertex_props=["OS_version", "primary_function", "uptime_days"], + vertex_const_props=["server_name", "hardware_type"], + 
vertex_shared_const_props={"datasource": "data/network_traffic_edges.csv"}, + ) + + +def test_py_vis(): + g = build_graph() + pyvis_g = export.to_pyvis(g, directed=True) + + assert pyvis_g.nodes == [ + { + "color": "#97c2fc", + "id": 7678824742430955432, + "image": "https://cdn-icons-png.flaticon.com/512/7584/7584620.png", + "label": "ServerA", + "shape": "dot", + }, + { + "color": "#97c2fc", + "id": 7718004695861170879, + "image": "https://cdn-icons-png.flaticon.com/512/7584/7584620.png", + "label": "ServerB", + "shape": "dot", + }, + { + "color": "#97c2fc", + "id": 17918514325589227856, + "image": "https://cdn-icons-png.flaticon.com/512/7584/7584620.png", + "label": "ServerC", + "shape": "dot", + }, + { + "color": "#97c2fc", + "id": 14902018402467198225, + "image": "https://cdn-icons-png.flaticon.com/512/7584/7584620.png", + "label": "ServerD", + "shape": "dot", + }, + { + "color": "#97c2fc", + "id": 11577954539736240602, + "image": "https://cdn-icons-png.flaticon.com/512/7584/7584620.png", + "label": "ServerE", + "shape": "dot", + }, + ] + assert pyvis_g.edges == [ + { + "arrowStrikethrough": False, + "arrows": "to", + "color": "#000000", + "from": 7678824742430955432, + "title": "", + "to": 7718004695861170879, + "value": 1, + }, + { + "arrowStrikethrough": False, + "arrows": "to", + "color": "#000000", + "from": 7678824742430955432, + "title": "", + "to": 17918514325589227856, + "value": 1, + }, + { + "arrowStrikethrough": False, + "arrows": "to", + "color": "#000000", + "from": 7718004695861170879, + "title": "", + "to": 14902018402467198225, + "value": 1, + }, + { + "arrowStrikethrough": False, + "arrows": "to", + "color": "#000000", + "from": 17918514325589227856, + "title": "", + "to": 7678824742430955432, + "value": 1, + }, + { + "arrowStrikethrough": False, + "arrows": "to", + "color": "#000000", + "from": 14902018402467198225, + "title": "", + "to": 17918514325589227856, + "value": 1, + }, + { + "arrowStrikethrough": False, + "arrows": "to", + "color": 
"#000000", + "from": 14902018402467198225, + "title": "", + "to": 11577954539736240602, + "value": 1, + }, + { + "arrowStrikethrough": False, + "arrows": "to", + "color": "#000000", + "from": 11577954539736240602, + "title": "", + "to": 7718004695861170879, + "value": 1, + }, + ] + + +def test_networkx_full_history(): + g = build_graph() + + networkxGraph = export.to_networkx(g) + assert networkxGraph.number_of_nodes() == 5 + assert networkxGraph.number_of_edges() == 7 + + nodeList = list(networkxGraph.nodes(data=True)) + server_list = [ + ( + "ServerA", + { + "OS_version": [ + (1693555200000, "Ubuntu 20.04"), + (1693555260000, "Ubuntu 20.04"), + (1693555320000, "Ubuntu 20.04"), + ], + "datasource": "data/network_traffic_edges.csv", + "hardware_type": "Blade Server", + "primary_function": [ + (1693555200000, "Database"), + (1693555260000, "Database"), + (1693555320000, "Database"), + ], + "server_name": "Alpha", + "update_history": [ + 1693555200000, + 1693555260000, + 1693555320000, + 1693555500000, + 1693556400000, + ], + "uptime_days": [ + (1693555200000, 120), + (1693555260000, 121), + (1693555320000, 122), + ], + }, + ), + ( + "ServerB", + { + "OS_version": [(1693555500000, "Red Hat 8.1")], + "datasource": "data/network_traffic_edges.csv", + "hardware_type": "Rack Server", + "primary_function": [(1693555500000, "Web Server")], + "server_name": "Beta", + "update_history": [ + 1693555200000, + 1693555500000, + 1693555800000, + 1693556700000, + ], + "uptime_days": [(1693555500000, 45)], + }, + ), + ( + "ServerC", + { + "OS_version": [(1693555800000, "Windows Server 2022")], + "datasource": "data/network_traffic_edges.csv", + "hardware_type": "Blade Server", + "primary_function": [(1693555800000, "File Storage")], + "server_name": "Charlie", + "update_history": [ + 1693555500000, + 1693555800000, + 1693556400000, + 1693557000000, + 1693557060000, + 1693557120000, + ], + "uptime_days": [(1693555800000, 90)], + }, + ), + ( + "ServerD", + { + "OS_version": 
[(1693556100000, "Ubuntu 20.04")], + "datasource": "data/network_traffic_edges.csv", + "hardware_type": "Tower Server", + "primary_function": [(1693556100000, "Application Server")], + "server_name": "Delta", + "update_history": [ + 1693555800000, + 1693556100000, + 1693557000000, + 1693557060000, + 1693557120000, + ], + "uptime_days": [(1693556100000, 60)], + }, + ), + ( + "ServerE", + { + "OS_version": [(1693556400000, "Red Hat 8.1")], + "datasource": "data/network_traffic_edges.csv", + "hardware_type": "Rack Server", + "primary_function": [(1693556400000, "Backup")], + "server_name": "Echo", + "update_history": [1693556100000, 1693556400000, 1693556700000], + "uptime_days": [(1693556400000, 30)], + }, + ), + ] + assert nodeList == server_list + + edgeList = list(networkxGraph.edges(data=True)) + resultList = [ + ( + "ServerA", + "ServerB", + { + "data_size_MB": [(1693555200000, 5.6)], + "datasource": "data/network_traffic_edges.csv", + "is_encrypted": True, + "layer": "Critical System Request", + "update_history": [1693555200000], + }, + ), + ( + "ServerA", + "ServerC", + { + "data_size_MB": [(1693555500000, 7.1)], + "datasource": "data/network_traffic_edges.csv", + "is_encrypted": False, + "layer": "File Transfer", + "update_history": [1693555500000], + }, + ), + ( + "ServerB", + "ServerD", + { + "data_size_MB": [(1693555800000, 3.2)], + "datasource": "data/network_traffic_edges.csv", + "is_encrypted": True, + "layer": "Standard Service Request", + "update_history": [1693555800000], + }, + ), + ( + "ServerC", + "ServerA", + { + "data_size_MB": [(1693556400000, 4.5)], + "datasource": "data/network_traffic_edges.csv", + "is_encrypted": True, + "layer": "Critical System Request", + "update_history": [1693556400000], + }, + ), + ( + "ServerD", + "ServerC", + { + "data_size_MB": [ + (1693557000000, 5.0), + (1693557060000, 10.0), + (1693557120000, 15.0), + ], + "datasource": "data/network_traffic_edges.csv", + "is_encrypted": True, + "layer": "Standard Service 
Request", + "update_history": [1693557000000, 1693557060000, 1693557120000], + }, + ), + ( + "ServerD", + "ServerE", + { + "data_size_MB": [(1693556100000, 8.9)], + "datasource": "data/network_traffic_edges.csv", + "is_encrypted": False, + "layer": "Administrative Command", + "update_history": [1693556100000], + }, + ), + ( + "ServerE", + "ServerB", + { + "data_size_MB": [(1693556700000, 6.2)], + "datasource": "data/network_traffic_edges.csv", + "is_encrypted": False, + "layer": "File Transfer", + "update_history": [1693556700000], + }, + ), + ] + assert edgeList == resultList + + +def test_networkx_exploded(): + g = build_graph() + + networkxGraph = export.to_networkx(g, explode_edges=True) + assert networkxGraph.number_of_nodes() == 5 + assert networkxGraph.number_of_edges() == 9 + + edgeList = list(networkxGraph.edges(data=True)) + resultList = [ + ( + "ServerA", + "ServerB", + { + "data_size_MB": [(1693555200000, 5.6)], + "datasource": "data/network_traffic_edges.csv", + "is_encrypted": True, + "layer": "Critical System Request", + "update_history": 1693555200000, + }, + ), + ( + "ServerA", + "ServerC", + { + "data_size_MB": [(1693555500000, 7.1)], + "datasource": "data/network_traffic_edges.csv", + "is_encrypted": False, + "layer": "File Transfer", + "update_history": 1693555500000, + }, + ), + ( + "ServerB", + "ServerD", + { + "data_size_MB": [(1693555800000, 3.2)], + "datasource": "data/network_traffic_edges.csv", + "is_encrypted": True, + "layer": "Standard Service Request", + "update_history": 1693555800000, + }, + ), + ( + "ServerC", + "ServerA", + { + "data_size_MB": [(1693556400000, 4.5)], + "datasource": "data/network_traffic_edges.csv", + "is_encrypted": True, + "layer": "Critical System Request", + "update_history": 1693556400000, + }, + ), + ( + "ServerD", + "ServerC", + { + "data_size_MB": [(1693557000000, 5.0)], + "datasource": "data/network_traffic_edges.csv", + "is_encrypted": True, + "layer": "Standard Service Request", + "update_history": 
1693557000000, + }, + ), + ( + "ServerD", + "ServerC", + { + "data_size_MB": [(1693557060000, 10.0)], + "datasource": "data/network_traffic_edges.csv", + "is_encrypted": True, + "layer": "Standard Service Request", + "update_history": 1693557060000, + }, + ), + ( + "ServerD", + "ServerC", + { + "data_size_MB": [(1693557120000, 15.0)], + "datasource": "data/network_traffic_edges.csv", + "is_encrypted": True, + "layer": "Standard Service Request", + "update_history": 1693557120000, + }, + ), + ( + "ServerD", + "ServerE", + { + "data_size_MB": [(1693556100000, 8.9)], + "datasource": "data/network_traffic_edges.csv", + "is_encrypted": False, + "layer": "Administrative Command", + "update_history": 1693556100000, + }, + ), + ( + "ServerE", + "ServerB", + { + "data_size_MB": [(1693556700000, 6.2)], + "datasource": "data/network_traffic_edges.csv", + "is_encrypted": False, + "layer": "File Transfer", + "update_history": 1693556700000, + }, + ), + ] + assert edgeList == resultList + + +def test_networkx_no_props(): + g = build_graph() + + networkxGraph = export.to_networkx( + g, include_vertex_properties=False, include_edge_properties=False + ) + + nodeList = list(networkxGraph.nodes(data=True)) + resultList = [ + ( + "ServerA", + { + "update_history": [ + 1693555200000, + 1693555260000, + 1693555320000, + 1693555500000, + 1693556400000, + ] + }, + ), + ( + "ServerB", + { + "update_history": [ + 1693555200000, + 1693555500000, + 1693555800000, + 1693556700000, + ] + }, + ), + ( + "ServerC", + { + "update_history": [ + 1693555500000, + 1693555800000, + 1693556400000, + 1693557000000, + 1693557060000, + 1693557120000, + ] + }, + ), + ( + "ServerD", + { + "update_history": [ + 1693555800000, + 1693556100000, + 1693557000000, + 1693557060000, + 1693557120000, + ] + }, + ), + ("ServerE", {"update_history": [1693556100000, 1693556400000, 1693556700000]}), + ] + assert nodeList == resultList + + edgeList = list(networkxGraph.edges(data=True)) + resultList = [ + ( + "ServerA", + 
"ServerB", + {"layer": "Critical System Request", "update_history": [1693555200000]}, + ), + ( + "ServerA", + "ServerC", + {"layer": "File Transfer", "update_history": [1693555500000]}, + ), + ( + "ServerB", + "ServerD", + {"layer": "Standard Service Request", "update_history": [1693555800000]}, + ), + ( + "ServerC", + "ServerA", + {"layer": "Critical System Request", "update_history": [1693556400000]}, + ), + ( + "ServerD", + "ServerC", + { + "layer": "Standard Service Request", + "update_history": [1693557000000, 1693557060000, 1693557120000], + }, + ), + ( + "ServerD", + "ServerE", + {"layer": "Administrative Command", "update_history": [1693556100000]}, + ), + ( + "ServerE", + "ServerB", + {"layer": "File Transfer", "update_history": [1693556700000]}, + ), + ] + assert edgeList == resultList + + networkxGraph = export.to_networkx( + g, + include_vertex_properties=False, + include_edge_properties=False, + include_update_history=False, + ) + + nodeList = list(networkxGraph.nodes(data=True)) + resultList = [ + ("ServerA", {}), + ("ServerB", {}), + ("ServerC", {}), + ("ServerD", {}), + ("ServerE", {}), + ] + assert nodeList == resultList + + edgeList = list(networkxGraph.edges(data=True)) + resultList = [ + ("ServerA", "ServerB", {"layer": "Critical System Request"}), + ("ServerA", "ServerC", {"layer": "File Transfer"}), + ("ServerB", "ServerD", {"layer": "Standard Service Request"}), + ("ServerC", "ServerA", {"layer": "Critical System Request"}), + ("ServerD", "ServerC", {"layer": "Standard Service Request"}), + ("ServerD", "ServerE", {"layer": "Administrative Command"}), + ("ServerE", "ServerB", {"layer": "File Transfer"}), + ] + assert edgeList == resultList + + networkxGraph = export.to_networkx( + g, include_edge_properties=False, explode_edges=True + ) + edgeList = list(networkxGraph.edges(data=True)) + resultList = [ + ( + "ServerA", + "ServerB", + {"layer": "Critical System Request", "update_history": 1693555200000}, + ), + ( + "ServerA", + "ServerC", + 
{"layer": "File Transfer", "update_history": 1693555500000}, + ), + ( + "ServerB", + "ServerD", + {"layer": "Standard Service Request", "update_history": 1693555800000}, + ), + ( + "ServerC", + "ServerA", + {"layer": "Critical System Request", "update_history": 1693556400000}, + ), + ( + "ServerD", + "ServerC", + {"layer": "Standard Service Request", "update_history": 1693557000000}, + ), + ( + "ServerD", + "ServerC", + {"layer": "Standard Service Request", "update_history": 1693557060000}, + ), + ( + "ServerD", + "ServerC", + {"layer": "Standard Service Request", "update_history": 1693557120000}, + ), + ( + "ServerD", + "ServerE", + {"layer": "Administrative Command", "update_history": 1693556100000}, + ), + ( + "ServerE", + "ServerB", + {"layer": "File Transfer", "update_history": 1693556700000}, + ), + ] + assert edgeList == resultList + + +def test_networkx_no_history(): + g = build_graph() + + networkxGraph = export.to_networkx( + g, include_property_histories=False, include_update_history=False + ) + + nodeList = list(networkxGraph.nodes(data=True)) + resultList = [ + ( + "ServerA", + { + "OS_version": "Ubuntu 20.04", + "datasource": "data/network_traffic_edges.csv", + "hardware_type": "Blade Server", + "primary_function": "Database", + "server_name": "Alpha", + "uptime_days": 122, + }, + ), + ( + "ServerB", + { + "OS_version": "Red Hat 8.1", + "datasource": "data/network_traffic_edges.csv", + "hardware_type": "Rack Server", + "primary_function": "Web Server", + "server_name": "Beta", + "uptime_days": 45, + }, + ), + ( + "ServerC", + { + "OS_version": "Windows Server 2022", + "datasource": "data/network_traffic_edges.csv", + "hardware_type": "Blade Server", + "primary_function": "File Storage", + "server_name": "Charlie", + "uptime_days": 90, + }, + ), + ( + "ServerD", + { + "OS_version": "Ubuntu 20.04", + "datasource": "data/network_traffic_edges.csv", + "hardware_type": "Tower Server", + "primary_function": "Application Server", + "server_name": "Delta", + 
"uptime_days": 60, + }, + ), + ( + "ServerE", + { + "OS_version": "Red Hat 8.1", + "datasource": "data/network_traffic_edges.csv", + "hardware_type": "Rack Server", + "primary_function": "Backup", + "server_name": "Echo", + "uptime_days": 30, + }, + ), + ] + assert nodeList == resultList + + edgeList = list(networkxGraph.edges(data=True)) + resultList = [ + ( + "ServerA", + "ServerB", + { + "data_size_MB": 5.6, + "datasource": "data/network_traffic_edges.csv", + "is_encrypted": True, + "layer": "Critical System Request", + }, + ), + ( + "ServerA", + "ServerC", + { + "data_size_MB": 7.1, + "datasource": "data/network_traffic_edges.csv", + "is_encrypted": False, + "layer": "File Transfer", + }, + ), + ( + "ServerB", + "ServerD", + { + "data_size_MB": 3.2, + "datasource": "data/network_traffic_edges.csv", + "is_encrypted": True, + "layer": "Standard Service Request", + }, + ), + ( + "ServerC", + "ServerA", + { + "data_size_MB": 4.5, + "datasource": "data/network_traffic_edges.csv", + "is_encrypted": True, + "layer": "Critical System Request", + }, + ), + ( + "ServerD", + "ServerC", + { + "data_size_MB": 15.0, + "datasource": "data/network_traffic_edges.csv", + "is_encrypted": True, + "layer": "Standard Service Request", + }, + ), + ( + "ServerD", + "ServerE", + { + "data_size_MB": 8.9, + "datasource": "data/network_traffic_edges.csv", + "is_encrypted": False, + "layer": "Administrative Command", + }, + ), + ( + "ServerE", + "ServerB", + { + "data_size_MB": 6.2, + "datasource": "data/network_traffic_edges.csv", + "is_encrypted": False, + "layer": "File Transfer", + }, + ), + ] + assert edgeList == resultList + + networkxGraph = export.to_networkx( + g, include_property_histories=False, explode_edges=True + ) + edgeList = list(networkxGraph.edges(data=True)) + resultList = [ + ( + "ServerA", + "ServerB", + { + "data_size_MB": 5.6, + "datasource": "data/network_traffic_edges.csv", + "is_encrypted": True, + "layer": "Critical System Request", + "update_history": 
1693555200000, + }, + ), + ( + "ServerA", + "ServerC", + { + "data_size_MB": 7.1, + "datasource": "data/network_traffic_edges.csv", + "is_encrypted": False, + "layer": "File Transfer", + "update_history": 1693555500000, + }, + ), + ( + "ServerB", + "ServerD", + { + "data_size_MB": 3.2, + "datasource": "data/network_traffic_edges.csv", + "is_encrypted": True, + "layer": "Standard Service Request", + "update_history": 1693555800000, + }, + ), + ( + "ServerC", + "ServerA", + { + "data_size_MB": 4.5, + "datasource": "data/network_traffic_edges.csv", + "is_encrypted": True, + "layer": "Critical System Request", + "update_history": 1693556400000, + }, + ), + ( + "ServerD", + "ServerC", + { + "data_size_MB": 5.0, + "datasource": "data/network_traffic_edges.csv", + "is_encrypted": True, + "layer": "Standard Service Request", + "update_history": 1693557000000, + }, + ), + ( + "ServerD", + "ServerC", + { + "data_size_MB": 10.0, + "datasource": "data/network_traffic_edges.csv", + "is_encrypted": True, + "layer": "Standard Service Request", + "update_history": 1693557060000, + }, + ), + ( + "ServerD", + "ServerC", + { + "data_size_MB": 15.0, + "datasource": "data/network_traffic_edges.csv", + "is_encrypted": True, + "layer": "Standard Service Request", + "update_history": 1693557120000, + }, + ), + ( + "ServerD", + "ServerE", + { + "data_size_MB": 8.9, + "datasource": "data/network_traffic_edges.csv", + "is_encrypted": False, + "layer": "Administrative Command", + "update_history": 1693556100000, + }, + ), + ( + "ServerE", + "ServerB", + { + "data_size_MB": 6.2, + "datasource": "data/network_traffic_edges.csv", + "is_encrypted": False, + "layer": "File Transfer", + "update_history": 1693556700000, + }, + ), + ] + assert edgeList == resultList + + +def save_df_to_json(df, filename): + df.to_json(filename) + # Below is if you want to pretty print the json + # json_str = df.to_json() + # parsed = json.loads(json_str) + # with open(filename, "w") as f: + # json.dump(parsed, f, 
indent=4) + + +# DO NOT RUN UNLESS RECREATING THE OUTPUT +def build_to_df(): + g = build_graph() + + edge_df = export.to_edge_df(g) + save_df_to_json(edge_df, "expected/dataframe_output/edge_df_all.json") + edge_df = export.to_edge_df(g, include_edge_properties=False) + save_df_to_json(edge_df, "expected/dataframe_output/edge_df_no_props.json") + edge_df = export.to_edge_df(g, include_update_history=False) + save_df_to_json(edge_df, "expected/dataframe_output/edge_df_no_hist.json") + edge_df = export.to_edge_df(g, include_property_histories=False) + save_df_to_json(edge_df, "expected/dataframe_output/edge_df_no_prop_hist.json") + + edge_df = export.to_edge_df(g, explode_edges=True) + save_df_to_json(edge_df, "expected/dataframe_output/edge_df_exploded.json") + edge_df = export.to_edge_df(g, explode_edges=True, include_edge_properties=False) + save_df_to_json(edge_df, "expected/dataframe_output/edge_df_exploded_no_props.json") + edge_df = export.to_edge_df(g, explode_edges=True, include_update_history=False) + save_df_to_json(edge_df, "expected/dataframe_output/edge_df_exploded_no_hist.json") + edge_df = export.to_edge_df(g, explode_edges=True, include_property_histories=False) + save_df_to_json( + edge_df, "expected/dataframe_output/edge_df_exploded_no_prop_hist.json" + ) + + vertex_df = export.to_vertex_df(g) + save_df_to_json(vertex_df, "expected/dataframe_output/vertex_df_all.json") + vertex_df = export.to_vertex_df(g, include_vertex_properties=False) + save_df_to_json(vertex_df, "expected/dataframe_output/vertex_df_no_props.json") + vertex_df = export.to_vertex_df(g, include_update_history=False) + save_df_to_json(vertex_df, "expected/dataframe_output/vertex_df_no_hist.json") + vertex_df = export.to_vertex_df(g, include_property_histories=False) + save_df_to_json(vertex_df, "expected/dataframe_output/vertex_df_no_prop_hist.json") + + +def compare_df(df1, df2): + # Have to do this way due to the number of maps inside the dataframes + s1 = df1.to_json() + s2 = 
df2.to_json() + data1 = json.loads(s1) + data2 = json.loads(s2) + assert data1 == data2 + + +def test_to_df(): + g = build_graph() + + compare_df( + export.to_edge_df(g), + pd.read_json(base_dir / "expected/dataframe_output/edge_df_all.json"), + ) + + compare_df( + export.to_edge_df(g, include_edge_properties=False), + pd.read_json(base_dir / "expected/dataframe_output/edge_df_no_props.json"), + ) + + compare_df( + export.to_edge_df(g, include_update_history=False), + pd.read_json(base_dir / "expected/dataframe_output/edge_df_no_hist.json"), + ) + + compare_df( + export.to_edge_df(g, include_property_histories=False), + pd.read_json(base_dir / "expected/dataframe_output/edge_df_no_prop_hist.json"), + ) + + compare_df( + export.to_edge_df(g, explode_edges=True), + pd.read_json(base_dir / "expected/dataframe_output/edge_df_exploded.json"), + ) + compare_df( + export.to_edge_df(g, explode_edges=True, include_edge_properties=False), + pd.read_json( + base_dir / "expected/dataframe_output/edge_df_exploded_no_props.json" + ), + ) + + compare_df( + export.to_edge_df(g, explode_edges=True, include_update_history=False), + pd.read_json( + base_dir / "expected/dataframe_output/edge_df_exploded_no_hist.json" + ), + ) + + compare_df( + export.to_edge_df(g, explode_edges=True, include_property_histories=False), + pd.read_json( + base_dir / "expected/dataframe_output/edge_df_exploded_no_prop_hist.json" + ), + ) + + compare_df( + export.to_vertex_df(g), + pd.read_json(base_dir / "expected/dataframe_output/vertex_df_all.json"), + ) + compare_df( + export.to_vertex_df(g, include_vertex_properties=False), + pd.read_json(base_dir / "expected/dataframe_output/vertex_df_no_props.json"), + ) + compare_df( + export.to_vertex_df(g, include_update_history=False), + pd.read_json(base_dir / "expected/dataframe_output/vertex_df_no_hist.json"), + ) + compare_df( + export.to_vertex_df(g, include_property_histories=False), + pd.read_json( + base_dir / 
"expected/dataframe_output/vertex_df_no_prop_hist.json" + ), + ) diff --git a/python/tests/test_graphdb.py b/python/tests/test_graphdb.py index aed3939434..89eef86330 100644 --- a/python/tests/test_graphdb.py +++ b/python/tests/test_graphdb.py @@ -1,60 +1,68 @@ -import re +import math import sys -import time -import datetime +import pandas as pd +import pandas.core.frame import pytest -from raphtory import Graph +from raphtory import Graph, GraphWithDeletions, PyDirection from raphtory import algorithms from raphtory import graph_loader import tempfile from math import isclose import datetime -def create_graph(num_shards): - g = Graph(num_shards) - edges = [ - (1, 1, 2), - (2, 1, 3), - (-1, 2, 1), - (0, 1, 1), - (7, 3, 2), - (1, 1, 1) - ] +edges = [(1, 1, 2), (2, 1, 3), (-1, 2, 1), (0, 1, 1), (7, 3, 2), (1, 1, 1)] + + +def create_graph(): + g = Graph() g.add_vertex(0, 1, {"type": "wallet", "cost": 99.5}) g.add_vertex(-1, 2, {"type": "wallet", "cost": 10.0}) - g.add_vertex(6, 3, {"type": "wallet", "cost": 76}) + g.add_vertex(6, 3, {"type": "wallet", "cost": 76.0}) for e in edges: - g.add_edge(e[0], e[1], e[2], {"prop1": 1, - "prop2": 9.8, "prop3": "test"}) + g.add_edge(e[0], e[1], e[2], {"prop1": 1, "prop2": 9.8, "prop3": "test"}) + + return g + + +def create_graph_with_deletions(): + g = GraphWithDeletions() + + g.add_vertex(0, 1, {"type": "wallet", "cost": 99.5}) + g.add_vertex(-1, 2, {"type": "wallet", "cost": 10.0}) + g.add_vertex(6, 3, {"type": "wallet", "cost": 76.0}) + for e in edges: + g.add_edge(e[0], e[1], e[2], {"prop1": 1, "prop2": 9.8, "prop3": "test"}) + g.edge(edges[0][1], edges[0][2]).add_constant_properties({"static": "test"}) + g.delete_edge(10, edges[0][1], edges[0][2]) return g def test_graph_len_edge_len(): - g = create_graph(2) + g = create_graph() - assert g.num_vertices() == 3 - assert g.num_edges() == 5 + assert g.count_vertices() == 3 + assert g.count_edges() == 5 def test_id_iterable(): - g = create_graph(2) + g = create_graph() - assert 
g.vertices.id().max() == 3 - assert g.vertices.id().min() == 1 - assert set(g.vertices.id().collect()) == {1, 2, 3} - out_neighbours = g.vertices.out_neighbours().id().collect() + assert g.vertices.id.max() == 3 + assert g.vertices.id.min() == 1 + assert set(g.vertices.id.collect()) == {1, 2, 3} + out_neighbours = g.vertices.out_neighbours.id.collect() out_neighbours = (set(n) for n in out_neighbours) - out_neighbours = dict(zip(g.vertices.id(), out_neighbours)) + out_neighbours = dict(zip(g.vertices.id, out_neighbours)) assert out_neighbours == {1: {1, 2, 3}, 2: {1}, 3: {2}} def test_degree_iterable(): - g = create_graph(2) + g = create_graph() assert g.vertices.degree().min() == 2 assert g.vertices.degree().max() == 3 assert g.vertices.in_degree().min() == 1 @@ -69,14 +77,14 @@ def test_degree_iterable(): def test_vertices_time_iterable(): - g = create_graph(2) + g = create_graph() - assert g.vertices.earliest_time().min() == -1 - assert g.vertices.latest_time().max() == 7 + assert g.vertices.earliest_time.min() == -1 + assert g.vertices.latest_time.max() == 7 def test_graph_has_edge(): - g = create_graph(2) + g = create_graph() assert not g.window(-1, 1).has_edge(1, 3) assert g.window(-1, 3).has_edge(1, 3) @@ -84,213 +92,347 @@ def test_graph_has_edge(): def test_graph_has_vertex(): - g = create_graph(2) + g = create_graph() assert g.has_vertex(3) def test_windowed_graph_has_vertex(): - g = create_graph(2) + g = create_graph() assert g.window(-1, 1).has_vertex(1) def test_windowed_graph_get_vertex(): - g = create_graph(2) + g = create_graph() view = g.window(0, sys.maxsize) - assert view.vertex(1).id() == 1 + assert view.vertex(1).id == 1 assert view.vertex(10) is None assert view.vertex(1).degree() == 3 def test_windowed_graph_degree(): - g = create_graph(3) + g = create_graph() view = g.window(0, sys.maxsize) - degrees = [v.degree() for v in view.vertices()] + degrees = [v.degree() for v in view.vertices] degrees.sort() assert degrees == [2, 2, 3] - in_degrees 
= [v.in_degree() for v in view.vertices()] + in_degrees = [v.in_degree() for v in view.vertices] in_degrees.sort() assert in_degrees == [1, 1, 2] - out_degrees = [v.out_degree() for v in view.vertices()] + out_degrees = [v.out_degree() for v in view.vertices] out_degrees.sort() assert out_degrees == [0, 1, 3] def test_windowed_graph_get_edge(): - g = create_graph(2) + g = create_graph() max_size = sys.maxsize min_size = -sys.maxsize - 1 view = g.window(min_size, max_size) - assert (view.edge(1, 3).src().id(), view.edge(1, 3).dst().id()) == (1, 3) - assert view.edge(2, 3) == None - assert view.edge(6, 5) == None + assert (view.edge(1, 3).src.id, view.edge(1, 3).dst.id) == (1, 3) + assert view.edge(2, 3) is None + assert view.edge(6, 5) is None - assert (view.vertex(1).id(), view.vertex(3).id()) == (1, 3) + assert (view.vertex(1).id, view.vertex(3).id) == (1, 3) view = g.window(2, 3) - assert (view.edge(1, 3).src().id(), view.edge(1, 3).dst().id()) == (1, 3) + assert (view.edge(1, 3).src.id, view.edge(1, 3).dst.id) == (1, 3) view = g.window(3, 7) - assert view.edge(1, 3) == None + assert view.edge(1, 3) is None def test_windowed_graph_edges(): - g = create_graph(1) + g = create_graph() view = g.window(0, sys.maxsize) - tedges = [v.edges() for v in view.vertices()] + tedges = [v.edges for v in view.vertices] edges = [] for e_iter in tedges: for e in e_iter: - edges.append([e.src().id(), e.dst().id()]) + edges.append([e.src.id, e.dst.id]) - assert edges == [ - [1, 1], - [1, 1], - [1, 2], - [1, 3], - [1, 2], - [3, 2], - [1, 3], - [3, 2] - ] + assert edges == [[1, 1], [1, 1], [1, 2], [1, 3], [1, 2], [3, 2], [1, 3], [3, 2]] - tedges = [v.in_edges() for v in view.vertices()] + tedges = [v.in_edges for v in view.vertices] in_edges = [] for e_iter in tedges: for e in e_iter: - in_edges.append([e.src().id(), e.dst().id()]) + in_edges.append([e.src.id, e.dst.id]) - assert in_edges == [ - [1, 1], - [1, 2], - [3, 2], - [1, 3] - ] + assert in_edges == [[1, 1], [1, 2], [3, 2], [1, 
3]] - tedges = [v.out_edges() for v in view.vertices()] + tedges = [v.out_edges for v in view.vertices] out_edges = [] for e_iter in tedges: for e in e_iter: - out_edges.append([e.src().id(), e.dst().id()]) + out_edges.append([e.src.id, e.dst.id]) - assert out_edges == [ - [1, 1], - [1, 2], - [1, 3], - [3, 2] - ] + assert out_edges == [[1, 1], [1, 2], [1, 3], [3, 2]] def test_windowed_graph_vertex_ids(): - g = create_graph(3) + g = create_graph() - vs = [v for v in g.window(-1, 2).vertices().id()] + vs = [v for v in g.window(-1, 2).vertices.id] vs.sort() assert vs == [1, 2] # this makes clear that the end of the range is exclusive - vs = [v for v in g.window(-5, 3).vertices().id()] + vs = [v for v in g.window(-5, 3).vertices.id] vs.sort() assert vs == [1, 2, 3] def test_windowed_graph_vertices(): - g = create_graph(1) + g = create_graph() view = g.window(-1, 0) - vertices = list(view.vertices().id()) + vertices = list(view.vertices.id) assert vertices == [1, 2] def test_windowed_graph_neighbours(): - g = create_graph(1) + g = create_graph() max_size = sys.maxsize min_size = -sys.maxsize - 1 view = g.window(min_size, max_size) - neighbours = view.vertices.neighbours().id().collect() + neighbours = view.vertices.neighbours.id.collect() assert neighbours == [[1, 2, 3], [1, 3], [1, 2]] - in_neighbours = view.vertices.in_neighbours().id().collect() + in_neighbours = view.vertices.in_neighbours.id.collect() assert in_neighbours == [[1, 2], [1, 3], [1]] - out_neighbours = view.vertices.out_neighbours().id().collect() + out_neighbours = view.vertices.out_neighbours.id.collect() assert out_neighbours == [[1, 2, 3], [1], [2]] def test_name(): - # Currently deadlocking g = Graph() g.add_vertex(1, "Ben") g.add_vertex(1, 10) g.add_edge(1, "Ben", "Hamza") - assert g.vertex(10).name() == "10" - assert g.vertex("Ben").name() == "Ben" + assert g.vertex(10).name == "10" + assert g.vertex("Ben").name == "Ben" + assert g.vertex("Hamza").name == "Hamza" + + +def test_getitem(): + g = 
Graph() + g.add_vertex(0, 1, {"cost": 0}) + g.add_vertex(1, 1, {"cost": 1}) + + assert ( + g.vertex(1).properties.temporal.get("cost") + == g.vertex(1).properties.temporal["cost"] + ) + + +def test_graph_properties(): + g = create_graph() + + props = {"prop 1": 1, "prop 2": "hi", "prop 3": True} + g.add_constant_properties(props) + + sp = g.properties.constant.keys() + sp.sort() + assert sp == ["prop 1", "prop 2", "prop 3"] + assert g.properties["prop 1"] == 1 + + props = {"prop 4": 11, "prop 5": "world", "prop 6": False} + g.add_property(1, props) + + props = {"prop 6": True} + g.add_property(2, props) + + def history_test(key, value): + if value is None: + assert g.properties.temporal.get(key) is None + else: + assert g.properties.temporal.get(key).items() == value + + history_test("prop 1", None) + history_test("prop 2", None) + history_test("prop 3", None) + history_test("prop 4", [(1, 11)]) + history_test("prop 5", [(1, "world")]) + history_test("prop 6", [(1, False), (2, True)]) + history_test("undefined", None) + + def time_history_test(time, key, value): + if value is None: + assert g.at(time).properties.temporal.get(key) is None + else: + assert g.at(time).properties.temporal.get(key).items() == value + + time_history_test(2, "prop 6", [(1, False), (2, True)]) + time_history_test(1, "static prop", None) + + def time_static_property_test(time, key, value): + assert g.at(time).properties.constant.get(key) == value + + def static_property_test(key, value): + assert g.properties.constant.get(key) == value + + time_static_property_test(1, "prop 1", 1) + time_static_property_test(100, "prop 1", 1) + static_property_test("prop 1", 1) + static_property_test("prop 3", True) + + # testing property + def time_property_test(time, key, value): + assert g.at(time).properties.get(key) == value + + def property_test(key, value): + assert g.properties.get(key) == value + + static_property_test("prop 2", "hi") + property_test("prop 2", "hi") + time_static_property_test(2, 
"prop 3", True) + time_property_test(2, "prop 3", True) + + # testing properties + assert g.properties.as_dict() == { + "prop 1": 1, + "prop 2": "hi", + "prop 3": True, + "prop 4": 11, + "prop 5": "world", + "prop 6": True, + } + + assert g.properties.temporal.latest() == { + "prop 4": 11, + "prop 5": "world", + "prop 6": True, + } + assert g.at(2).properties.as_dict() == { + "prop 1": 1, + "prop 2": "hi", + "prop 3": True, + "prop 4": 11, + "prop 5": "world", + "prop 6": True, + } + # testing property histories + assert g.properties.temporal.histories() == { + "prop 4": [(1, 11)], + "prop 5": [(1, "world")], + "prop 6": [(1, False), (2, True)], + } + + assert g.at(2).properties.temporal.histories() == { + "prop 4": [(1, 11)], + "prop 5": [(1, "world")], + "prop 6": [(1, False), (2, True)], + } + + # testing property names + expected_names = sorted( + ["prop 1", "prop 2", "prop 3", "prop 4", "prop 5", "prop 6"] + ) + assert sorted(g.properties.keys()) == expected_names + + expected_names_no_static = sorted(["prop 4", "prop 5", "prop 6"]) + assert sorted(g.properties.temporal.keys()) == expected_names_no_static -# assert g.vertex("Hamza").name() == "Hamza" TODO need to fix + assert sorted(g.at(1).properties.temporal.keys()) == expected_names_no_static + + # testing has_property + assert "prop 4" in g.properties + assert "prop 7" not in g.properties + assert "prop 7" not in g.at(1).properties + assert "prop 1" in g.properties + assert "prop 2" in g.at(1).properties + assert "static prop" not in g.properties.constant def test_vertex_properties(): g = Graph() g.add_edge(1, 1, 1) props_t1 = {"prop 1": 1, "prop 3": "hi", "prop 4": True} - g.add_vertex(1, 1, props_t1) + v = g.add_vertex(1, 1, props_t1) props_t2 = {"prop 1": 2, "prop 2": 0.6, "prop 4": False} - g.add_vertex(2, 1, props_t2) + v.add_updates(2, props_t2) props_t3 = {"prop 2": 0.9, "prop 3": "hello", "prop 4": True} - g.add_vertex(3, 1, props_t3) + v.add_updates(3, props_t3) + 
v.add_constant_properties({"static prop": 123}) - g.add_vertex_properties(1, {"static prop": 123}) - - # testing property_history + # testing property history def history_test(key, value): - assert g.vertex(1).property_history(key) == value - assert g.vertices.property_history(key).collect() == [value] - assert g.vertices.out_neighbours().property_history(key).collect() == [[value]] + if value is None: + assert g.vertex(1).properties.temporal.get(key) is None + assert g.vertices.properties.temporal.get(key) is None + assert g.vertices.out_neighbours.properties.temporal.get(key) is None + else: + assert g.vertex(1).properties.temporal.get(key).items() == value + assert g.vertices.properties.temporal.get(key).items() == [value] + assert g.vertices.out_neighbours.properties.temporal.get(key).items() == [ + [value] + ] history_test("prop 1", [(1, 1), (2, 2)]) history_test("prop 2", [(2, 0.6), (3, 0.9)]) - history_test("prop 3", [(1, "hi"), (3, 'hello')]) + history_test("prop 3", [(1, "hi"), (3, "hello")]) history_test("prop 4", [(1, True), (2, False), (3, True)]) - history_test("undefined", []) + history_test("undefined", None) def time_history_test(time, key, value): - assert g.at(time).vertex(1).property_history(key) == value - assert g.at(time).vertices.property_history(key).collect() == [value] - assert g.at(time).vertices.out_neighbours().property_history(key).collect() == [[value]] + if value is None: + assert g.at(time).vertex(1).properties.temporal.get(key) is None + assert g.at(time).vertices.properties.temporal.get(key) is None + assert ( + g.at(time).vertices.out_neighbours.properties.temporal.get(key) is None + ) + else: + assert g.at(time).vertex(1).properties.temporal.get(key).items() == value + assert g.at(time).vertices.properties.temporal.get(key).items() == [value] + assert g.at(time).vertices.out_neighbours.properties.temporal.get( + key + ).items() == [[value]] time_history_test(1, "prop 4", [(1, True)]) - time_history_test(1, "static prop", []) + 
time_history_test(1, "static prop", None) def time_static_property_test(time, key, value): gg = g.at(time) - assert gg.vertex(1).static_property(key) == value - assert gg.vertices.static_property(key).collect() == [value] - assert gg.vertices.out_neighbours().static_property(key).collect() == [[value]] + if value is None: + assert gg.vertex(1).properties.constant.get(key) is None + assert gg.vertices.properties.constant.get(key) is None + assert gg.vertices.out_neighbours.properties.constant.get(key) is None + else: + assert gg.vertex(1).properties.constant.get(key) == value + assert gg.vertices.properties.constant.get(key) == [value] + assert gg.vertices.out_neighbours.properties.constant.get(key) == [[value]] def static_property_test(key, value): - assert g.vertex(1).static_property(key) == value - assert g.vertices.static_property(key).collect() == [value] - assert g.vertices.out_neighbours().static_property(key).collect() == [[value]] + if value is None: + assert g.vertex(1).properties.constant.get(key) is None + assert g.vertices.properties.constant.get(key) is None + assert g.vertices.out_neighbours.properties.constant.get(key) is None + else: + assert g.vertex(1).properties.constant.get(key) == value + assert g.vertices.properties.constant.get(key) == [value] + assert g.vertices.out_neighbours.properties.constant.get(key) == [[value]] time_static_property_test(1, "static prop", 123) time_static_property_test(100, "static prop", 123) @@ -300,19 +442,36 @@ def static_property_test(key, value): # testing property def time_property_test(time, key, value): gg = g.at(time) - assert gg.vertex(1).property(key) == value - assert gg.vertices.property(key).collect() == [value] - assert gg.vertices.out_neighbours().property(key).collect() == [[value]] + if value is None: + assert gg.vertex(1).properties.get(key) is None + assert gg.vertices.properties.get(key) is None + assert gg.vertices.out_neighbours.properties.get(key) is None + else: + assert 
gg.vertex(1).properties.get(key) == value + assert gg.vertices.properties.get(key) == [value] + assert gg.vertices.out_neighbours.properties.get(key) == [[value]] def property_test(key, value): - assert g.vertex(1).property(key) == value - assert g.vertices.property(key).collect() == [value] - assert g.vertices.out_neighbours().property(key).collect() == [[value]] + if value is None: + assert g.vertex(1).properties.get(key) is None + assert g.vertices.properties.get(key) is None + assert g.vertices.out_neighbours.properties.get(key) is None + else: + assert g.vertex(1).properties.get(key) == value + assert g.vertices.properties.get(key) == [value] + assert g.vertices.out_neighbours.properties.get(key) == [[value]] def no_static_property_test(key, value): - assert g.vertex(1).property(key, include_static=False) == value - assert g.vertices.property(key, include_static=False).collect() == [value] - assert g.vertices.out_neighbours().property(key, include_static=False).collect() == [[value]] + if value is None: + assert g.vertex(1).properties.temporal.get(key) is None + assert g.vertices.properties.temporal.get(key) is None + assert g.vertices.out_neighbours.properties.temporal.get(key) is None + else: + assert g.vertex(1).properties.temporal.get(key).value() == value + assert g.vertices.properties.temporal.get(key).value() == [value] + assert g.vertices.out_neighbours.properties.temporal.get(key).value() == [ + [value] + ] property_test("static prop", 123) assert g.vertex(1)["static prop"] == 123 @@ -322,185 +481,295 @@ def no_static_property_test(key, value): time_property_test(1, "prop 2", None) # testing properties - assert g.vertex(1).properties() == {'prop 2': 0.9, 'prop 3': 'hello', 'prop 1': 2, 'prop 4': True, - 'static prop': 123} - assert g.vertices.properties().collect() == [{'prop 2': 0.9, 'prop 3': 'hello', 'prop 1': 2, 'prop 4': True, - 'static prop': 123}] - assert g.vertices.out_neighbours().properties().collect() == [[ - {'prop 2': 0.9, 'prop 3': 
'hello', 'prop 1': 2, 'prop 4': True, - 'static prop': 123}]] - - assert g.vertex(1).properties(include_static=False) == {'prop 2': 0.9, 'prop 3': 'hello', 'prop 1': 2, - 'prop 4': True} - assert g.vertices.properties(include_static=False).collect() == [{'prop 2': 0.9, 'prop 3': 'hello', 'prop 1': 2, - 'prop 4': True}] - assert g.vertices.out_neighbours().properties(include_static=False).collect() == [ - [{'prop 2': 0.9, 'prop 3': 'hello', 'prop 1': 2, - 'prop 4': True}]] - - assert g.at(2).vertex(1).properties() == {'prop 1': 2, 'prop 4': False, 'prop 2': 0.6, 'static prop': 123, - 'prop 3': 'hi'} - assert g.at(2).vertices.properties().collect() == [{'prop 1': 2, 'prop 4': False, 'prop 2': 0.6, 'static prop': 123, - 'prop 3': 'hi'}] - assert g.at(2).vertices.out_neighbours().properties().collect() == [ - [{'prop 1': 2, 'prop 4': False, 'prop 2': 0.6, 'static prop': 123, - 'prop 3': 'hi'}]] + assert g.vertex(1).properties == { + "prop 2": 0.9, + "prop 3": "hello", + "prop 1": 2, + "prop 4": True, + "static prop": 123, + } + assert g.vertices.properties == { + "prop 2": [0.9], + "prop 3": ["hello"], + "prop 1": [2], + "prop 4": [True], + "static prop": [123], + } + assert g.vertices.out_neighbours.properties == { + "prop 2": [[0.9]], + "prop 3": [["hello"]], + "prop 1": [[2]], + "prop 4": [[True]], + "static prop": [[123]], + } + + assert g.vertex(1).properties.temporal.latest() == { + "prop 2": 0.9, + "prop 3": "hello", + "prop 1": 2, + "prop 4": True, + } + assert g.vertices.properties.temporal.latest() == { + "prop 2": [0.9], + "prop 3": ["hello"], + "prop 1": [2], + "prop 4": [True], + } + assert g.vertices.out_neighbours.properties.temporal.latest() == { + "prop 2": [[0.9]], + "prop 3": [["hello"]], + "prop 1": [[2]], + "prop 4": [[True]], + } + + assert g.at(2).vertex(1).properties == { + "prop 1": 2, + "prop 4": False, + "prop 2": 0.6, + "static prop": 123, + "prop 3": "hi", + } + assert g.at(2).vertices.properties == { + "prop 1": [2], + "prop 4": [False], + 
"prop 2": [0.6], + "static prop": [123], + "prop 3": ["hi"], + } + assert g.at(2).vertices.out_neighbours.properties == { + "prop 1": [[2]], + "prop 4": [[False]], + "prop 2": [[0.6]], + "static prop": [[123]], + "prop 3": [["hi"]], + } # testing property histories - assert g.vertex(1).property_histories() == {'prop 3': [(1, 'hi'), (3, 'hello')], 'prop 1': [(1, 1), (2, 2)], - 'prop 4': [(1, True), (2, False), (3, True)], - 'prop 2': [(2, 0.6), (3, 0.9)]} - assert g.vertices.property_histories().collect() == [ - {'prop 3': [(1, 'hi'), (3, 'hello')], 'prop 1': [(1, 1), (2, 2)], - 'prop 4': [(1, True), (2, False), (3, True)], - 'prop 2': [(2, 0.6), (3, 0.9)]}] - assert g.vertices.out_neighbours().property_histories().collect() == [ - [{'prop 3': [(1, 'hi'), (3, 'hello')], 'prop 1': [(1, 1), (2, 2)], - 'prop 4': [(1, True), (2, False), (3, True)], - 'prop 2': [(2, 0.6), (3, 0.9)]}]] - - assert g.at(2).vertex(1).property_histories() == {'prop 2': [(2, 0.6)], 'prop 4': [(1, True), (2, False)], - 'prop 1': [(1, 1), (2, 2)], 'prop 3': [(1, 'hi')]} - assert g.at(2).vertices.property_histories().collect() == [{'prop 2': [(2, 0.6)], 'prop 4': [(1, True), (2, False)], - 'prop 1': [(1, 1), (2, 2)], 'prop 3': [(1, 'hi')]}] - assert g.at(2).vertices.out_neighbours().property_histories().collect() == [ - [{'prop 2': [(2, 0.6)], 'prop 4': [(1, True), (2, False)], - 'prop 1': [(1, 1), (2, 2)], 'prop 3': [(1, 'hi')]}]] + assert g.vertex(1).properties.temporal == { + "prop 3": [(1, "hi"), (3, "hello")], + "prop 1": [(1, 1), (2, 2)], + "prop 4": [(1, True), (2, False), (3, True)], + "prop 2": [(2, 0.6), (3, 0.9)], + } + assert g.vertices.properties.temporal == { + "prop 3": [[(1, "hi"), (3, "hello")]], + "prop 1": [[(1, 1), (2, 2)]], + "prop 4": [[(1, True), (2, False), (3, True)]], + "prop 2": [[(2, 0.6), (3, 0.9)]], + } + assert g.vertices.out_neighbours.properties.temporal == { + "prop 3": [[[(1, "hi"), (3, "hello")]]], + "prop 1": [[[(1, 1), (2, 2)]]], + "prop 4": [[[(1, True), (2, 
False), (3, True)]]], + "prop 2": [[[(2, 0.6), (3, 0.9)]]], + } + + assert g.at(2).vertex(1).properties.temporal == { + "prop 2": [(2, 0.6)], + "prop 4": [(1, True), (2, False)], + "prop 1": [(1, 1), (2, 2)], + "prop 3": [(1, "hi")], + } + assert g.at(2).vertices.properties.temporal == { + "prop 2": [[(2, 0.6)]], + "prop 4": [[(1, True), (2, False)]], + "prop 1": [[(1, 1), (2, 2)]], + "prop 3": [[(1, "hi")]], + } + assert g.at(2).vertices.out_neighbours.properties.temporal == { + "prop 2": [[[(2, 0.6)]]], + "prop 4": [[[(1, True), (2, False)]]], + "prop 1": [[[(1, 1), (2, 2)]]], + "prop 3": [[[(1, "hi")]]], + } # testing property names - expected_names = sorted(['prop 4', 'prop 1', 'prop 2', 'prop 3', 'static prop']) - assert sorted(g.vertex(1).property_names()) == expected_names - names = g.vertices.property_names().collect() - assert len(names) == 1 and sorted(names[0]) == expected_names - names = g.vertices.out_neighbours().property_names().collect() - assert len(names) == 1 and len(names[0]) == 1 and sorted(names[0][0]) == expected_names - - expected_names_no_static = sorted(['prop 4', 'prop 1', 'prop 2', 'prop 3']) - assert sorted(g.vertex(1).property_names(include_static=False)) == expected_names_no_static - names = g.vertices.property_names(include_static=False).collect() - assert len(names) == 1 and sorted(names[0]) == expected_names_no_static - names = g.vertices.out_neighbours().property_names(include_static=False).collect() - assert len(names) == 1 and len(names[0]) == 1 and sorted(names[0][0]) == expected_names_no_static - - assert sorted(g.at(1).vertex(1).property_names(include_static=False)) == expected_names_no_static - names = g.at(1).vertices.property_names(include_static=False).collect() - assert len(names) == 1 and sorted(names[0]) == expected_names_no_static - names = g.at(1).vertices.out_neighbours().property_names(include_static=False).collect() - assert len(names) == 1 and len(names[0]) == 1 and sorted(names[0][0]) == expected_names_no_static 
+ expected_names = sorted(["prop 4", "prop 1", "prop 2", "prop 3", "static prop"]) + assert sorted(g.vertex(1).properties.keys()) == expected_names + assert sorted(g.vertices.properties.keys()) == expected_names + assert sorted(g.vertices.out_neighbours.properties.keys()) == expected_names + + expected_names_no_static = sorted(["prop 4", "prop 1", "prop 2", "prop 3"]) + assert sorted(g.vertex(1).properties.temporal.keys()) == expected_names_no_static + assert sorted(g.vertices.properties.temporal.keys()) == expected_names_no_static + assert ( + sorted(g.vertices.out_neighbours.properties.temporal.keys()) + == expected_names_no_static + ) + + expected_names_no_static_at_1 = sorted(["prop 4", "prop 1", "prop 3"]) + assert ( + sorted(g.at(1).vertex(1).properties.temporal.keys()) + == expected_names_no_static_at_1 + ) + assert ( + sorted(g.at(1).vertices.properties.temporal.keys()) + == expected_names_no_static_at_1 + ) + assert ( + sorted(g.at(1).vertices.out_neighbours.properties.temporal.keys()) + == expected_names_no_static_at_1 + ) # testing has_property - assert g.vertex(1).has_property("prop 4") - assert g.vertices.has_property("prop 4").collect() == [True] - assert g.vertices.out_neighbours().has_property("prop 4").collect() == [[True]] + assert "prop 4" in g.vertex(1).properties + assert "prop 4" in g.vertices.properties + assert "prop 4" in g.vertices.out_neighbours.properties - assert g.vertex(1).has_property("prop 2") - assert g.vertices.has_property("prop 2").collect() == [True] - assert g.vertices.out_neighbours().has_property("prop 2").collect() == [[True]] + assert "prop 2" in g.vertex(1).properties + assert "prop 2" in g.vertices.properties + assert "prop 2" in g.vertices.out_neighbours.properties - assert not g.vertex(1).has_property("prop 5") - assert g.vertices.has_property("prop 5").collect() == [False] - assert g.vertices.out_neighbours().has_property("prop 5").collect() == [[False]] + assert "prop 5" not in g.vertex(1).properties + assert "prop 
5" not in g.vertices.properties + assert "prop 5" not in g.vertices.out_neighbours.properties - assert not g.at(1).vertex(1).has_property("prop 2") - assert g.at(1).vertices.has_property("prop 2").collect() == [False] - assert g.at(1).vertices.out_neighbours().has_property("prop 2").collect() == [[False]] + assert "prop 2" not in g.at(1).vertex(1).properties + assert "prop 2" not in g.at(1).vertices.properties + assert "prop 2" not in g.at(1).vertices.out_neighbours.properties - assert g.vertex(1).has_property("static prop") - assert g.vertices.has_property("static prop").collect() == [True] - assert g.vertices.out_neighbours().has_property("static prop").collect() == [[True]] + assert "static prop" in g.vertex(1).properties + assert "static prop" in g.vertices.properties + assert "static prop" in g.vertices.out_neighbours.properties - assert g.at(1).vertex(1).has_property("static prop") - assert g.at(1).vertices.has_property("static prop").collect() == [True] - assert g.at(1).vertices.out_neighbours().has_property("static prop").collect() == [[True]] + assert "static prop" in g.at(1).vertex(1).properties + assert "static prop" in g.at(1).vertices.properties + assert "static prop" in g.at(1).vertices.out_neighbours.properties - assert not g.at(1).vertex(1).has_property("static prop", include_static=False) - assert g.at(1).vertices.has_property("static prop", include_static=False).collect() == [False] - assert g.at(1).vertices.out_neighbours().has_property("static prop", include_static=False).collect() == [[False]] + assert "static prop" not in g.at(1).vertex(1).properties.temporal + assert "static prop" not in g.at(1).vertices.properties.temporal + assert "static prop" not in g.at(1).vertices.out_neighbours.properties.temporal - assert g.vertex(1).has_static_property("static prop") - assert g.vertices.has_static_property("static prop").collect() == [True] - assert g.vertices.out_neighbours().has_static_property("static prop").collect() == [[True]] + assert "static 
prop" in g.vertex(1).properties.constant + assert "static prop" in g.vertices.properties.constant + assert "static prop" in g.vertices.out_neighbours.properties.constant - assert not g.vertex(1).has_static_property("prop 2") - assert g.vertices.has_static_property("prop 2").collect() == [False] - assert g.vertices.out_neighbours().has_static_property("prop 2").collect() == [[False]] + assert "prop 2" not in g.vertex(1).properties.constant + assert "prop 2" not in g.vertices.properties.constant + assert "prop 2" not in g.vertices.out_neighbours.properties.constant - assert g.at(1).vertex(1).has_static_property("static prop") - assert g.at(1).vertices.has_static_property("static prop").collect() == [True] - assert g.at(1).vertices.out_neighbours().has_static_property("static prop").collect() == [[True]] + assert "static prop" in g.at(1).vertex(1).properties.constant + assert "static prop" in g.at(1).vertices.properties.constant + assert "static prop" in g.at(1).vertices.out_neighbours.properties.constant def test_edge_properties(): g = Graph() props_t1 = {"prop 1": 1, "prop 3": "hi", "prop 4": True} - g.add_edge(1, 1, 2, props_t1) + e = g.add_edge(1, 1, 2, props_t1) props_t2 = {"prop 1": 2, "prop 2": 0.6, "prop 4": False} - g.add_edge(2, 1, 2, props_t2) + e.add_updates(2, props_t2) props_t3 = {"prop 2": 0.9, "prop 3": "hello", "prop 4": True} - g.add_edge(3, 1, 2, props_t3) - - g.add_edge_properties(1, 2, {"static prop": 123}) - - # testing property_history - assert g.edge(1, 2).property_history("prop 1") == [(1, 1), (2, 2)] - assert g.edge(1, 2).property_history("prop 2") == [(2, 0.6), (3, 0.9)] - assert g.edge(1, 2).property_history("prop 3") == [(1, "hi"), (3, 'hello')] - assert g.edge(1, 2).property_history("prop 4") == [(1, True), (2, False), (3, True)] - assert g.edge(1, 2).property_history("undefined") == [] - assert g.at(1).edge(1, 2).property_history("prop 4") == [(1, True)] - assert g.at(1).edge(1, 2).property_history("static prop") == [] + e.add_updates(3, 
props_t3) + + e.add_constant_properties({"static prop": 123}) + + # testing property history + assert g.edge(1, 2).properties.temporal.get("prop 1") == [(1, 1), (2, 2)] + assert g.edge(1, 2).properties.temporal.get("prop 2") == [(2, 0.6), (3, 0.9)] + assert g.edge(1, 2).properties.temporal.get("prop 3") == [(1, "hi"), (3, "hello")] + assert g.edge(1, 2).properties.temporal.get("prop 4") == [ + (1, True), + (2, False), + (3, True), + ] + assert g.edge(1, 2).properties.temporal.get("undefined") is None + assert g.at(1).edge(1, 2).properties.temporal.get("prop 4") == [(1, True)] + assert g.at(1).edge(1, 2).properties.temporal.get("static prop") is None - assert g.at(1).edge(1, 2).static_property("static prop") == 123 - assert g.at(100).edge(1, 2).static_property("static prop") == 123 - assert g.edge(1, 2).static_property("static prop") == 123 - assert g.edge(1, 2).static_property("prop 4") is None + assert g.at(1).edge(1, 2).properties.constant.get("static prop") == 123 + assert g.at(100).edge(1, 2).properties.constant.get("static prop") == 123 + assert g.edge(1, 2).properties.constant.get("static prop") == 123 + assert g.edge(1, 2).properties.constant.get("prop 4") is None # testing property - assert g.edge(1, 2).property("static prop") == 123 + assert g.edge(1, 2).properties.get("static prop") == 123 assert g.edge(1, 2)["static prop"] == 123 - assert g.edge(1, 2).property("static prop", include_static=False) is None - assert g.edge(1, 2).property("prop 1", include_static=False) == 2 - assert g.at(2).edge(1, 2).property("prop 2") == 0.6 - assert g.at(1).edge(1, 2).property("prop 2") is None + assert g.edge(1, 2).properties.temporal.get("static prop") is None + assert g.edge(1, 2).properties.temporal.get("prop 1").value() == 2 + assert g.at(2).edge(1, 2).properties.get("prop 2") == 0.6 + assert g.at(1).edge(1, 2).properties.get("prop 2") is None # testing properties - assert g.edge(1, 2).properties() == {'prop 2': 0.9, 'prop 3': 'hello', 'prop 1': 2, 'prop 4': True, - 
'static prop': 123} + assert g.edge(1, 2).properties == { + "prop 2": 0.9, + "prop 3": "hello", + "prop 1": 2, + "prop 4": True, + "static prop": 123, + } - assert g.edge(1, 2).properties(include_static=False) == {'prop 2': 0.9, 'prop 3': 'hello', 'prop 1': 2, - 'prop 4': True} + assert g.edge(1, 2).properties.temporal.latest() == { + "prop 2": 0.9, + "prop 3": "hello", + "prop 1": 2, + "prop 4": True, + } - assert g.at(2).edge(1, 2).properties() == {'prop 1': 2, 'prop 4': False, 'prop 2': 0.6, 'static prop': 123, - 'prop 3': 'hi'} + assert g.at(2).edge(1, 2).properties == { + "prop 1": 2, + "prop 4": False, + "prop 2": 0.6, + "static prop": 123, + "prop 3": "hi", + } # testing property histories - assert g.edge(1, 2).property_histories() == {'prop 3': [(1, 'hi'), (3, 'hello')], 'prop 1': [(1, 1), (2, 2)], - 'prop 4': [(1, True), (2, False), (3, True)], - 'prop 2': [(2, 0.6), (3, 0.9)]} + assert g.edge(1, 2).properties.temporal == { + "prop 3": [(1, "hi"), (3, "hello")], + "prop 1": [(1, 1), (2, 2)], + "prop 4": [(1, True), (2, False), (3, True)], + "prop 2": [(2, 0.6), (3, 0.9)], + } - assert g.at(2).edge(1, 2).property_histories() == {'prop 2': [(2, 0.6)], 'prop 4': [(1, True), (2, False)], - 'prop 1': [(1, 1), (2, 2)], 'prop 3': [(1, 'hi')]} + assert g.at(2).edge(1, 2).properties.temporal == { + "prop 2": [(2, 0.6)], + "prop 4": [(1, True), (2, False)], + "prop 1": [(1, 1), (2, 2)], + "prop 3": [(1, "hi")], + } # testing property names - assert g.edge(1, 2).property_names().sort() == ['prop 4', 'prop 1', 'prop 2', 'prop 3', 'static prop'].sort() + assert sorted(g.edge(1, 2).properties.keys()) == sorted( + ["prop 4", "prop 1", "prop 2", "prop 3", "static prop"] + ) - assert g.edge(1, 2).property_names(include_static=False).sort() == ['prop 4', 'prop 1', 'prop 2', 'prop 3'].sort() + assert sorted(g.edge(1, 2).properties.temporal.keys()) == sorted( + ["prop 4", "prop 1", "prop 2", "prop 3"] + ) - assert g.at(1).edge(1, 2).property_names(include_static=False).sort() 
== ['prop 4', 'prop 1', 'prop 2', - 'prop 3'].sort() + assert sorted(g.at(1).edge(1, 2).properties.temporal.keys()) == sorted( + ["prop 4", "prop 1", "prop 3"] + ) # testing has_property - assert g.edge(1, 2).has_property("prop 4") - assert g.edge(1, 2).has_property("prop 2") - assert not g.edge(1, 2).has_property("prop 5") - assert not g.at(1).edge(1, 2).has_property("prop 2") - assert g.edge(1, 2).has_property("static prop") - assert g.at(1).edge(1, 2).has_property("static prop") - assert not g.at(1).edge(1, 2).has_property("static prop", include_static=False) + assert "prop 4" in g.edge(1, 2).properties + assert "prop 2" in g.edge(1, 2).properties + assert "prop 5" not in g.edge(1, 2).properties + assert "prop 2" not in g.at(1).edge(1, 2).properties + assert "static prop" in g.edge(1, 2).properties + assert "static prop" in g.at(1).edge(1, 2).properties + assert "static prop" not in g.at(1).edge(1, 2).properties.temporal + + assert "static prop" in g.edge(1, 2).properties.constant + assert "prop 2" not in g.edge(1, 2).properties.constant + assert "static prop" in g.at(1).edge(1, 2).properties.constant + + +def test_graph_as_property(): + g = Graph() + g.add_edge(0, 1, 2, {"graph": g}) + assert "graph" in g.edge(1, 2).properties + assert g.edge(1, 2).properties["graph"].has_edge(1, 2) + - assert g.edge(1, 2).has_static_property("static prop") - assert not g.edge(1, 2).has_static_property("prop 2") - assert g.at(1).edge(1, 2).has_static_property("static prop") +def test_map_and_list_property(): + g = Graph() + g.add_edge(0, 1, 2, {"map": {"test": 1, "list": [1, 2, 3]}}) + e_props = g.edge(1, 2).properties + assert "map" in e_props + assert e_props["map"]["test"] == 1 + assert e_props["map"]["list"] == [1, 2, 3] def test_exploded_edge_time(): @@ -509,15 +778,12 @@ def test_exploded_edge_time(): his = e.history() exploded_his = [] for ee in e.explode(): - exploded_his.append(ee.time()) + exploded_his.append(ee.time) assert his == exploded_his -# assert 
g.vertex(1).property_history("prop 3") == [(1, 3), (3, 'hello')] - - def test_algorithms(): - g = Graph(1) + g = Graph() lotr_graph = graph_loader.lotr_graph() g.add_edge(1, 1, 2, {"prop1": 1}) g.add_edge(2, 2, 3, {"prop1": 1}) @@ -542,39 +808,42 @@ def test_algorithms(): assert min_in_degree == 1 assert clustering_coefficient == 1.0 - lotr_clustering_coefficient = algorithms.local_clustering_coefficient(lotr_graph, 'Frodo') - lotr_local_triangle_count = algorithms.local_triangle_count(lotr_graph, 'Frodo') + lotr_clustering_coefficient = algorithms.local_clustering_coefficient( + lotr_graph, "Frodo" + ) + lotr_local_triangle_count = algorithms.local_triangle_count(lotr_graph, "Frodo") assert lotr_clustering_coefficient == 0.1984313726425171 assert lotr_local_triangle_count == 253 def test_graph_time_api(): - g = create_graph(1) + g = create_graph() - earliest_time = g.earliest_time() - latest_time = g.latest_time() + earliest_time = g.earliest_time + latest_time = g.latest_time assert len(list(g.rolling(1))) == latest_time - earliest_time + 1 - assert len(list(g.expanding(2))) == (latest_time - earliest_time) / 2 + assert len(list(g.expanding(2))) == math.ceil((latest_time + 1 - earliest_time) / 2) w = g.window(2, 6) - assert len(list(w.rolling(window=10, step=3))) == 1 + assert len(list(w.rolling(window=10, step=3))) == 2 def test_save_load_graph(): - g = create_graph(1) + g = create_graph() g.add_vertex(1, 11, {"type": "wallet", "balance": 99.5}) g.add_vertex(2, 12, {"type": "wallet", "balance": 10.0}) - g.add_vertex(3, 13, {"type": "wallet", "balance": 76}) + g.add_vertex(3, 13, {"type": "wallet", "balance": 76.0}) g.add_edge(4, 11, 12, {"prop1": 1, "prop2": 9.8, "prop3": "test"}) g.add_edge(5, 12, 13, {"prop1": 1321, "prop2": 9.8, "prop3": "test"}) g.add_edge(6, 13, 11, {"prop1": 645, "prop2": 9.8, "prop3": "test"}) tmpdirname = tempfile.TemporaryDirectory() - g.save_to_file(tmpdirname.name) + graph_path = tmpdirname.name + "/test_graph.bin" + 
g.save_to_file(graph_path) - del (g) + del g - g = Graph.load_from_file(tmpdirname.name) + g = Graph.load_from_file(graph_path) view = g.window(0, 10) assert g.has_vertex(13) @@ -582,17 +851,19 @@ def test_save_load_graph(): assert view.vertex(13).out_degree() == 1 assert view.vertex(13).degree() == 2 - triangles = algorithms.local_triangle_count(view, 13) # How many triangles is 13 involved in + triangles = algorithms.local_triangle_count( + view, 13 + ) # How many triangles is 13 involved in assert triangles == 1 v = view.vertex(11) - assert v.property_histories() == {'type': [(1, 'wallet')], 'balance': [(1, 99.5)]} + assert v.properties.temporal == {"type": [(1, "wallet")], "balance": [(1, 99.5)]} tmpdirname.cleanup() def test_graph_at(): - g = create_graph(1) + g = create_graph() view = g.at(2) assert view.vertex(1).degree() == 3 @@ -603,7 +874,7 @@ def test_graph_at(): def test_add_node_string(): - g = Graph(1) + g = Graph() g.add_vertex(0, 1, {}) g.add_vertex(1, "haaroon", {}) @@ -614,7 +885,7 @@ def test_add_node_string(): def test_add_edge_string(): - g = Graph(1) + g = Graph() g.add_edge(0, 1, 2, {}) g.add_edge(1, "haaroon", "ben", {}) @@ -629,7 +900,7 @@ def test_add_edge_string(): def test_all_neighbours_window(): - g = Graph(4) + g = Graph() g.add_edge(1, 1, 2, {}) g.add_edge(1, 2, 3, {}) g.add_edge(2, 3, 2, {}) @@ -638,13 +909,13 @@ def test_all_neighbours_window(): view = g.at(2) v = view.vertex(2) - assert list(v.window(0, 2).in_neighbours().id()) == [1] - assert list(v.window(0, 2).out_neighbours().id()) == [3] - assert list(v.window(0, 2).neighbours().id()) == [1, 3] + assert list(v.window(0, 2).in_neighbours.id) == [1] + assert list(v.window(0, 2).out_neighbours.id) == [3] + assert list(v.window(0, 2).neighbours.id) == [1, 3] def test_all_degrees_window(): - g = Graph(4) + g = Graph() g.add_edge(1, 1, 2, {}) g.add_edge(1, 2, 3, {}) g.add_edge(2, 3, 2, {}) @@ -667,7 +938,7 @@ def test_all_degrees_window(): def test_all_edge_window(): - g = Graph(4) 
+ g = Graph() g.add_edge(1, 1, 2, {}) g.add_edge(1, 2, 3, {}) g.add_edge(2, 3, 2, {}) @@ -678,24 +949,38 @@ def test_all_edge_window(): view = g.at(4) v = view.vertex(2) - assert sorted(v.window(0, 4).in_edges().src().id()) == [1, 3, 4] - assert sorted(v.window(t_end=4).in_edges().src().id()) == [1, 3, 4] - assert sorted(v.window(t_start=2).in_edges().src().id()) == [3, 4] - assert sorted(v.window(0, 4).out_edges().dst().id()) == [3] - assert sorted(v.window(t_end=3).out_edges().dst().id()) == [3] - assert sorted(v.window(t_start=2).out_edges().dst().id()) == [4] - assert sorted((e.src().id(), e.dst().id()) for e in v.window(0, 4).edges()) == [(1, 2), (2, 3), (3, 2), (4, 2)] - assert sorted((e.src().id(), e.dst().id()) for e in v.window(t_end=4).edges()) == [(1, 2), (2, 3), (3, 2), (4, 2)] - assert sorted((e.src().id(), e.dst().id()) for e in v.window(t_start=1).edges()) == [(1, 2), (2, 3), (2, 4), (3, 2), - (4, 2)] + assert sorted(v.window(0, 4).in_edges.src.id) == [1, 3, 4] + assert sorted(v.window(t_end=4).in_edges.src.id) == [1, 3, 4] + assert sorted(v.window(t_start=2).in_edges.src.id) == [3, 4] + assert sorted(v.window(0, 4).out_edges.dst.id) == [3] + assert sorted(v.window(t_end=3).out_edges.dst.id) == [3] + assert sorted(v.window(t_start=2).out_edges.dst.id) == [4] + assert sorted((e.src.id, e.dst.id) for e in v.window(0, 4).edges) == [ + (1, 2), + (2, 3), + (3, 2), + (4, 2), + ] + assert sorted((e.src.id, e.dst.id) for e in v.window(t_end=4).edges) == [ + (1, 2), + (2, 3), + (3, 2), + (4, 2), + ] + assert sorted((e.src.id, e.dst.id) for e in v.window(t_start=1).edges) == [ + (1, 2), + (2, 3), + (2, 4), + (3, 2), + (4, 2), + ] def test_static_prop_change(): # with pytest.raises(Exception): - g = Graph(1) - - g.add_edge(0, 1, 2, {}) - g.add_vertex_properties(1, {"name": "value1"}) + g = Graph() + v = g.add_vertex(0, 1) + v.add_constant_properties({"name": "value1"}) expected_msg = ( """Exception: Failed to mutate graph\n""" @@ -707,11 +992,11 @@ def 
test_static_prop_change(): # with pytest.raises(Exception, match=re.escape(expected_msg)): with pytest.raises(Exception): - g.add_vertex_properties(1, {"name": "value2"}) + v.add_constant_properties({"name": "value2"}) def test_triplet_count(): - g = Graph(1) + g = Graph() g.add_edge(0, 1, 2, {}) g.add_edge(0, 2, 3, {}) @@ -722,7 +1007,7 @@ def test_triplet_count(): def test_global_clustering_coeffficient(): - g = Graph(1) + g = Graph() g.add_edge(0, 1, 2, {}) g.add_edge(0, 2, 3, {}) @@ -736,7 +1021,7 @@ def test_global_clustering_coeffficient(): def test_edge_time_apis(): - g = Graph(1) + g = Graph() g.add_edge(1, 1, 2, {"prop2": 10}) g.add_edge(2, 2, 4, {"prop2": 11}) @@ -747,34 +1032,34 @@ def test_edge_time_apis(): e = g.edge(1, 2) for e in e.expanding(1): - assert e.src().name() == '1' - assert e.dst().name() == '2' + assert e.src.name == "1" + assert e.dst.name == "2" ls = [] - for e in v.edges(): - ls.append(e.src().name()) - ls.append(e.dst().name()) + for e in v.edges: + ls.append(e.src.name) + ls.append(e.dst.name) - assert ls == ['1', '2', '1', '5'] + assert ls == ["1", "2", "1", "5"] v = g.vertex(2) ls = [] - for e in v.in_edges(): - ls.append(e.src().name()) - ls.append(e.dst().name()) + for e in v.in_edges: + ls.append(e.src.name) + ls.append(e.dst.name) - assert ls == ['1', '2'] + assert ls == ["1", "2"] ls = [] - for e in v.out_edges(): - ls.append(e.src().name()) - ls.append(e.dst().name()) + for e in v.out_edges: + ls.append(e.src.name) + ls.append(e.dst.name) - assert ls == ['2', '4'] + assert ls == ["2", "4"] def test_edge_earliest_latest_time(): - g = Graph(1) + g = Graph() g.add_edge(0, 1, 2, {}) g.add_edge(1, 1, 2, {}) g.add_edge(2, 1, 2, {}) @@ -782,31 +1067,31 @@ def test_edge_earliest_latest_time(): g.add_edge(1, 1, 3, {}) g.add_edge(2, 1, 3, {}) - assert g.edge(1, 2).earliest_time() == 0 - assert g.edge(1, 2).latest_time() == 2 + assert g.edge(1, 2).earliest_time == 0 + assert g.edge(1, 2).latest_time == 2 - assert 
list(g.vertex(1).edges().earliest_time()) == [0, 0] - assert list(g.vertex(1).edges().latest_time()) == [2, 2] - assert list(g.vertex(1).at(1).edges().earliest_time()) == [0, 0] - assert list(g.vertex(1).at(1).edges().latest_time()) == [1, 1] + assert list(g.vertex(1).edges.earliest_time) == [0, 0] + assert list(g.vertex(1).edges.latest_time) == [2, 2] + assert list(g.vertex(1).at(1).edges.earliest_time) == [0, 0] + assert list(g.vertex(1).at(1).edges.latest_time) == [1, 1] def test_vertex_earliest_time(): - g = Graph(1) + g = Graph() g.add_vertex(0, 1, {}) g.add_vertex(1, 1, {}) g.add_vertex(2, 1, {}) view = g.at(1) - assert view.vertex(1).earliest_time() == 0 - assert view.vertex(1).latest_time() == 1 + assert view.vertex(1).earliest_time == 0 + assert view.vertex(1).latest_time == 1 view = g.at(3) - assert view.vertex(1).earliest_time() == 0 - assert view.vertex(1).latest_time() == 2 + assert view.vertex(1).earliest_time == 0 + assert view.vertex(1).latest_time == 2 def test_vertex_history(): - g = Graph(1) + g = Graph() g.add_vertex(1, 1, {}) g.add_vertex(2, 1, {}) @@ -819,17 +1104,17 @@ def test_vertex_history(): g.add_vertex(7, "Lord Farquaad", {}) g.add_vertex(8, "Lord Farquaad", {}) - assert (g.vertex(1).history() == [1, 2, 3, 4, 8]) - assert (g.vertex("Lord Farquaad").history() == [4, 6, 7, 8]) + assert g.vertex(1).history() == [1, 2, 3, 4, 8] + assert g.vertex("Lord Farquaad").history() == [4, 6, 7, 8] view = g.window(1, 8) - assert (view.vertex(1).history() == [1, 2, 3, 4]) - assert (view.vertex("Lord Farquaad").history() == [4, 6, 7]) + assert view.vertex(1).history() == [1, 2, 3, 4] + assert view.vertex("Lord Farquaad").history() == [4, 6, 7] def test_edge_history(): - g = Graph(1) + g = Graph() g.add_edge(1, 1, 2) g.add_edge(2, 1, 3) @@ -838,30 +1123,86 @@ def test_edge_history(): view = g.window(1, 5) - assert (g.edge(1, 2).history() == [1, 3]) - - # also needs to be fixed in Pedros PR - # assert(view.edge(1, 4).history() == [4]) + assert g.edge(1, 
2).history() == [1, 3] + assert view.edge(1, 4).history() == [4] def test_lotr_edge_history(): g = graph_loader.lotr_graph() - assert (g.edge('Frodo', 'Gandalf').history() == [329, 555, 861, 1056, 1130, 1160, 1234, 1241, 1390, 1417, 1656, - 1741, 1783, 1785, 1792, 1804, 1809, 1999, 2056, 2254, 2925, 2999, - 3703, 3914, 4910, 5620, 5775, 6381, 6531, 6578, 6661, 6757, 7041, - 7356, 8183, 8190, 8276, 8459, 8598, 8871, 9098, 9343, 9903, 11189, - 11192, 11279, 11365, 14364, 21551, 21706, 23212, 26958, 27060, - 29024, 30173, 30737, 30744, 31023, 31052, 31054, 31103, 31445, - 32656]) - assert (g.at(1000).edge('Frodo', 'Gandalf').history() == [329, 555, 861]) - assert (g.edge('Frodo', 'Gandalf').at(1000).history() == [329, 555, 861]) - assert (g.window(100, 1000).edge('Frodo', 'Gandalf').history() == [329, 555, 861]) - assert (g.edge('Frodo', 'Gandalf').window(100, 1000).history() == [329, 555, 861]) + assert g.edge("Frodo", "Gandalf").history() == [ + 329, + 555, + 861, + 1056, + 1130, + 1160, + 1234, + 1241, + 1390, + 1417, + 1656, + 1741, + 1783, + 1785, + 1792, + 1804, + 1809, + 1999, + 2056, + 2254, + 2925, + 2999, + 3703, + 3914, + 4910, + 5620, + 5775, + 6381, + 6531, + 6578, + 6661, + 6757, + 7041, + 7356, + 8183, + 8190, + 8276, + 8459, + 8598, + 8871, + 9098, + 9343, + 9903, + 11189, + 11192, + 11279, + 11365, + 14364, + 21551, + 21706, + 23212, + 26958, + 27060, + 29024, + 30173, + 30737, + 30744, + 31023, + 31052, + 31054, + 31103, + 31445, + 32656, + ] + assert g.at(1000).edge("Frodo", "Gandalf").history() == [329, 555, 861] + assert g.edge("Frodo", "Gandalf").at(1000).history() == [329, 555, 861] + assert g.window(100, 1000).edge("Frodo", "Gandalf").history() == [329, 555, 861] + assert g.edge("Frodo", "Gandalf").window(100, 1000).history() == [329, 555, 861] -def test_connected_components(): - g = Graph(1) +def gen_graph(): + g = Graph() g.add_edge(10, 1, 3, {}) g.add_edge(11, 1, 2, {}) g.add_edge(12, 1, 2, {}) @@ -874,66 +1215,112 @@ def 
test_connected_components(): g.add_edge(15, 4, 7, {}) g.add_edge(10, 4, 7, {}) g.add_edge(10, 5, 8, {}) + return g + +def test_connected_components(): + g = gen_graph() actual = algorithms.weakly_connected_components(g, 20) - expected = {'1': 1, '2': 1, '3': 1, '4': 1, '5': 1, '6': 1, '7': 1, '8': 1} - assert (actual == expected) + expected = {"1": 1, "2": 1, "3": 1, "4": 1, "5": 1, "6": 1, "7": 1, "8": 1} + assert actual.get_all() == expected + assert actual.get("1") == 1 -def test_page_rank(): - g = Graph(1) - g.add_edge(10, 1, 3, {}) - g.add_edge(11, 1, 2, {}) - g.add_edge(12, 1, 2, {}) - g.add_edge(9, 1, 2, {}) - g.add_edge(12, 2, 4, {}) - g.add_edge(13, 2, 5, {}) - g.add_edge(14, 5, 5, {}) - g.add_edge(14, 5, 4, {}) - g.add_edge(5, 4, 6, {}) - g.add_edge(15, 4, 7, {}) - g.add_edge(10, 4, 7, {}) - g.add_edge(10, 5, 8, {}) +def test_algo_result(): + g = gen_graph() + + actual = algorithms.weakly_connected_components(g, 20) + expected = {"1": 1, "2": 1, "3": 1, "4": 1, "5": 1, "6": 1, "7": 1, "8": 1} + assert actual.get_all() == expected + assert actual.get("1") == 1 + assert actual.get("not a node") == None + expected_array = [ + ("1", 1), + ("2", 1), + ("3", 1), + ("4", 1), + ("5", 1), + ("6", 1), + ("7", 1), + ("8", 1), + ] + assert sorted(actual.sort_by_value()) == expected_array + assert actual.sort_by_key() == sorted(expected_array, reverse=True) + assert actual.sort_by_key(reverse=False) == expected_array + assert sorted(actual.top_k(8)) == expected_array + assert len(actual.group_by()[1]) == 8 + assert type(actual.to_df()) == pandas.core.frame.DataFrame + df = actual.to_df() + expected_result = pd.DataFrame({"Key": ["1"], "Value": [1]}) + row_with_one = df[df["Key"] == "1"] + row_with_one.reset_index(inplace=True, drop=True) + assert row_with_one.equals(expected_result) + # Algo Str u64 + actual = algorithms.weakly_connected_components(g) + all_res = actual.get_all() + sorted_res = {k: all_res[k] for k in sorted(all_res)} + assert sorted_res == { + "1": 
1, + "2": 1, + "3": 1, + "4": 1, + "5": 1, + "6": 1, + "7": 1, + "8": 1, + } + # algo str f64 + actual = algorithms.pagerank(g) + expected_result = { + "3": 0.10274080842110422, + "2": 0.10274080842110422, + "4": 0.1615298183542792, + "6": 0.14074777909144864, + "1": 0.07209850165402759, + "5": 0.1615298183542792, + "7": 0.14074777909144864, + "8": 0.11786468661230831, + } + assert actual.get_all() == expected_result + assert actual.get("Not a node") == None + assert len(actual.to_df()) == 8 + # algo str vector + actual = algorithms.temporally_reachable_nodes(g, 20, 11, [1, 2], [4, 5]) + assert sorted(actual.get_all()) == ["1", "2", "3", "4", "5", "6", "7", "8"] - actual = algorithms.pagerank(g, 20) + +def test_page_rank(): + g = gen_graph() + actual = algorithms.pagerank(g) expected = { - '1': 0.07209850165402759, - '2': 0.10274080842110422, - '3': 0.10274080842110422, - '4': 0.1615298183542792, - '5': 0.1615298183542792, - '6': 0.14074777909144864, - '7': 0.14074777909144864, - '8': 0.11786468661230831, + "1": 0.07209850165402759, + "2": 0.10274080842110422, + "3": 0.10274080842110422, + "4": 0.1615298183542792, + "5": 0.1615298183542792, + "6": 0.14074777909144864, + "7": 0.14074777909144864, + "8": 0.11786468661230831, } - assert (actual == expected) + assert actual.get_all() == expected -def test_generic_taint(): - g = Graph(1) - g.add_edge(10, 1, 3, {}) - g.add_edge(11, 1, 2, {}) - g.add_edge(12, 1, 2, {}) - g.add_edge(9, 1, 2, {}) - g.add_edge(12, 2, 4, {}) - g.add_edge(13, 2, 5, {}) - g.add_edge(14, 5, 5, {}) - g.add_edge(14, 5, 4, {}) - g.add_edge(5, 4, 6, {}) - g.add_edge(15, 4, 7, {}) - g.add_edge(10, 4, 7, {}) - g.add_edge(10, 5, 8, {}) +def test_temporal_reachability(): + g = gen_graph() - actual = algorithms.generic_taint(g, 20, 11, [1, 2], [4, 5]) + actual = algorithms.temporally_reachable_nodes(g, 20, 11, [1, 2], [4, 5]) expected = { - '1': [(11, 'start')], - '2': [(11, 'start'), (12, '1'), (11, '1')], - '3': [], - '4': [(12, '2')], - '5': [(13, 
'2')], + "1": [(11, "start")], + "2": [(11, "start"), (12, "1"), (11, "1")], + "3": [], + "4": [(12, "2")], + "5": [(13, "2")], + "6": [], + "7": [], + "8": [], } - assert (actual == expected) + assert actual.get_all() == expected # def test_generic_taint_loader(): @@ -956,19 +1343,36 @@ def test_generic_taint(): def test_layer(): - g = Graph(1) + g = Graph() g.add_edge(0, 1, 2) - g.add_edge(0, 1, 3, layer='layer1') - g.add_edge(0, 1, 4, layer='layer2') + g.add_edge(0, 1, 3, layer="layer1") + g.add_edge(0, 1, 4, layer="layer2") + + assert g.default_layer().count_edges() == 1 + assert g.layers(["layer1"]).count_edges() == 1 + assert g.layers(["layer2"]).count_edges() == 1 + - assert (g.default_layer().num_edges() == 1) - assert (g.layer('layer1').num_edges() == 1) - assert (g.layer('layer2').num_edges() == 1) +def test_layer_vertex(): + g = Graph() + + g.add_edge(0, 1, 2, layer="layer1") + g.add_edge(0, 2, 3, layer="layer2") + g.add_edge(3, 2, 4, layer="layer1") + neighbours = g.layers(["layer1", "layer2"]).vertex(1).neighbours.collect() + assert sorted(neighbours[0].layers(["layer2"]).edges.id) == [(2, 3)] + assert sorted(g.layers(["layer2"]).vertex(neighbours[0].name).edges.id) == [(2, 3)] + assert sorted(g.layers(["layer1"]).vertex(neighbours[0].name).edges.id) == [ + (1, 2), + (2, 4), + ] + assert sorted(g.layers(["layer1"]).edges().id) == [(1, 2), (2, 4)] + assert sorted(g.layers(["layer1", "layer2"]).edges().id) == [(1, 2), (2, 3), (2, 4)] def test_rolling_as_iterable(): - g = Graph(1) + g = Graph() g.add_vertex(1, 1) g.add_vertex(4, 4) @@ -977,25 +1381,25 @@ def test_rolling_as_iterable(): # a normal operation is reusing the object returned by rolling twice, to get both results and an index. 
# So the following should work fine: - n_vertices = [w.num_vertices() for w in rolling] - time_index = [w.start() for w in rolling] + n_vertices = [w.count_vertices() for w in rolling] + time_index = [w.start for w in rolling] assert n_vertices == [1, 0, 0, 1] assert time_index == [1, 2, 3, 4] def test_layer_name(): - g = Graph(4) + g = Graph() g.add_edge(0, 0, 1) g.add_edge(0, 0, 2, layer="awesome layer") - assert g.edge(0, 1).layer_name() == "default layer" - assert g.edge(0, 2, "awesome layer").layer_name() == "awesome layer" + assert g.edge(0, 1).layer_names == ["_default"] + assert g.edge(0, 2).layer_names == ["awesome layer"] def test_window_size(): - g = Graph(4) + g = Graph() g.add_vertex(1, 1) g.add_vertex(4, 4) @@ -1003,12 +1407,15 @@ def test_window_size(): def test_time_index(): - g = Graph(4) + g = Graph() w = g.window("2020-01-01", "2020-01-03") rolling = w.rolling("1 day") time_index = rolling.time_index() - assert list(time_index) == [datetime.datetime(2020, 1, 1, 23, 59, 59, 999000), datetime.datetime(2020, 1, 2, 23, 59, 59, 999000)] + assert list(time_index) == [ + datetime.datetime(2020, 1, 1, 23, 59, 59, 999000), + datetime.datetime(2020, 1, 2, 23, 59, 59, 999000), + ] w = g.window(1, 3) rolling = w.rolling(1) @@ -1022,89 +1429,663 @@ def test_time_index(): def test_datetime_props(): - g = Graph(4) + g = Graph() dt1 = datetime.datetime(2020, 1, 1, 23, 59, 59, 999000) g.add_vertex(0, 0, {"time": dt1}) - assert g.vertex(0).property("time") == dt1 + assert g.vertex(0).properties.get("time") == dt1 dt2 = datetime.datetime(2020, 1, 1, 23, 59, 59, 999999) g.add_vertex(0, 1, {"time": dt2}) - assert g.vertex(1).property("time") == dt2 + assert g.vertex(1).properties.get("time") == dt2 + - def test_date_time(): - g = Graph(1) + g = Graph() - g.add_edge('2014-02-02', 1, 2) - g.add_edge('2014-02-03', 1, 3) - g.add_edge('2014-02-04', 1, 4) - g.add_edge('2014-02-05', 1, 2) + g.add_edge("2014-02-02", 1, 2) + g.add_edge("2014-02-03", 1, 3) + 
g.add_edge("2014-02-04", 1, 4) + g.add_edge("2014-02-05", 1, 2) - assert g.earliest_date_time() == datetime.datetime(2014, 2, 2, 0, 0) - assert g.latest_date_time() == datetime.datetime(2014, 2, 5, 0, 0) + assert g.earliest_date_time == datetime.datetime(2014, 2, 2, 0, 0) + assert g.latest_date_time == datetime.datetime(2014, 2, 5, 0, 0) e = g.edge(1, 3) exploded_edges = [] for edge in e.explode(): - exploded_edges.append(edge.date_time()) + exploded_edges.append(edge.date_time) assert exploded_edges == [datetime.datetime(2014, 2, 3)] - assert g.edge(1, 2).earliest_date_time() == datetime.datetime(2014, 2, 2, 0, 0) - assert g.edge(1, 2).latest_date_time() == datetime.datetime(2014, 2, 5, 0, 0) + assert g.edge(1, 2).earliest_date_time == datetime.datetime(2014, 2, 2, 0, 0) + assert g.edge(1, 2).latest_date_time == datetime.datetime(2014, 2, 5, 0, 0) + + assert g.vertex(1).earliest_date_time == datetime.datetime(2014, 2, 2, 0, 0) + assert g.vertex(1).latest_date_time == datetime.datetime(2014, 2, 5, 0, 0) - assert g.vertex(1).earliest_date_time() == datetime.datetime(2014, 2, 2, 0, 0) - assert g.vertex(1).latest_date_time() == datetime.datetime(2014, 2, 5, 0, 0) def test_date_time_window(): - g = Graph(1) + g = Graph() - g.add_edge('2014-02-02', 1, 2) - g.add_edge('2014-02-03', 1, 3) - g.add_edge('2014-02-04', 1, 4) - g.add_edge('2014-02-05', 1, 2) - g.add_edge('2014-02-06', 1, 2) + g.add_edge("2014-02-02", 1, 2) + g.add_edge("2014-02-03", 1, 3) + g.add_edge("2014-02-04", 1, 4) + g.add_edge("2014-02-05", 1, 2) + g.add_edge("2014-02-06", 1, 2) - view = g.window('2014-02-02', '2014-02-04') - view2 = g.window('2014-02-02', '2014-02-05') + view = g.window("2014-02-02", "2014-02-04") + view2 = g.window("2014-02-02", "2014-02-05") - assert view.start_date_time() == datetime.datetime(2014, 2, 2, 0, 0) - assert view.end_date_time() == datetime.datetime(2014, 2, 4, 0, 0) + assert view.start_date_time == datetime.datetime(2014, 2, 2, 0, 0) + assert view.end_date_time == 
datetime.datetime(2014, 2, 4, 0, 0) - assert view.earliest_date_time() == datetime.datetime(2014, 2, 2, 0, 0) - assert view.latest_date_time() == datetime.datetime(2014, 2, 4, 0, 0) + assert view.earliest_date_time == datetime.datetime(2014, 2, 2, 0, 0) + assert view.latest_date_time == datetime.datetime(2014, 2, 3, 0, 0) - assert view2.edge(1, 2).start_date_time() == datetime.datetime(2014, 2, 2, 0, 0) - assert view2.edge(1, 2).end_date_time() == datetime.datetime(2014, 2, 5, 0, 0) + assert view2.edge(1, 2).start_date_time == datetime.datetime(2014, 2, 2, 0, 0) + assert view2.edge(1, 2).end_date_time == datetime.datetime(2014, 2, 5, 0, 0) - assert view.vertex(1).earliest_date_time() == datetime.datetime(2014, 2, 2, 0, 0) - assert view.vertex(1).latest_date_time() == datetime.datetime(2014, 2, 3, 0, 0) + assert view.vertex(1).earliest_date_time == datetime.datetime(2014, 2, 2, 0, 0) + assert view.vertex(1).latest_date_time == datetime.datetime(2014, 2, 3, 0, 0) e = view.edge(1, 2) exploded_edges = [] for edge in e.explode(): - exploded_edges.append(edge.date_time()) + exploded_edges.append(edge.date_time) assert exploded_edges == [datetime.datetime(2014, 2, 2)] def test_datetime_add_vertex(): - g = Graph(1) + g = Graph() g.add_vertex(datetime.datetime(2014, 2, 2), 1) g.add_vertex(datetime.datetime(2014, 2, 3), 2) g.add_vertex(datetime.datetime(2014, 2, 4), 2) g.add_vertex(datetime.datetime(2014, 2, 5), 4) g.add_vertex(datetime.datetime(2014, 2, 6), 5) - view = g.window('2014-02-02', '2014-02-04') - view2 = g.window('2014-02-02', '2014-02-05') + view = g.window("2014-02-02", "2014-02-04") + view2 = g.window("2014-02-02", "2014-02-05") + + assert view.start_date_time == datetime.datetime(2014, 2, 2, 0, 0) + assert view.end_date_time == datetime.datetime(2014, 2, 4, 0, 0) + + assert view2.earliest_date_time == datetime.datetime(2014, 2, 2, 0, 0) + assert view2.latest_date_time == datetime.datetime(2014, 2, 4, 0, 0) + + assert view2.vertex(1).start_date_time == 
datetime.datetime(2014, 2, 2, 0, 0) + assert view2.vertex(1).end_date_time == datetime.datetime(2014, 2, 5, 0, 0) + + assert view.vertex(2).earliest_date_time == datetime.datetime(2014, 2, 3, 0, 0) + assert view.vertex(2).latest_date_time == datetime.datetime(2014, 2, 3, 0, 0) + + +def test_equivalent_vertices_edges_and_sets(): + g = Graph() + g.add_vertex(1, 1) + g.add_vertex(1, 2) + g.add_vertex(1, 3) + + g.add_edge(1, 1, 2) + g.add_edge(1, 2, 3) + + assert g.vertex(1) == g.vertex(1) + assert list(g.vertex(1).neighbours)[0] == list(g.vertex(3).neighbours)[0] + assert set(g.vertex(1).neighbours) == set(g.vertex(3).neighbours) + assert set(g.vertex(1).out_edges) == set(g.vertex(2).in_edges) + + assert g.edge(1, 1) == g.edge(1, 1) + + +def test_subgraph(): + g = create_graph() + empty_graph = g.subgraph([]) + assert empty_graph.vertices.collect() == [] + + vertex1 = g.vertices[1] + subgraph = g.subgraph([vertex1]) + assert subgraph.vertices.collect() == [vertex1] + + subgraph_from_str = g.subgraph(["1"]) + assert subgraph_from_str.vertices.collect() == [vertex1] + + subgraph_from_int = g.subgraph([1]) + assert subgraph_from_int.vertices.collect() == [vertex1] + + mg = subgraph.materialize() + assert mg.vertices.collect()[0].properties["type"] == "wallet" + assert mg.vertices.collect()[0].name == "1" + + props = {"prop 4": 11, "prop 5": "world", "prop 6": False} + mg.add_property(1, props) + + props = {"prop 1": 1, "prop 2": "hi", "prop 3": True} + mg.add_constant_properties(props) + x = mg.properties.keys() + x.sort() + assert x == ["prop 1", "prop 2", "prop 3", "prop 4", "prop 5", "prop 6"] + + +def test_materialize_graph(): + g = Graph() + + edges = [(1, 1, 2), (2, 1, 3), (-1, 2, 1), (0, 1, 1), (7, 3, 2), (1, 1, 1)] + + g.add_vertex(0, 1, {"type": "wallet", "cost": 99.5}) + g.add_vertex(-1, 2, {"type": "wallet", "cost": 10.0}) + g.add_vertex(6, 3, {"type": "wallet", "cost": 76.0}) + g.add_vertex(6, 4).add_constant_properties({"abc": "xyz"}) + + for e in edges: + 
g.add_edge(e[0], e[1], e[2], {"prop1": 1, "prop2": 9.8, "prop3": "test"}) + + g.add_edge(8, 2, 4) + + sprop = {"sprop 1": "kaggle", "sprop 2": True} + g.add_constant_properties(sprop) + assert g.properties.constant == sprop + + mg = g.materialize() + + assert mg.vertex(1).properties.get("type") == "wallet" + assert mg.vertex(4).properties == {"abc": "xyz"} + assert mg.vertex(4).properties.constant.get("abc") == "xyz" + assert mg.vertex(1).history() == [-1, 0, 1, 2] + assert mg.vertex(4).history() == [6, 8] + assert mg.vertices.id.collect() == [1, 2, 3, 4] + assert set(mg.edges().id) == {(1, 1), (1, 2), (1, 3), (2, 1), (3, 2), (2, 4)} + assert g.vertices.id.collect() == mg.vertices.id.collect() + assert set(g.edges().id) == set(mg.edges().id) + assert mg.vertex(1).properties.constant == {} + assert mg.vertex(4).properties.constant == {"abc": "xyz"} + assert g.edge(1, 2).id == (1, 2) + assert mg.edge(1, 2).id == (1, 2) + assert mg.has_edge(1, 2) + assert g.has_edge(1, 2) + assert mg.has_edge(2, 1) + assert g.has_edge(2, 1) + + sprop2 = {"sprop 3": 11, "sprop 4": 10} + mg.add_constant_properties(sprop2) + sprop.update(sprop2) + assert mg.properties.constant == sprop + + +def test_deletions(): + g = create_graph_with_deletions() + for e in edges: + assert g.at(e[0]).has_edge(e[1], e[2]) + + assert not g.window(start=11).has_edge(edges[0][1], edges[0][2]) + for e in edges[1:]: + assert g.window(start=11).has_edge(e[1], e[2]) + + assert list(g.edge(edges[0][1], edges[0][2]).explode().latest_time) == [10] + + +def test_load_from_pandas(): + import pandas as pd + + df = pd.DataFrame( + { + "src": [1, 2, 3, 4, 5], + "dst": [2, 3, 4, 5, 6], + "time": [1, 2, 3, 4, 5], + "weight": [1.0, 2.0, 3.0, 4.0, 5.0], + "marbles": ["red", "blue", "green", "yellow", "purple"], + } + ) + + g = Graph.load_from_pandas(df, "src", "dst", "time", ["weight", "marbles"]) + + assert g.vertices.id.collect() == [1, 2, 3, 4, 5, 6] + edges = [] + for e in g.edges(): + weight = e["weight"] + marbles = 
e["marbles"] + edges.append((e.src.id, e.dst.id, weight, marbles)) + + assert edges == [ + (1, 2, 1.0, "red"), + (2, 3, 2.0, "blue"), + (3, 4, 3.0, "green"), + (4, 5, 4.0, "yellow"), + (5, 6, 5.0, "purple"), + ] + + +def test_load_from_pandas_into_existing_graph(): + edges_df = pd.DataFrame( + { + "src": [1, 2, 3, 4, 5], + "dst": [2, 3, 4, 5, 6], + "time": [1, 2, 3, 4, 5], + "weight": [1.0, 2.0, 3.0, 4.0, 5.0], + "marbles": ["red", "blue", "green", "yellow", "purple"], + } + ) + + vertices_df = pd.DataFrame( + { + "id": [1, 2, 3, 4, 5, 6], + "name": ["Alice", "Bob", "Carol", "Dave", "Eve", "Frank"], + "time": [1, 2, 3, 4, 5, 6], + } + ) + + g = Graph() + + g.load_vertices_from_pandas(vertices_df, "id", "time", ["name"]) + + g.load_edges_from_pandas(edges_df, "src", "dst", "time", ["weight", "marbles"]) + + assert g.vertices.id.collect() == [1, 2, 3, 4, 5, 6] + edges = [] + for e in g.edges(): + weight = e["weight"] + marbles = e["marbles"] + edges.append((e.src.id, e.dst.id, weight, marbles)) + + assert edges == [ + (1, 2, 1.0, "red"), + (2, 3, 2.0, "blue"), + (3, 4, 3.0, "green"), + (4, 5, 4.0, "yellow"), + (5, 6, 5.0, "purple"), + ] + + vertices = [] + for v in g.vertices: + name = v["name"] + vertices.append((v.id, name)) + + assert vertices == [ + (1, "Alice"), + (2, "Bob"), + (3, "Carol"), + (4, "Dave"), + (5, "Eve"), + (6, "Frank"), + ] + + +def test_load_from_pandas_vertices(): + edges_df = pd.DataFrame( + { + "src": [1, 2, 3, 4, 5], + "dst": [2, 3, 4, 5, 6], + "time": [1, 2, 3, 4, 5], + "weight": [1.0, 2.0, 3.0, 4.0, 5.0], + "marbles": ["red", "blue", "green", "yellow", "purple"], + } + ) + + vertices_df = pd.DataFrame( + { + "id": [1, 2, 3, 4, 5, 6], + "name": ["Alice", "Bob", "Carol", "Dave", "Eve", "Frank"], + "time": [1, 2, 3, 4, 5, 6], + } + ) + + g = Graph.load_from_pandas( + edges_df, + src="src", + dst="dst", + time="time", + props=["weight", "marbles"], + vertex_df=vertices_df, + vertex_col="id", + vertex_time_col="time", + vertex_props=["name"], + 
) + + assert g.vertices.id.collect() == [1, 2, 3, 4, 5, 6] + edges = [] + for e in g.edges(): + weight = e["weight"] + marbles = e["marbles"] + edges.append((e.src.id, e.dst.id, weight, marbles)) + + assert edges == [ + (1, 2, 1.0, "red"), + (2, 3, 2.0, "blue"), + (3, 4, 3.0, "green"), + (4, 5, 4.0, "yellow"), + (5, 6, 5.0, "purple"), + ] + + vertices = [] + for v in g.vertices: + name = v["name"] + vertices.append((v.id, name)) + + assert vertices == [ + (1, "Alice"), + (2, "Bob"), + (3, "Carol"), + (4, "Dave"), + (5, "Eve"), + (6, "Frank"), + ] + + +def test_load_from_pandas_with_types(): + edges_df = pd.DataFrame( + { + "src": [1, 2, 3, 4, 5], + "dst": [2, 3, 4, 5, 6], + "time": [1, 2, 3, 4, 5], + "weight": [1.0, 2.0, 3.0, 4.0, 5.0], + "marbles": ["red", "blue", "green", "yellow", "purple"], + "marbles_const": ["red", "blue", "green", "yellow", "purple"], + "layers": ["layer 1", "layer 2", "layer 3", "layer 4", "layer 5"], + } + ) + vertices_df = pd.DataFrame( + { + "id": [1, 2, 3, 4, 5, 6], + "name": ["Alice", "Bob", "Carol", "Dave", "Eve", "Frank"], + "time": [1, 2, 3, 4, 5, 6], + "type": [ + "Person 1", + "Person 2", + "Person 3", + "Person 4", + "Person 5", + "Person 6", + ], + } + ) + g = Graph() + g.load_vertices_from_pandas( + vertices_df, + "id", + "time", + ["name"], + shared_const_props={"type": "Person", "tag": "test_tag"}, + ) + assert g.vertices.properties.constant.get("type").collect() == [ + "Person", + "Person", + "Person", + "Person", + "Person", + "Person", + ] + assert g.vertices.properties.constant.get("tag").collect() == [ + "test_tag", + "test_tag", + "test_tag", + "test_tag", + "test_tag", + "test_tag", + ] + + g = Graph() + g.load_vertices_from_pandas( + vertices_df, "id", "time", ["name"], const_props=["type"] + ) + assert g.vertices.properties.constant.get("type").collect() == [ + "Person 1", + "Person 2", + "Person 3", + "Person 4", + "Person 5", + "Person 6", + ] + + g = Graph() + g.load_edges_from_pandas( + edges_df, + "src", + 
"dst", + "time", + ["weight", "marbles"], + const_props=["marbles_const"], + shared_const_props={"type": "Edge", "tag": "test_tag"}, + layer="test_layer", + ) + + assert g.layers(["test_layer"]).edges().src.id.collect() == [1, 2, 3, 4, 5] + assert g.edges().properties.constant.get("type").collect() == [ + {"test_layer": "Edge"}, + {"test_layer": "Edge"}, + {"test_layer": "Edge"}, + {"test_layer": "Edge"}, + {"test_layer": "Edge"}, + ] + assert g.edges().properties.constant.get("tag").collect() == [ + {"test_layer": "test_tag"}, + {"test_layer": "test_tag"}, + {"test_layer": "test_tag"}, + {"test_layer": "test_tag"}, + {"test_layer": "test_tag"}, + ] + assert g.edges().properties.constant.get("marbles_const").collect() == [ + {"test_layer": "red"}, + {"test_layer": "blue"}, + {"test_layer": "green"}, + {"test_layer": "yellow"}, + {"test_layer": "purple"}, + ] + + g = Graph() + g.load_edges_from_pandas( + edges_df, "src", "dst", "time", ["weight", "marbles"], layer_in_df="layers" + ) + assert g.layers(["layer 1"]).edges().src.id.collect() == [1] + assert g.layers(["layer 1", "layer 2"]).edges().src.id.collect() == [1, 2] + assert g.layers(["layer 1", "layer 2", "layer 3"]).edges().src.id.collect() == [ + 1, + 2, + 3, + ] + assert g.layers(["layer 1", "layer 4", "layer 5"]).edges().src.id.collect() == [ + 1, + 4, + 5, + ] + + g = Graph.load_from_pandas( + edges_df, + "src", + "dst", + "time", + layer="test_layer", + vertex_df=vertices_df, + vertex_col="id", + vertex_time_col="time", + vertex_props=["name"], + vertex_shared_const_props={"type": "Person"}, + ) + assert g.vertices.properties.constant.get("type").collect() == [ + "Person", + "Person", + "Person", + "Person", + "Person", + "Person", + ] + assert g.layers(["test_layer"]).edges().src.id.collect() == [1, 2, 3, 4, 5] + + g = Graph.load_from_pandas( + edges_df, + "src", + "dst", + "time", + layer_in_df="layers", + vertex_df=vertices_df, + vertex_col="id", + vertex_time_col="time", + vertex_props=["name"], + 
vertex_const_props=["type"], + ) + assert g.vertices.properties.constant.get("type").collect() == [ + "Person 1", + "Person 2", + "Person 3", + "Person 4", + "Person 5", + "Person 6", + ] + assert g.layers(["layer 1"]).edges().src.id.collect() == [1] + assert g.layers(["layer 1", "layer 2"]).edges().src.id.collect() == [1, 2] + assert g.layers(["layer 1", "layer 2", "layer 3"]).edges().src.id.collect() == [ + 1, + 2, + 3, + ] + assert g.layers(["layer 1", "layer 4", "layer 5"]).edges().src.id.collect() == [ + 1, + 4, + 5, + ] + + g = Graph.load_from_pandas( + edges_df, + src="src", + dst="dst", + time="time", + props=["weight", "marbles"], + vertex_df=vertices_df, + vertex_col="id", + vertex_time_col="time", + vertex_props=["name"], + layer_in_df="layers", + ) + + g.load_vertex_props_from_pandas( + vertices_df, "id", const_props=["type"], shared_const_props={"tag": "test_tag"} + ) + assert g.vertices.properties.constant.get("type").collect() == [ + "Person 1", + "Person 2", + "Person 3", + "Person 4", + "Person 5", + "Person 6", + ] + assert g.vertices.properties.constant.get("tag").collect() == [ + "test_tag", + "test_tag", + "test_tag", + "test_tag", + "test_tag", + "test_tag", + ] + + g.load_edge_props_from_pandas( + edges_df, + "src", + "dst", + const_props=["marbles_const"], + shared_const_props={"tag": "test_tag"}, + layer_in_df="layers", + ) + assert g.layers(["layer 1", "layer 2", "layer 3"]).edges().properties.constant.get( + "marbles_const" + ).collect() == [{"layer 1": "red"}, {"layer 2": "blue"}, {"layer 3": "green"}] + assert g.edges().properties.constant.get("tag").collect() == [ + {"layer 1": "test_tag"}, + {"layer 2": "test_tag"}, + {"layer 3": "test_tag"}, + {"layer 4": "test_tag"}, + {"layer 5": "test_tag"}, + ] + + +def test_edge_layer(): + g = Graph() + g.add_edge(1, 1, 2, layer="layer 1").add_constant_properties( + {"test_prop": "test_val"} + ) + g.add_edge(1, 2, 3, layer="layer 2").add_constant_properties( + {"test_prop": "test_val 2"} + ) + 
assert g.edges().properties.constant.get("test_prop") == [ + {"layer 1": "test_val"}, + {"layer 2": "test_val 2"}, + ] + + +def test_layers_earliest_time(): + g = Graph() + e = g.add_edge(1, 1, 2, layer="test") + e = g.edge(1, 2) + print(e) + assert e.earliest_time == 1 + + +def test_layers_earliest_time(): + g = Graph() + e = g.add_edge(1, 1, 2, layer="test") + e = g.edge(1, 2) + print(e) + assert e.earliest_time == 1 + + +def test_edge_explode_layers(): + g = Graph() + g.add_edge(1, 1, 2, {"layer": 1}, layer="1") + g.add_edge(1, 1, 2, {"layer": 2}, layer="2") + g.add_edge(1, 2, 1, {"layer": 1}, layer="1") + g.add_edge(1, 2, 1, {"layer": 2}, layer="2") + + layered_edges = g.edge(1, 2).explode_layers() + e_layers = [ee.layer_names for ee in layered_edges] + e_layer_prop = [[str(ee.properties["layer"])] for ee in layered_edges] + assert e_layers == e_layer_prop + print(e_layers) + + nested_layered_edges = g.vertices.out_edges.explode_layers() + e_layers = [[ee.layer_names for ee in edges] for edges in nested_layered_edges] + e_layer_prop = [ + [[str(ee.properties["layer"])] for ee in layered_edges] + for layered_edges in nested_layered_edges + ] + assert e_layers == e_layer_prop + print(e_layers) + + print(g.vertices.out_neighbours.collect) + nested_layered_edges = g.vertices.out_neighbours.out_edges.explode_layers() + print(nested_layered_edges) + e_layers = [ + [ee.layer_names for ee in layered_edges] + for layered_edges in nested_layered_edges + ] + e_layer_prop = [ + [[str(ee.properties["layer"])] for ee in layered_edges] + for layered_edges in nested_layered_edges + ] + assert e_layers == e_layer_prop + print(e_layers) - assert view.start_date_time() == datetime.datetime(2014, 2, 2, 0, 0) - assert view.end_date_time() == datetime.datetime(2014, 2, 4, 0, 0) - assert view2.earliest_date_time() == datetime.datetime(2014, 2, 2, 0, 0) - assert view2.latest_date_time() == datetime.datetime(2014, 2, 5, 0, 0) +def test_hits_algorithm(): + g = graph_loader.lotr_graph() 
+ assert algorithms.hits(g).get("Aldor") == ( + 0.0035840950440615416, + 0.007476256228983402, + ) + - assert view2.vertex(1).start_date_time() == datetime.datetime(2014, 2, 2, 0, 0) - assert view2.vertex(1).end_date_time() == datetime.datetime(2014, 2, 5, 0, 0) +def test_balance_algorithm(): + g = Graph() + edges_str = [ + ("1", "2", 10.0, 1), + ("1", "4", 20.0, 2), + ("2", "3", 5.0, 3), + ("3", "2", 2.0, 4), + ("3", "1", 1.0, 5), + ("4", "3", 10.0, 6), + ("4", "1", 5.0, 7), + ("1", "5", 2.0, 8), + ] + for src, dst, val, time in edges_str: + g.add_edge(time, src, dst, {"value_dec": val}) + result = algorithms.balance(g, "value_dec", PyDirection("BOTH"), None).get_all() + assert result == {"1": -26.0, "2": 7.0, "3": 12.0, "4": 5.0, "5": 2.0} - assert view.vertex(2).earliest_date_time() == datetime.datetime(2014, 2, 3, 0, 0) - assert view.vertex(2).latest_date_time() == datetime.datetime(2014, 2, 3, 0, 0) + result = algorithms.balance(g, "value_dec", PyDirection("IN"), None).get_all() + assert result == {"1": 6.0, "2": 12.0, "3": 15.0, "4": 20.0, "5": 2.0} + result = algorithms.balance(g, "value_dec", PyDirection("OUT"), None).get_all() + assert result == {"1": -32.0, "2": -5.0, "3": -3.0, "4": -15.0, "5": 0.0} diff --git a/python/tests/test_graphql.py b/python/tests/test_graphql.py new file mode 100644 index 0000000000..552e9901d5 --- /dev/null +++ b/python/tests/test_graphql.py @@ -0,0 +1,159 @@ +import sys +import tempfile + + +def test_graphQL(): + from raphtory import Graph + from raphtory import graphqlserver + import random + import string + import os + + g1 = Graph() + g1.add_edge(1, "ben", "hamza") + g1.add_edge(2, "haaroon", "hamza") + g1.add_edge(3, "ben", "haaroon") + + g2 = Graph() + g2 = Graph() + g2.add_edge(1, "Naomi", "Shivam") + g2.add_edge(2, "Shivam", "Pedro") + g2.add_edge(3, "Pedro", "Rachel") + graphs = {"g1": g1, "g2": g2} + + g3 = Graph() + g3.add_edge(1, "ben_saved", "hamza_saved") + g3.add_edge(2, "haaroon_saved", "hamza_saved") + 
g3.add_edge(3, "ben_saved", "haaroon_saved") + + g4 = Graph() + g4.add_edge(1, "Naomi_saved", "Shivam_saved") + g4.add_edge(2, "Shivam_saved", "Pedro_saved") + g4.add_edge(3, "Pedro_saved", "Rachel_saved") + + temp_dir = tempfile.mkdtemp() + + g3.save_to_file(temp_dir + "/g3") + g4.save_to_file(temp_dir + "/g4") + + map_server = graphqlserver.run_server(graphs=graphs, port=1736, daemon=True) + dir_server = graphqlserver.run_server(graph_dir=temp_dir, port=1737, daemon=True) + map_dir_server = graphqlserver.run_server( + graphs=graphs, graph_dir=temp_dir, port=1738, daemon=True + ) + + query_g1 = """{graph(name: "g1") {nodes {name}}}""" + query_g2 = """{graph(name: "g2") {nodes {name}}}""" + query_g3 = """{graph(name: "g3") {nodes {name}}}""" + query_g4 = """{graph(name: "g4") {nodes {name}}}""" + + assert str(map_server.query(query_g1)).replace( + " ", "" + ) == "{'graph': {'nodes': [{'name': 'ben'}, {'name': 'hamza'}, {'name': 'haaroon'}]}}".replace( + " ", "" + ) + assert str(map_server.query(query_g2)).replace( + " ", "" + ) == "{'graph': {'nodes': [{'name': 'Naomi'}, {'name': 'Shivam'}, {'name': 'Pedro'}, {'name': 'Rachel'}]}}".replace( + " ", "" + ) + assert str(dir_server.query(query_g3)).replace( + " ", "" + ) == "{'graph': {'nodes': [{'name': 'ben_saved'}, {'name': 'hamza_saved'}, {'name': 'haaroon_saved'}]}}".replace( + " ", "" + ) + assert str(dir_server.query(query_g4)).replace( + " ", "" + ) == "{'graph': {'nodes': [{'name': 'Naomi_saved'}, {'name': 'Shivam_saved'}, {'name': 'Pedro_saved'}, {'name': 'Rachel_saved'}]}}".replace( + " ", "" + ) + + assert str(map_dir_server.query(query_g1)).replace( + " ", "" + ) == "{'graph': {'nodes': [{'name': 'ben'}, {'name': 'hamza'}, {'name': 'haaroon'}]}}".replace( + " ", "" + ) + assert str(map_dir_server.query(query_g2)).replace( + " ", "" + ) == "{'graph': {'nodes': [{'name': 'Naomi'}, {'name': 'Shivam'}, {'name': 'Pedro'}, {'name': 'Rachel'}]}}".replace( + " ", "" + ) + assert 
str(map_dir_server.query(query_g4)).replace( + " ", "" + ) == "{'graph': {'nodes': [{'name': 'Naomi_saved'}, {'name': 'Shivam_saved'}, {'name': 'Pedro_saved'}, {'name': 'Rachel_saved'}]}}".replace( + " ", "" + ) + assert str(map_dir_server.query(query_g3)).replace( + " ", "" + ) == "{'graph': {'nodes': [{'name': 'ben_saved'}, {'name': 'hamza_saved'}, {'name': 'haaroon_saved'}]}}".replace( + " ", "" + ) + + +def test_graphqlclient(): + from raphtory import Graph + from raphtory import graphqlserver + from raphtory import graphqlclient + import os + + temp_dir = tempfile.mkdtemp() + + g1 = Graph() + g1.add_edge(1, "ben", "hamza") + g1.add_edge(2, "haaroon", "hamza") + g1.add_edge(3, "ben", "haaroon") + g1.save_to_file(temp_dir + "/g1.bincode") + + dir_server = graphqlserver.run_server(graph_dir=temp_dir, port=1739, daemon=True) + + # create a client + raphtory_client = graphqlclient.RaphtoryGraphQLClient(url="http://localhost:1739/") + + # load a graph into the client from a path + res = raphtory_client.load_graphs_from_path(temp_dir) + assert res == {"loadGraphsFromPath": ["g1.bincode"]} + + # run a get nodes query and check the results + query = """query GetNodes($graphname: String!) 
{ + graph(name: $graphname) { + nodes { + name + } + } + }""" + variables = {"graphname": "g1.bincode"} + res = raphtory_client.query(query, variables) + assert res == { + "graph": {"nodes": [{"name": "ben"}, {"name": "hamza"}, {"name": "haaroon"}]} + } + + # load a new graph into the client from a path + multi_graph_temp_dir = tempfile.mkdtemp() + g2 = Graph() + g2.add_edge(1, "ben", "hamza") + g2.add_edge(2, "haaroon", "hamza") + g2.save_to_file(multi_graph_temp_dir + "/g2.bincode") + g3 = Graph() + g3.add_edge(1, "shivam", "rachel") + g3.add_edge(2, "lucas", "shivam") + g3.save_to_file(multi_graph_temp_dir + "/g3.bincode") + res = raphtory_client.load_new_graphs_from_path(multi_graph_temp_dir) + result_sorted = {"loadNewGraphsFromPath": sorted(res["loadNewGraphsFromPath"])} + assert result_sorted == {"loadNewGraphsFromPath": ["g2.bincode", "g3.bincode"]} + + # upload a graph + g4 = Graph() + g4.add_vertex(0, 1) + res = raphtory_client.send_graph("hello", g4) + assert res == {"sendGraph": "hello"} + # Ensure the sent graph can be queried + query = """query GetNodes($graphname: String!) 
{ + graph(name: $graphname) { + nodes { + name + } + } + }""" + variables = {"graphname": "hello"} + res = raphtory_client.query(query, variables) + assert res == {"graph": {"nodes": [{"name": "1"}]}} diff --git a/python/tests/test_iterables.py b/python/tests/test_iterables.py new file mode 100644 index 0000000000..7a0045b700 --- /dev/null +++ b/python/tests/test_iterables.py @@ -0,0 +1,253 @@ +import math +import sys + +import pandas as pd +import pandas.core.frame +import pytest +from raphtory import Graph, GraphWithDeletions, PyDirection +from raphtory import algorithms +from raphtory import graph_loader +import tempfile +from math import isclose +import datetime + + +def test_pyprophistvaluelist(): + g = Graph() + edges_str = [ + ("1", "2", 10, 1), + ("1", "2", 10, 1), + ("1", "4", 20, 2), + ("2", "3", 5, 3), + ("3", "2", 2, 4), + ("3", "1", 1, 5), + ("4", "3", 10, 6), + ("4", "1", 5, 7), + ("1", "5", 2, 8), + ] + for src, dst, val, time in edges_str: + g.add_edge(time, src, dst, {"value_dec": val}) + + v = g.vertex("1") + res = sorted(v.out_edges.properties.temporal.get("value_dec").values().sum()) + assert res == [2, 20, 20] + + res = sorted(v.out_edges.properties.temporal.get("value_dec").values().count()) + assert res == [1, 1, 2] + + res = v.out_edges.properties.temporal.get("value_dec").values().sum().sum() + assert res == 42 + + res = v.out_edges.properties.temporal.get("value_dec").values().count().sum() + assert res == 4 + + g = Graph() + edges_str = [ + ("1", "2", 10, 1), + ("1", "2", 10, 2), + ("1", "2", 100, 3), + ("1", "4", 20, 2), + ("2", "3", 5, 3), + ("3", "2", 2, 4), + ("3", "1", 1, 5), + ("4", "3", 10, 6), + ("4", "1", 5, 7), + ("1", "5", 2, 8), + ("1", "5", 1, 9), + ("1", "5", 5, 10), + ] + for src, dst, val, time in edges_str: + g.add_edge(time, src, dst, {"value_dec": val}) + v = g.vertex("1") + res = v.out_edges.properties.temporal.get( + "value_dec" + ).values() # PyPropHistValueList([[10, 10, 10], [20], [2]]) + assert res.sum() == [120, 
20, 8] + assert res.min() == [10, 20, 1] + assert res.max() == [100, 20, 5] + assert sorted(res.count()) == [1, 3, 3] + assert res.median() == [10, 20, 2] + assert list(res.mean()) == [40, 20, 8 / 3] + assert list(res.average()) == [40, 20, 8 / 3] + + +def test_empty_lists(): + # This checks that empty lists are handled correctly on all python property types + g = Graph() + edges_str = [ + ("1", "2", 10, 1), + ("1", "2", 10, 1), + ("1", "4", 20, 2), + ("2", "3", 5, 3), + ("3", "2", 2, 4), + ("3", "1", 1, 5), + ("4", "3", 10, 6), + ("4", "1", 5, 7), + ("1", "5", 2, 8), + ] + for src, dst, val, time in edges_str: + g.add_edge(time, src, dst, {"value_dec": val}) + assert ( + g.vertices + .out_edges.properties.temporal.get("value_dec") + .values() + .median() + .median() + .median() + == 5 + ) + assert ( + g.vertices + .out_edges.properties.temporal.get("value_dec") + .values() + .mean() + .mean() + .mean() + == 1.3333333333333335 + ) + + +def test_propiterable(): + import raphtory + + g = raphtory.Graph() + edges_str = [ + ("1", "2", 10, 1), + ("1", "2", 10, 1), + ("1", "2", 10, 1), + ("1", "4", 20, 2), + ("2", "3", 5, 3), + ("3", "2", 2, 4), + ("3", "1", 1, 5), + ("4", "3", 10, 6), + ("4", "1", 5, 7), + ("1", "5", 2, 8), + ] + for src, dst, val, time in edges_str: + g.add_edge(time, src, dst, {"value_dec": val}) + + v = g.vertex("1") + result = v.out_edges.properties.temporal.get("value_dec").values().flatten() + assert sorted(result) == [2, 10, 10, 10, 20] + assert result.sum() == 52 + assert result.median() == 10 + assert result.mean() == 10.4 + assert result.average() == 10.4 + assert result.min() == 2 + assert result.max() == 20 + assert result.count() == 5 + + assert v.out_edges.properties.get("value_dec").sum() == 32 + assert v.out_edges.properties.get("value_dec").median() == 10 + + total = g.vertices.in_edges.properties.get("value_dec").sum() + assert sorted(total) == [2, 6, 12, 15, 20] + + total = g.vertices.edges.properties.get("value_dec").sum() + assert 
sorted(total) == [2, 17, 18, 35, 38] + + total = dict( + zip(g.vertices.id, g.vertices.out_edges.properties.get("value_dec").sum()) + ) + assert total == {1: 32, 2: 5, 3: 3, 4: 15, 5: None} + + total = g.vertices.out_edges.properties.get("value_dec").sum().sum() + assert total == 55 + + total = g.vertices.out_edges.properties.get("value_dec").sum().median() + assert total == 5 + + total = g.vertices.out_edges.properties.get("value_dec").sum().drop_none() + assert sorted(total) == [3, 5, 15, 32] + + total = g.vertices.out_edges.properties.get("value_dec").median() + assert list(total) == [10, 5, 10, 2, None] + + total = g.vertex("1").in_edges.properties.get("value_dec").sum() + assert total == 6 + + total = g.vertex("1").in_edges.properties.get("value_dec").median() + assert total == 5 + + +def test_pypropvalue_list_listlist(): + g = Graph() + edges_str = [ + ("1", "2", 10, 1), + ("1", "2", 10, 2), + ("1", "2", 100, 3), + ("1", "4", 20, 2), + ("2", "3", 5, 3), + ("3", "2", 2, 4), + ("3", "1", 1, 5), + ("4", "3", 10, 6), + ("4", "1", 5, 7), + ("1", "5", 2, 8), + ("1", "5", 1, 9), + ("1", "5", 5, 10), + ] + for src, dst, val, time in edges_str: + g.add_edge(time, src, dst, {"value_dec": val}) + v = g.vertex("1") + res = g.edges().properties.get( + "value_dec" + ) # PyPropValueList([100, 20, 5, 5, 5, 10, 1, 2]) + res_v = v.edges.properties.get("value_dec") # PyPropValueList([100, 5, 20, 1, 5]) + res_ll = g.vertices.edges.properties.get("value_dec") + + assert res.sum() == 148 + assert res_v.sum() == 131 + assert res_ll.sum() == [131, 107, 35, 18, 5] + + assert res.median() == 5 + assert res_v.median() == 5 + assert res_ll.median() == [5, 5, 10, 5, 5] + + assert res.min() == 1 + assert res_v.min() == 1 + assert res_ll.min() == [1, 2, 5, 1, 5] + + assert res.max() == 100 + assert res_v.max() == 100 + assert res_ll.max() == [100, 100, 20, 10, 5] + + assert res.count() == 8 + assert res_v.count() == 5 + assert res_ll.count() == [5, 3, 3, 4, 1] + + assert res.mean() == 
res.average() == 18.5 + assert res_v.mean() == res_v.average() == 26.2 + assert ( + res_ll.mean() + == res_ll.average() + == [26.2, 35.666666666666664, 11.666666666666666, 4.5, 5.0] + ) + + +def test_pytemporalprops(): + g = Graph() + edges_str = [ + ("1", "2", 10, 1), + ("1", "2", 10, 2), + ("1", "2", 100, 3), + ("1", "4", 20, 2), + ("2", "3", 5, 3), + ("3", "2", 2, 4), + ("3", "1", 1, 5), + ("4", "3", 10, 6), + ("4", "1", 5, 7), + ("1", "5", 2, 8), + ("1", "5", 1, 9), + ("1", "5", 5, 10), + ] + for src, dst, val, time in edges_str: + g.add_edge(time, src, dst, {"value_dec": val}) + v = g.vertex("1") + res = list(v.out_edges)[0].properties.temporal.get("value_dec") + + assert res.sum() == 120 + assert res.min() == (1, 10) + assert res.max() == (3, 100) + assert res.count() == 3 + assert res.mean() == res.average() == 40.0 + assert res.median() == (2, 10) diff --git a/raphtory-benchmark/Cargo.toml b/raphtory-benchmark/Cargo.toml index 92ecb9c65f..bc89d1c4eb 100644 --- a/raphtory-benchmark/Cargo.toml +++ b/raphtory-benchmark/Cargo.toml @@ -7,8 +7,7 @@ edition = "2021" [dependencies] criterion = "0.4" -raphtory = { path = "../raphtory" } -raphtory-io = { path = "../raphtory-io" } +raphtory = { path = "../raphtory" , features=["io"]} sorted_vector_map = "0.1" rand = "0.8.5" rayon = "1" diff --git a/raphtory-benchmark/benches/algobench.rs b/raphtory-benchmark/benches/algobench.rs index 0e9663d35a..fae8bd1eb2 100644 --- a/raphtory-benchmark/benches/algobench.rs +++ b/raphtory-benchmark/benches/algobench.rs @@ -1,10 +1,14 @@ use crate::common::bench; use criterion::{criterion_group, criterion_main, Criterion}; -use raphtory::algorithms::local_clustering_coefficient::local_clustering_coefficient; -use raphtory::algorithms::local_triangle_count::local_triangle_count; -use raphtory::db::graph::Graph; -use raphtory::db::view_api::*; +use raphtory::{ + algorithms::{ + local_clustering_coefficient::local_clustering_coefficient, + local_triangle_count::local_triangle_count, + 
}, + prelude::*, +}; use rayon::prelude::*; + mod common; //TODO swap to new trianglecount @@ -26,7 +30,7 @@ pub fn local_triangle_count_analysis(c: &mut Criterion) { let mut group = c.benchmark_group("local_triangle_count"); group.sample_size(10); bench(&mut group, "local_triangle_count", None, |b| { - let g = raphtory_io::graph_loader::example::lotr_graph::lotr_graph(1); + let g = raphtory::graph_loader::example::lotr_graph::lotr_graph(); let windowed_graph = g.window(i64::MIN, i64::MAX); b.iter(|| { @@ -45,7 +49,7 @@ pub fn local_clustering_coefficient_analysis(c: &mut Criterion) { let mut group = c.benchmark_group("local_clustering_coefficient"); bench(&mut group, "local_clustering_coefficient", None, |b| { - let g: Graph = Graph::new(1); + let g: Graph = Graph::new(); let windowed_graph = g.window(0, 5); let vs = vec![ @@ -75,7 +79,7 @@ pub fn local_clustering_coefficient_analysis(c: &mut Criterion) { ]; for (src, dst, t) in &vs { - g.add_edge(*t, *src, *dst, &vec![], None).unwrap(); + g.add_edge(*t, *src, *dst, NO_PROPS, None).unwrap(); } b.iter(|| local_clustering_coefficient(&windowed_graph, 1)) diff --git a/raphtory-benchmark/benches/base.rs b/raphtory-benchmark/benches/base.rs index 8a984dc0e3..29bcd29543 100644 --- a/raphtory-benchmark/benches/base.rs +++ b/raphtory-benchmark/benches/base.rs @@ -1,5 +1,6 @@ -use crate::common::{bootstrap_graph, run_large_ingestion_benchmarks}; +use crate::common::{bootstrap_graph, run_analysis_benchmarks, run_large_ingestion_benchmarks}; use criterion::{criterion_group, criterion_main, Criterion, Throughput}; +use raphtory::{graph_loader::example::lotr_graph::lotr_graph, prelude::*}; mod common; @@ -18,8 +19,31 @@ pub fn base(c: &mut Criterion) { large_group.throughput(Throughput::Elements(1_000)); large_group.measurement_time(std::time::Duration::from_secs(3)); // Make an option of None - run_large_ingestion_benchmarks(&mut large_group, || bootstrap_graph(4, 10000), None); + run_large_ingestion_benchmarks(&mut 
large_group, || bootstrap_graph(10000), None); large_group.finish(); + let mut graph_group = c.benchmark_group("lotr_graph"); + let graph = lotr_graph(); + run_analysis_benchmarks(&mut graph_group, || graph.clone(), None); + graph_group.finish(); + let mut graph_window_group_100 = c.benchmark_group("lotr_graph_window_100"); + graph_window_group_100.sample_size(10); + run_analysis_benchmarks( + &mut graph_window_group_100, + || graph.window(i64::MIN, i64::MAX), + None, + ); + graph_window_group_100.finish(); + let mut graph_window_group_10 = c.benchmark_group("lotr_graph_window_10"); + let latest = graph.end().expect("non-empty graph"); + let earliest = graph.start().expect("non-empty graph"); + let start = latest - (latest - earliest) / 10; + graph_window_group_10.sample_size(10); + run_analysis_benchmarks( + &mut graph_window_group_10, + || graph.window(start, latest + 1), + None, + ); + graph_window_group_10.finish(); } criterion_group!(benches, base); diff --git a/raphtory-benchmark/benches/common/mod.rs b/raphtory-benchmark/benches/common/mod.rs index c15390c148..1103a0c47e 100644 --- a/raphtory-benchmark/benches/common/mod.rs +++ b/raphtory-benchmark/benches/common/mod.rs @@ -1,8 +1,8 @@ +#![allow(dead_code)] + use criterion::{measurement::WallTime, BatchSize, Bencher, BenchmarkGroup, BenchmarkId}; -use rand::seq::*; -use rand::{distributions::Uniform, Rng}; -use raphtory::db::graph::Graph; -use raphtory::db::view_api::*; +use rand::{distributions::Uniform, seq::*, Rng}; +use raphtory::prelude::*; use std::collections::HashSet; fn make_index_gen() -> Box> { @@ -17,8 +17,8 @@ fn make_time_gen() -> Box> { Box::new(rng.sample_iter(range)) } -pub fn bootstrap_graph(num_shards: usize, num_vertices: usize) -> Graph { - let graph = Graph::new(num_shards); +pub fn bootstrap_graph(num_vertices: usize) -> Graph { + let graph = Graph::new(); let mut indexes = make_index_gen(); let mut times = make_time_gen(); let num_edges = num_vertices / 2; @@ -26,7 +26,9 @@ pub fn 
bootstrap_graph(num_shards: usize, num_vertices: usize) -> Graph { let source = indexes.next().unwrap(); let target = indexes.next().unwrap(); let time = times.next().unwrap(); - graph.add_edge(time, source, target, &vec![], None).unwrap(); + graph + .add_edge(time, source, target, NO_PROPS, None) + .unwrap(); } graph } @@ -68,7 +70,7 @@ pub fn run_ingestion_benchmarks( |b: &mut Bencher| { b.iter_batched_ref( || (make_graph(), time_sample()), - |(g, t): &mut (Graph, i64)| g.add_vertex(*t, 0, &vec![]), + |(g, t): &mut (Graph, i64)| g.add_vertex(*t, 0, NO_PROPS), BatchSize::SmallInput, ) }, @@ -80,7 +82,7 @@ pub fn run_ingestion_benchmarks( |b: &mut Bencher| { b.iter_batched_ref( || (make_graph(), index_sample()), - |(g, v): &mut (Graph, u64)| g.add_vertex(0, *v, &vec![]), + |(g, v): &mut (Graph, u64)| g.add_vertex(0, *v, NO_PROPS), BatchSize::SmallInput, ) }, @@ -92,7 +94,7 @@ pub fn run_ingestion_benchmarks( |b: &mut Bencher| { b.iter_batched_ref( || (make_graph(), time_sample()), - |(g, t)| g.add_edge(*t, 0, 0, &vec![], None), + |(g, t)| g.add_edge(*t, 0, 0, NO_PROPS, None), BatchSize::SmallInput, ) }, @@ -104,7 +106,7 @@ pub fn run_ingestion_benchmarks( |b: &mut Bencher| { b.iter_batched_ref( || (make_graph(), index_sample(), index_sample()), - |(g, s, d)| g.add_edge(0, *s, *d, &vec![], None), + |(g, s, d)| g.add_edge(0, *s, *d, NO_PROPS, None), BatchSize::SmallInput, ) }, @@ -122,9 +124,6 @@ pub fn run_large_ingestion_benchmarks( ) where F: FnMut() -> Graph, { - let mut times_gen = make_time_gen(); - let mut time_sample = || times_gen.next().unwrap(); - let updates = 1000; bench( @@ -141,7 +140,7 @@ pub fn run_large_ingestion_benchmarks( }, |(g, times)| { for t in times.iter() { - g.add_edge(*t, 0, 0, &vec![], None).unwrap() + g.add_edge(*t, 0, 0, NO_PROPS, None).unwrap(); } }, BatchSize::SmallInput, @@ -163,7 +162,7 @@ pub fn run_large_ingestion_benchmarks( }, |(g, times)| { for t in times.iter() { - g.add_edge(*t, "0", "0", &vec![], None).unwrap() + 
g.add_edge(*t, "0", "0", NO_PROPS, None).unwrap(); } }, BatchSize::SmallInput, @@ -185,7 +184,7 @@ pub fn run_large_ingestion_benchmarks( }, |(g, times)| { for t in times.iter() { - g.add_edge(*t, "test", "other", &vec![], None).unwrap() + g.add_edge(*t, "test", "other", NO_PROPS, None).unwrap(); } }, BatchSize::SmallInput, @@ -213,10 +212,10 @@ pub fn run_large_ingestion_benchmarks( *t, src_gen.next().unwrap(), dst_gen.next().unwrap(), - &vec![], + NO_PROPS, None, ) - .unwrap() + .unwrap(); } }, BatchSize::SmallInput, @@ -244,10 +243,10 @@ pub fn run_large_ingestion_benchmarks( *t, src_gen.next().unwrap(), dst_gen.next().unwrap(), - &vec![], + NO_PROPS, None, ) - .unwrap() + .unwrap(); } }, BatchSize::SmallInput, @@ -273,13 +272,13 @@ pub fn run_analysis_benchmarks( let vertices: HashSet = graph.vertices().id().collect(); bench(group, "num_edges", parameter, |b: &mut Bencher| { - b.iter(|| graph.num_edges()) + b.iter(|| graph.count_edges()) }); bench(group, "has_edge_existing", parameter, |b: &mut Bencher| { let mut rng = rand::thread_rng(); let edge = edges.iter().choose(&mut rng).expect("non-empty graph"); - b.iter(|| graph.has_edge(edge.0, edge.1, None)) + b.iter(|| graph.has_edge(edge.0, edge.1, Layer::All)) }); bench( @@ -297,12 +296,12 @@ pub fn run_analysis_benchmarks( break edge; } }; - b.iter(|| graph.has_edge(edge.0, edge.1, None)) + b.iter(|| graph.has_edge(edge.0, edge.1, Layer::All)) }, ); bench(group, "num_vertices", parameter, |b: &mut Bencher| { - b.iter(|| graph.num_vertices()) + b.iter(|| graph.count_vertices()) }); bench( diff --git a/raphtory-benchmark/benches/edge_add.rs b/raphtory-benchmark/benches/edge_add.rs index d6c9572a83..6f8c3118e7 100644 --- a/raphtory-benchmark/benches/edge_add.rs +++ b/raphtory-benchmark/benches/edge_add.rs @@ -1,10 +1,11 @@ use criterion::{criterion_group, criterion_main, Criterion}; -use raphtory::core::vertex::InputVertex; -use raphtory::db::graph::Graph; +use 
raphtory::{core::entities::vertices::input_vertex::InputVertex, prelude::*}; mod common; -use rand::distributions::{Alphanumeric, DistString}; -use rand::{thread_rng, Rng}; +use rand::{ + distributions::{Alphanumeric, DistString}, + thread_rng, Rng, +}; fn random_string(n: usize) -> String { Alphanumeric.sample_string(&mut rand::thread_rng(), n) @@ -30,12 +31,12 @@ pub fn graph(c: &mut Criterion) { id_group.finish(); let mut graph_group = c.benchmark_group("edge_add"); - let mut g = Graph::new(1); + let g = Graph::new(); graph_group.bench_function("string input", |bencher| { let src: String = random_string(16); let dst: String = random_string(16); let t: i64 = thread_rng().gen(); - bencher.iter(|| g.add_edge(t, src.clone(), dst.clone(), &vec![], None)) + bencher.iter(|| g.add_edge(t, src.clone(), dst.clone(), NO_PROPS, None)) }); graph_group.finish(); } diff --git a/raphtory-benchmark/benches/graph_ops.rs b/raphtory-benchmark/benches/graph_ops.rs index bb9eefbddc..962d009b42 100644 --- a/raphtory-benchmark/benches/graph_ops.rs +++ b/raphtory-benchmark/benches/graph_ops.rs @@ -1,13 +1,12 @@ use common::run_analysis_benchmarks; use criterion::{criterion_group, criterion_main, Criterion}; -use raphtory::db::view_api::*; -use raphtory_io::graph_loader::example::sx_superuser_graph::sx_superuser_graph; +use raphtory::{db::api::view::*, graph_loader::example::sx_superuser_graph::sx_superuser_graph}; mod common; pub fn graph(c: &mut Criterion) { let mut graph_group = c.benchmark_group("analysis_graph"); - let graph = sx_superuser_graph(2).unwrap(); + let graph = sx_superuser_graph().unwrap(); run_analysis_benchmarks(&mut graph_group, || graph.clone(), None); graph_group.finish(); let mut graph_window_group_100 = c.benchmark_group("analysis_graph_window_100"); diff --git a/raphtory-benchmark/benches/parameterized.rs b/raphtory-benchmark/benches/parameterized.rs index d23057f8db..843a04fe8f 100644 --- a/raphtory-benchmark/benches/parameterized.rs +++ 
b/raphtory-benchmark/benches/parameterized.rs @@ -12,7 +12,7 @@ pub fn parameterized(c: &mut Criterion) { let mut ingestion_group = c.benchmark_group("ingestion-num_vertices"); ingestion_group.plot_config(PlotConfiguration::default().summary_scale(AxisScale::Logarithmic)); for num_vertices in vertices { - let make_graph = || bootstrap_graph(4, num_vertices); + let make_graph = || bootstrap_graph(num_vertices); ingestion_group.throughput(Throughput::Elements(num_vertices as u64)); ingestion_group.sample_size(10); ingestion_group.warm_up_time(std::time::Duration::from_secs(1)); diff --git a/raphtory-benchmark/benches/tgraph_benchmarks.rs b/raphtory-benchmark/benches/tgraph_benchmarks.rs index d4b2009ff4..93f0f54897 100644 --- a/raphtory-benchmark/benches/tgraph_benchmarks.rs +++ b/raphtory-benchmark/benches/tgraph_benchmarks.rs @@ -1,9 +1,8 @@ -use std::collections::BTreeSet; - use criterion::{criterion_group, criterion_main, BenchmarkId, Criterion, Throughput}; use rand::{distributions::Uniform, Rng}; -use raphtory::core::{lsm::LSMSet, tadjset::TAdjSet}; +use raphtory::core::entities::vertices::structure::adjset::AdjSet; use sorted_vector_map::SortedVectorSet; +use std::collections::BTreeSet; fn btree_set_u64(c: &mut Criterion) { let mut group = c.benchmark_group("btree_set_u64_range_insert"); @@ -28,20 +27,6 @@ fn btree_set_u64(c: &mut Criterion) { }, ); - group.bench_with_input( - BenchmarkId::new("LSMTree with u64", size), - &init_vals, - |b, vals| { - b.iter(|| { - let mut bs = LSMSet::default(); - for v in vals.iter() { - bs.find(*v); - bs.insert(*v); - } - }); - }, - ); - group.bench_with_input( BenchmarkId::new("SortedVec with u64", size), &init_vals, @@ -80,7 +65,7 @@ fn bm_tadjset(c: &mut Criterion) { .take(*size as usize) .collect(); - let mut tadjset = TAdjSet::default(); + let mut tadjset = AdjSet::default(); group.bench_with_input( BenchmarkId::new("TAdjSet insert", size), diff --git a/raphtory-graphql/Cargo.toml b/raphtory-graphql/Cargo.toml index 
c34d79eebf..1b6192e23e 100644 --- a/raphtory-graphql/Cargo.toml +++ b/raphtory-graphql/Cargo.toml @@ -13,29 +13,35 @@ readme.workspace = true homepage.workspace = true [dependencies] -raphtory = { path = "../raphtory", version = "0.4.0" } - +raphtory = { path = "../raphtory", version = "0.5.7", features = ['vectors'] } +bincode = "1" +base64 = "0.21.2" +thiserror = "1.0.44" dotenv = "0.15.0" itertools = "0.10" serde = {version = "1.0.147", features = ["derive"]} once_cell = "1.17.2" - poem = "1.3.48" tokio = {version = "1.18.2", features = ["full"]} - async-graphql = {version = "5.0.5", features = ["dynamic-schema"]} dynamic-graphql = "0.7.3" async-graphql-poem = "5.0.5" - +parking_lot = { version = "0.12" , features = ["serde", "arc_lock", "send_guard"] } futures-util = "0.3.0" async-stream = "0.3.0" - opentelemetry = {version = "0.18.0", features = ["rt-tokio"]} opentelemetry-jaeger = {version = "0.17.0", features = ["rt-tokio"]} tracing = "0.1.37" tracing-opentelemetry = "0.18.0" tracing-subscriber = {version = "0.3.16", features = ["std", "env-filter"]} +walkdir = "2" +ordered-float = "3.7.0" +uuid = "1.4.1" +async-openai = "0.14.0" +clap = { version = "4.3.11", features = ["derive"] } +chrono = { version = "0.4", features = ["serde"] } [dev-dependencies] serde_json = "1.0" +tempfile = "3.6.0" diff --git a/raphtory-graphql/src/data.rs b/raphtory-graphql/src/data.rs index aeedb3128b..87c353b026 100644 --- a/raphtory-graphql/src/data.rs +++ b/raphtory-graphql/src/data.rs @@ -1,32 +1,116 @@ -use raphtory::db::graph::Graph; -use std::collections::HashMap; -use std::fs; -use std::path::{Path, PathBuf}; +use parking_lot::RwLock; +use raphtory::{ + core::Prop, + prelude::{Graph, GraphViewOps, PropertyAdditionOps}, + search::IndexedGraph, + vectors::VectorizedGraph, +}; +use std::{ + collections::{HashMap, HashSet}, + path::Path, +}; +use walkdir::WalkDir; +#[derive(Default)] pub(crate) struct Data { - pub(crate) graphs: HashMap, + pub(crate) graphs: RwLock>>, + 
pub(crate) vector_stores: RwLock>>, } impl Data { - pub fn load(directory_path: &str) -> Self { - let paths = fs::read_dir(directory_path).unwrap_or_else(|_| { - panic!("path '{directory_path}' doesn't exist or it is not a directory") - }); - - let graphs = paths - .filter_map(|entry| { - let path:PathBuf = entry.unwrap().path(); - if path.is_dir(){ - let graph = Graph::load_from_file(&path).ok()?; - let filename = path.file_name()?.to_str()?.to_string(); - Some((filename, graph)) - } - else{ - None + pub fn from_map(graphs: HashMap) -> Self { + let graphs = RwLock::new(Self::convert_graphs(graphs)); + let vector_stores = RwLock::new(HashMap::new()); + Self { + graphs, + vector_stores, + } + } + + pub fn from_directory(directory_path: &str) -> Self { + let graphs = RwLock::new(Self::load_from_file(directory_path)); + let vector_stores = RwLock::new(HashMap::new()); + Self { + graphs, + vector_stores, + } + } + + pub fn from_map_and_directory(graphs: HashMap, directory_path: &str) -> Self { + let mut graphs = Self::convert_graphs(graphs); + graphs.extend(Self::load_from_file(directory_path)); + let graphs = RwLock::new(graphs); + let vector_stores = RwLock::new(HashMap::new()); + Self { + graphs, + vector_stores, + } + } + + fn convert_graphs(graphs: HashMap) -> HashMap> { + graphs + .into_iter() + .map(|(name, g)| { + ( + name, + IndexedGraph::from_graph(&g).expect("Unable to index graph"), + ) + }) + .collect() + } + + pub fn load_from_file(path: &str) -> HashMap> { + let mut valid_paths = HashSet::::new(); + + for entry in WalkDir::new(path).into_iter().filter_map(|e| e.ok()) { + let path = entry.path(); + let path_string = path.display().to_string(); + let filename = path.file_name().and_then(|name| name.to_str()); + if let Some(filename) = filename { + if path.is_file() && !filename.starts_with('.') { + valid_paths.insert(path_string); } + } + } + + let mut graphs_loaded: Vec = vec![]; + let mut is_graph_already_loaded = |graph_name: String| { + if 
graphs_loaded.contains(&graph_name) { + panic!("Graph by name {} is already loaded", graph_name); + } else { + graphs_loaded.push(graph_name); + } + }; + + let graphs: HashMap> = valid_paths + .into_iter() + .map(|path| { + println!("loading graph from {path}"); + let graph = Graph::load_from_file(&path).expect("Unable to load from graph"); + graph + .add_constant_properties([("path".to_string(), Prop::str(path.clone()))]) + .expect("Failed to add static property"); + let maybe_graph_name = graph.properties().get("name"); + + return match maybe_graph_name { + None => { + let graph_name = Path::new(&path).file_name().unwrap().to_str().unwrap(); + is_graph_already_loaded(graph_name.to_string()); + (graph_name.to_string(), graph) + } + Some(graph_name) => { + is_graph_already_loaded(graph_name.to_string()); + (graph_name.to_string(), graph) + } + }; + }) + .map(|(name, g)| { + ( + name, + IndexedGraph::from_graph(&g).expect("Unable to index graph"), + ) }) .collect(); - - Self { graphs } + graphs } } diff --git a/raphtory-graphql/src/embeddings.rs b/raphtory-graphql/src/embeddings.rs new file mode 100644 index 0000000000..439c7f3ae1 --- /dev/null +++ b/raphtory-graphql/src/embeddings.rs @@ -0,0 +1,19 @@ +use async_openai::{ + types::{CreateEmbeddingRequest, EmbeddingInput}, + Client, +}; +use itertools::Itertools; +use raphtory::vectors::Embedding; + +pub async fn openai_embedding(texts: Vec) -> Vec { + println!("computing embeddings for {} texts", texts.len()); + let client = Client::new(); + let request = CreateEmbeddingRequest { + model: "text-embedding-ada-002".to_owned(), + input: EmbeddingInput::StringArray(texts), + user: None, + }; + let response = client.embeddings().create(request).await.unwrap(); + println!("Generated embeddings successfully"); + response.data.into_iter().map(|e| e.embedding).collect_vec() +} diff --git a/raphtory-graphql/src/lib.rs b/raphtory-graphql/src/lib.rs index 80488e566e..64619c5a0c 100644 --- a/raphtory-graphql/src/lib.rs +++ 
b/raphtory-graphql/src/lib.rs @@ -1,31 +1,101 @@ -pub use crate::model::algorithm::Algorithm; -pub use crate::server::RaphtoryServer; +pub use crate::{model::algorithm::Algorithm, server::RaphtoryServer}; +use base64::{prelude::BASE64_URL_SAFE_NO_PAD, DecodeError, Engine}; +use raphtory::{core::utils::errors::GraphError, db::api::view::internal::MaterializedGraph}; +pub mod embeddings; mod model; mod observability; mod routes; -mod server; +pub mod server; mod data; +#[derive(thiserror::Error, Debug)] +pub enum UrlDecodeError { + #[error("Bincode operation failed")] + BincodeError { + #[from] + source: Box, + }, + #[error("Base64 decoding failed")] + DecodeError { + #[from] + source: DecodeError, + }, +} + +pub fn url_encode_graph>(graph: G) -> Result { + let g: MaterializedGraph = graph.into(); + Ok(BASE64_URL_SAFE_NO_PAD.encode(bincode::serialize(&g)?)) +} + +pub fn url_decode_graph>(graph: T) -> Result { + Ok(bincode::deserialize( + &BASE64_URL_SAFE_NO_PAD.decode(graph)?, + )?) +} #[cfg(test)] mod graphql_test { use super::*; - use dynamic_graphql::dynamic::DynamicRequestExt; - use dynamic_graphql::{App, FieldValue}; - use raphtory::db::graph::Graph; + use crate::{data::Data, model::App}; + use async_graphql::UploadValue; + use dynamic_graphql::{Request, Variables}; + use raphtory::{db::api::view::internal::IntoDynamic, prelude::*}; + use serde_json::json; use std::collections::HashMap; - use std::env; + use tempfile::tempdir; + + #[tokio::test] + async fn search_for_gandalf_query() { + let graph = Graph::new(); + graph + .add_vertex(0, "Gandalf", [("kind".to_string(), Prop::str("wizard"))]) + .expect("Could not add vertex!"); + graph + .add_vertex(0, "Frodo", [("kind".to_string(), Prop::str("Hobbit"))]) + .expect("Could not add vertex!"); + + let graphs = HashMap::from([("lotr".to_string(), graph)]); + let data = data::Data::from_map(graphs); + let schema = App::create_schema().data(data).finish().unwrap(); + + let query = r#" + { + graph(name: "lotr") { + 
search(query: "kind:wizard", limit: 10, offset: 0) { + name + } + } + } + "#; + let req = Request::new(query); + let res = schema.execute(req).await; + let data = res.data.into_json().unwrap(); + + assert_eq!( + data, + json!({ + "graph": { + "search": [ + { + "name": "Gandalf" + } + ] + } + }), + ); + } #[tokio::test] async fn basic_query() { - let graph = Graph::new(1); - graph.add_vertex(0, 11, &vec![]); + let graph = Graph::new(); + graph + .add_vertex(0, 11, NO_PROPS) + .expect("Could not add vertex!"); + let graphs = HashMap::from([("lotr".to_string(), graph)]); - let data = data::Data { graphs }; + let data = data::Data::from_map(graphs); - #[derive(App)] - struct App(model::QueryRoot); let schema = App::create_schema().data(data).finish().unwrap(); let query = r#" @@ -37,10 +107,7 @@ mod graphql_test { } } "#; - - let root = model::QueryRoot; - let req = dynamic_graphql::Request::new(query).root_value(FieldValue::owned_any(root)); - + let req = Request::new(query); let res = schema.execute(req).await; let data = res.data.into_json().unwrap(); @@ -57,4 +124,359 @@ mod graphql_test { }), ); } + + #[tokio::test] + async fn query_nodefilter() { + let graph = Graph::new(); + if let Err(err) = graph.add_vertex(0, "gandalf", NO_PROPS) { + panic!("Could not add vertex! {:?}", err); + } + if let Err(err) = graph.add_vertex(0, "bilbo", NO_PROPS) { + panic!("Could not add vertex! {:?}", err); + } + if let Err(err) = graph.add_vertex(0, "frodo", NO_PROPS) { + panic!("Could not add vertex! 
{:?}", err); + } + + let graphs = HashMap::from([("lotr".to_string(), graph)]); + let data = Data::from_map(graphs); + + let schema = App::create_schema().data(data).finish().unwrap(); + + let gandalf_query = r#" + { + graph(name: "lotr") { + nodes(filter: { name: { eq: "gandalf" } }) { + name + } + } + } + "#; + + let req = Request::new(gandalf_query); + let res = schema.execute(req).await; + let data = res.data.into_json().unwrap(); + + assert_eq!( + data, + json!({ + "graph": { + "nodes": [ + { + "name": "gandalf" + } + ] + } + }), + ); + + let not_gandalf_query = r#" + { + graph(name: "lotr") { + nodes(filter: { name: { ne: "gandalf" } }) { + name + } + } + } + "#; + + let req = Request::new(not_gandalf_query); + let res = schema.execute(req).await; + let data = res.data.into_json().unwrap(); + + assert_eq!( + data, + json!({ + "graph": { + "nodes": [ + { "name": "bilbo" }, + { "name": "frodo" } + ] + } + }), + ); + } + + #[tokio::test] + async fn query_properties() { + let graph = Graph::new(); + if let Err(err) = graph.add_vertex(0, "gandalf", NO_PROPS) { + panic!("Could not add vertex! {:?}", err); + } + if let Err(err) = graph.add_vertex(0, "bilbo", [("food".to_string(), Prop::str("lots"))]) { + panic!("Could not add vertex! {:?}", err); + } + if let Err(err) = graph.add_vertex(0, "frodo", [("food".to_string(), Prop::str("some"))]) { + panic!("Could not add vertex! 
{:?}", err); + } + + let graphs = HashMap::from([("lotr".to_string(), graph)]); + let data = data::Data::from_map(graphs); + + let schema = App::create_schema().data(data).finish().unwrap(); + + let prop_has_key_filter = r#" + { + graph(name: "lotr") { + nodes(filter: { propertyHas: { + key: "food" + }}) { + name + } + } + } + "#; + + let req = Request::new(prop_has_key_filter); + let res = schema.execute(req).await; + let data = res.data.into_json().unwrap(); + + assert_eq!( + data, + json!({ + "graph": { + "nodes": [ + { "name": "bilbo" }, + { "name": "frodo" }, + ] + } + }), + ); + + let prop_has_value_filter = r#" + { + graph(name: "lotr") { + nodes(filter: { propertyHas: { + valueStr: "lots" + }}) { + name + } + } + } + "#; + + let req = Request::new(prop_has_value_filter); + let res = schema.execute(req).await; + let data = res.data.into_json().unwrap(); + + assert_eq!( + data, + json!({ + "graph": { + "nodes": [ + { "name": "bilbo" }, + ] + } + }), + ); + } + + #[tokio::test] + async fn test_mutation() { + let test_dir = tempdir().unwrap(); + let g0 = Graph::new(); + let test_dir_path = test_dir.path().to_str().unwrap().replace(r#"\"#, r#"\\"#); + let f0 = &test_dir.path().join("g0"); + let f1 = &test_dir.path().join("g1"); + g0.save_to_file(f0).unwrap(); + + let g1 = Graph::new(); + g1.add_vertex(0, 1, NO_PROPS).unwrap(); + + let g2 = Graph::new(); + g2.add_vertex(0, 2, NO_PROPS).unwrap(); + + let data = Data::default(); + let schema = App::create_schema().data(data).finish().unwrap(); + + let list_graphs = r#" + { + subgraphs { + name + } + }"#; + + let list_nodes = |name: &str| { + format!( + r#"{{ + graph(name: "{}") {{ + nodes {{ + id + }} + }} + }}"#, + name + ) + }; + + let load_all = &format!( + r#"mutation {{ + loadGraphsFromPath(path: "{}") + }}"#, + test_dir_path + ); + + let load_new = &format!( + r#"mutation {{ + loadNewGraphsFromPath(path: "{}") + }}"#, + test_dir_path + ); + + // only g0 which is empty + let req = Request::new(load_all); + let 
res = schema.execute(req).await; + let res_json = res.data.into_json().unwrap(); + assert_eq!(res_json, json!({"loadGraphsFromPath": ["g0"]})); + + let req = Request::new(list_graphs); + let res = schema.execute(req).await; + let res_json = res.data.into_json().unwrap(); + assert_eq!(res_json, json!({"subgraphs": [{"name": "g0"}]})); + + let req = Request::new(list_nodes("g0")); + let res = schema.execute(req).await; + let res_json = res.data.into_json().unwrap(); + assert_eq!(res_json, json!({"graph": {"nodes": []}})); + + // add g1 to folder and replace g0 with g2 and load new graphs + g1.save_to_file(f1).unwrap(); + g2.save_to_file(f0).unwrap(); + let req = Request::new(load_new); + let res = schema.execute(req).await; + let res_json = res.data.into_json().unwrap(); + assert_eq!(res_json, json!({"loadNewGraphsFromPath": ["g1"]})); + + // g0 is still empty + let req = Request::new(list_nodes("g0")); + let res = schema.execute(req).await; + let res_json = res.data.into_json().unwrap(); + assert_eq!(res_json, json!({"graph": {"nodes": []}})); + + // g1 has node 1 + let req = Request::new(list_nodes("g1")); + let res = schema.execute(req).await; + let res_json = res.data.into_json().unwrap(); + assert_eq!(res_json, json!({"graph": {"nodes": [{"id": 1}]}})); + + // reload all graphs from folder + let req = Request::new(load_all); + schema.execute(req).await; + + // g0 now has node 2 + let req = Request::new(list_nodes("g0")); + let res = schema.execute(req).await; + let res_json = res.data.into_json().unwrap(); + assert_eq!(res_json, json!({"graph": {"nodes": [{"id": 2}]}})); + + // g1 still has node 1 + let req = Request::new(list_nodes("g1")); + let res = schema.execute(req).await; + let res_json = res.data.into_json().unwrap(); + assert_eq!(res_json, json!({"graph": {"nodes": [{"id": 1}]}})); + } + + #[tokio::test] + async fn test_graph_injection() { + let g = Graph::new(); + g.add_vertex(0, 1, NO_PROPS).unwrap(); + let tmp_file = 
tempfile::NamedTempFile::new().unwrap(); + let path = tmp_file.path(); + g.save_to_file(path).unwrap(); + let file = std::fs::File::open(path).unwrap(); + let upload_val = UploadValue { + filename: "test".into(), + content_type: Some("application/octet-stream".into()), + content: file, + }; + + let data = Data::default(); + let schema = App::create_schema().data(data).finish().unwrap(); + + let query = r##" + mutation($file: Upload!) { + uploadGraph(name: "test", graph: $file) + } + "##; + + let variables = serde_json::json!({ "file": null }); + let mut req = + dynamic_graphql::Request::new(query).variables(Variables::from_json(variables)); + req.set_upload("variables.file", upload_val); + let res = schema.execute(req).await; + println!("{:?}", res); + assert_eq!(res.errors.len(), 0); + let res_json = res.data.into_json().unwrap(); + assert_eq!(res_json, json!({"uploadGraph": "test"})); + + let list_nodes = r#" + query { + graph(name: "test") { + nodes { + id + } + } + } + "#; + + let req = Request::new(list_nodes); + let res = schema.execute(req).await; + assert_eq!(res.errors.len(), 0); + let res_json = res.data.into_json().unwrap(); + assert_eq!(res_json, json!({"graph": {"nodes": [{"id": 1}]}})); + } + + #[tokio::test] + async fn test_graph_send_receive_base64() { + let g = Graph::new(); + g.add_vertex(0, 1, NO_PROPS).unwrap(); + + let graph_str = url_encode_graph(g.clone()).unwrap(); + + let data = Data::default(); + let schema = App::create_schema().data(data).finish().unwrap(); + + let query = r#" + mutation($graph: String!) 
{ + sendGraph(name: "test", graph: $graph) + } + "#; + let req = + Request::new(query).variables(Variables::from_json(json!({ "graph": graph_str }))); + + let res = schema.execute(req).await; + assert_eq!(res.errors.len(), 0); + let res_json = res.data.into_json().unwrap(); + assert_eq!(res_json, json!({"sendGraph": "test"})); + + let list_nodes = r#" + query { + graph(name: "test") { + nodes { + id + } + } + } + "#; + + let req = Request::new(list_nodes); + let res = schema.execute(req).await; + assert_eq!(res.errors.len(), 0); + let res_json = res.data.into_json().unwrap(); + assert_eq!(res_json, json!({"graph": {"nodes": [{"id": 1}]}})); + + let receive_graph = r#" + query { + receiveGraph(name: "test") + } + "#; + + let req = Request::new(receive_graph); + let res = schema.execute(req).await; + assert_eq!(res.errors.len(), 0); + let res_json = res.data.into_json().unwrap(); + let graph_encoded = res_json.get("receiveGraph").unwrap().as_str().unwrap(); + let graph_roundtrip = url_decode_graph(graph_encoded).unwrap().into_dynamic(); + assert_eq!(g, graph_roundtrip); + } } diff --git a/raphtory-graphql/src/main.rs b/raphtory-graphql/src/main.rs index 40ec59c0cb..c03084bac5 100644 --- a/raphtory-graphql/src/main.rs +++ b/raphtory-graphql/src/main.rs @@ -1,16 +1,52 @@ use crate::server::RaphtoryServer; +use clap::Parser; use dotenv::dotenv; use std::env; mod data; +mod embeddings; mod model; mod observability; mod routes; mod server; +#[derive(Parser, Debug)] +struct Args { + /// graphs to vectorize for similarity search + #[arg(short, long, num_args = 0.., value_delimiter = ' ')] + vectorize: Vec, + + /// directory to use to store the embbeding cache + // parenthesis are actually necessary or this does not compile! 
+ #[arg(short, long, default_value_t = ("".to_string()))] + cache: String, +} + #[tokio::main] async fn main() { + let args = Args::parse(); + + let graphs_to_vectorize = args.vectorize; + let cache_dir = args.cache; + // let graphs_to_vectorize = vec!["jira".to_owned()]; + // let cache_dir = "/tmp/jira-cache-gte-small-batching"; + assert!( + graphs_to_vectorize.is_empty() || !cache_dir.is_empty(), + "Setting up a cache directory is mandatory if some graphs need to be vectorized" + ); + dotenv().ok(); let graph_directory = env::var("GRAPH_DIRECTORY").unwrap_or("/tmp/graphs".to_string()); - RaphtoryServer::new(&graph_directory).run().await.unwrap() + RaphtoryServer::from_directory(&graph_directory) + // .with_vectorized( + // graphs_to_vectorize, + // embeddings::openai_embedding, + // &PathBuf::from(cache_dir), + // None, + // ) + // .await // FIXME: re-enable, probably have two separate methods: with_vectorized, with_templates + // FIXME: maybe we should vectorize the graphs only when run() is called + .run() + .await + .unwrap() } diff --git a/raphtory-graphql/src/model/algorithm.rs b/raphtory-graphql/src/model/algorithm.rs index 5f00f368d4..de1cf2a2af 100644 --- a/raphtory-graphql/src/model/algorithm.rs +++ b/raphtory-graphql/src/model/algorithm.rs @@ -1,16 +1,18 @@ -use crate::model::DynamicGraph; -use async_graphql::dynamic::{ - Field, FieldFuture, FieldValue, InputValue, Object, ResolverContext, TypeRef, +use async_graphql::{ + dynamic::{Field, FieldFuture, FieldValue, InputValue, Object, ResolverContext, TypeRef}, + Context, FieldResult, +}; +use dynamic_graphql::{ + internal::{OutputTypeName, Register, Registry, ResolveOwned, TypeName}, + SimpleObject, }; -use async_graphql::{Context, FieldResult}; -use dynamic_graphql::internal::{OutputTypeName, Register, Registry, ResolveOwned, TypeName}; -use dynamic_graphql::SimpleObject; use once_cell::sync::Lazy; -use raphtory::algorithms::pagerank::unweighted_page_rank; -use raphtory::db::view_api::GraphViewOps; -use 
std::borrow::Cow; -use std::collections::HashMap; -use std::sync::Mutex; +use ordered_float::OrderedFloat; +use raphtory::{ + algorithms::pagerank::unweighted_page_rank, + db::api::view::{internal::DynamicGraph, GraphViewOps}, +}; +use std::{borrow::Cow, collections::HashMap, sync::Mutex}; type RegisterFunction = fn(&str, Registry, Object) -> (Registry, Object); @@ -94,6 +96,22 @@ impl From<(String, f64)> for Pagerank { } } +impl From<(String, OrderedFloat)> for Pagerank { + fn from((name, rank): (String, OrderedFloat)) -> Self { + let rank = rank.into_inner(); + Self { name, rank } + } +} + +impl From<(&String, &OrderedFloat)> for Pagerank { + fn from((name, rank): (&String, &OrderedFloat)) -> Self { + Self { + name: name.to_string(), + rank: rank.into_inner(), + } + } +} + impl Algorithm for Pagerank { fn output_type() -> TypeRef { // first _nn means that the list is never null, second _nn means no element is null @@ -114,7 +132,8 @@ impl Algorithm for Pagerank { let threads = ctx.args.get("threads").map(|v| v.u64()).transpose()?; let threads = threads.map(|v| v as usize); let tol = ctx.args.get("tol").map(|v| v.f64()).transpose()?; - let result = unweighted_page_rank(graph, iter_count, threads, tol, true) + let binding = unweighted_page_rank(graph, iter_count, threads, tol, true); + let result = binding .into_iter() .map(|pair| FieldValue::owned_any(Pagerank::from(pair))); Ok(Some(FieldValue::list(result))) diff --git a/raphtory-graphql/src/model/filters/edge_filter.rs b/raphtory-graphql/src/model/filters/edge_filter.rs new file mode 100644 index 0000000000..0ef6dfda89 --- /dev/null +++ b/raphtory-graphql/src/model/filters/edge_filter.rs @@ -0,0 +1,57 @@ +use crate::model::{ + filters::{ + primitive_filter::{StringFilter, StringVecFilter}, + property_filter::PropertyHasFilter, + }, + graph::edge::Edge, +}; +use dynamic_graphql::InputObject; +use raphtory::db::api::view::{EdgeViewOps, VertexViewOps}; + +#[derive(InputObject, Clone)] +pub struct EdgeFilter { + 
node_names: Option, + src: Option, + dst: Option, + property_has: Option, + pub(crate) layer_names: Option, +} + +impl EdgeFilter { + pub(crate) fn matches(&self, edge: &Edge) -> bool { + if let Some(names_filter) = &self.node_names { + let src = edge.ee.src().name(); + let dst = edge.ee.dst().name(); + if !names_filter.contains(&src) || !names_filter.contains(&dst) { + return false; + } + } + + if let Some(name_filter) = &self.src { + if !name_filter.matches(&edge.ee.src().name()) { + return false; + } + } + + if let Some(name_filter) = &self.dst { + if !name_filter.matches(&edge.ee.dst().name()) { + return false; + } + } + + if let Some(name_filter) = &self.layer_names { + return edge + .ee + .layer_names() + .any(|name| name_filter.contains(&name)); + } + + if let Some(property_has_filter) = &self.property_has { + if !property_has_filter.matches_edge_properties(&edge) { + return false; + } + } + + true + } +} diff --git a/raphtory-graphql/src/model/filters/mod.rs b/raphtory-graphql/src/model/filters/mod.rs new file mode 100644 index 0000000000..a3b093b581 --- /dev/null +++ b/raphtory-graphql/src/model/filters/mod.rs @@ -0,0 +1,4 @@ +pub(crate) mod edge_filter; +pub(crate) mod node_filter; +pub(crate) mod primitive_filter; +pub(crate) mod property_filter; diff --git a/raphtory-graphql/src/model/filters/node_filter.rs b/raphtory-graphql/src/model/filters/node_filter.rs new file mode 100644 index 0000000000..fa1b50fbe9 --- /dev/null +++ b/raphtory-graphql/src/model/filters/node_filter.rs @@ -0,0 +1,78 @@ +use crate::model::{ + filters::{ + primitive_filter::{NumberFilter, StringFilter, StringVecFilter}, + property_filter::PropertyHasFilter, + }, + graph::node::Node, +}; +use dynamic_graphql::InputObject; +use raphtory::db::api::view::VertexViewOps; + +#[derive(InputObject)] +pub struct NodeFilter { + names: Option, + name: Option, + node_type: Option, + in_degree: Option, + out_degree: Option, + property_has: Option, +} + +impl NodeFilter { + pub(crate) fn 
new(names: Vec) -> NodeFilter { + return NodeFilter { + names: Some(StringVecFilter { contains: names }), + name: None, + node_type: None, + in_degree: None, + out_degree: None, + property_has: None, + }; + } + + pub(crate) fn matches(&self, node: &Node) -> bool { + if let Some(names_filter) = &self.names { + if !names_filter.contains(&node.vv.name()) { + return false; + } + } + + if let Some(name_filter) = &self.name { + if !name_filter.matches(&node.vv.name()) { + return false; + } + } + + if let Some(type_filter) = &self.node_type { + let node_type = node + .vv + .properties() + .get("type") + .map(|v| v.to_string()) + .unwrap_or("NONE".to_string()); + if !type_filter.matches(&node_type) { + return false; + } + } + + if let Some(in_degree_filter) = &self.in_degree { + if !in_degree_filter.matches(node.vv.in_degree()) { + return false; + } + } + + if let Some(out_degree_filter) = &self.out_degree { + if !out_degree_filter.matches(node.vv.out_degree()) { + return false; + } + } + + if let Some(property_has_filter) = &self.property_has { + if !property_has_filter.matches_node_properties(&node) { + return false; + } + } + + true + } +} diff --git a/raphtory-graphql/src/model/filters/primitive_filter.rs b/raphtory-graphql/src/model/filters/primitive_filter.rs new file mode 100644 index 0000000000..8262bf9448 --- /dev/null +++ b/raphtory-graphql/src/model/filters/primitive_filter.rs @@ -0,0 +1,79 @@ +use dynamic_graphql::InputObject; + +#[derive(InputObject, Clone)] +pub(crate) struct StringVecFilter { + pub(crate) contains: Vec, +} + +impl StringVecFilter { + pub(crate) fn contains(&self, value: &str) -> bool { + self.contains.contains(&value.to_string()) + } +} + +#[derive(InputObject, Clone)] +pub(crate) struct StringFilter { + pub(crate) eq: Option, + pub(crate) ne: Option, +} + +impl StringFilter { + pub(crate) fn matches(&self, value: &str) -> bool { + if !self.eq.as_ref().map_or(true, |eq| value == eq) { + return false; + } + self.ne.as_ref().map_or(true, |ne| 
value != ne) + } +} + +#[derive(InputObject, Clone)] +pub(crate) struct NumberFilter { + gt: Option, + lt: Option, + eq: Option, + ne: Option, + gte: Option, + lte: Option, +} + +impl NumberFilter { + pub(crate) fn matches(&self, value: usize) -> bool { + if let Some(gt) = self.gt { + if value <= gt { + return false; + } + } + + if let Some(lt) = self.lt { + if value >= lt { + return false; + } + } + + if let Some(eq) = self.eq { + if value != eq { + return false; + } + } + + if let Some(ne) = self.ne { + if value == ne { + return false; + } + } + + if let Some(gte) = self.gte { + if value < gte { + return false; + } + } + + if let Some(lte) = self.lte { + if value > lte { + return false; + } + } + + true + } +} diff --git a/raphtory-graphql/src/model/filters/property_filter.rs b/raphtory-graphql/src/model/filters/property_filter.rs new file mode 100644 index 0000000000..0547661fa7 --- /dev/null +++ b/raphtory-graphql/src/model/filters/property_filter.rs @@ -0,0 +1,116 @@ +use crate::model::{ + filters::primitive_filter::NumberFilter, + graph::{edge::Edge, node::Node}, +}; +use dynamic_graphql::InputObject; +use raphtory::{core::Prop, db::api::view::VertexViewOps, prelude::EdgeViewOps}; + +#[derive(InputObject, Clone)] +pub(crate) struct PropertyHasFilter { + key: Option, + value_str: Option, + value_num: Option, +} + +impl PropertyHasFilter { + pub(crate) fn matches_node_properties(&self, node: &Node) -> bool { + let valid_prop = |prop| valid_prop(prop, &self.value_str, &self.value_num); + + return match &self.key { + Some(key) => { + if let Some(prop) = node.vv.properties().get(key) { + valid_prop(prop) + } else { + false + } + } + None => node.vv.properties().values().any(valid_prop), + }; + } + + pub(crate) fn matches_edge_properties(&self, edge: &Edge) -> bool { + let valid_prop = |prop| valid_prop(prop, &self.value_str, &self.value_num); + + return match &self.key { + Some(key) => { + if let Some(prop) = EdgeViewOps::properties(&edge.ee).get(key) { + 
valid_prop(prop) + } else { + false + } + } + None => EdgeViewOps::properties(&edge.ee).values().any(valid_prop), + }; + } +} + +fn valid_prop(prop: Prop, value_str: &Option, num_filter: &Option) -> bool { + if let Some(value_str) = value_str { + if value_neq_str_prop(value_str, &prop) { + return false; + } + } + + if let Some(num_filter) = num_filter { + if value_neq_num_prop(num_filter, &prop) { + return false; + } + } + + true +} + +fn value_neq_str_prop(value: &str, prop: &Prop) -> bool { + if let Prop::Str(prop_str) = prop { + return prop_str != value; + } + + false +} + +fn value_neq_num_prop(num_filter: &NumberFilter, prop: &Prop) -> bool { + match prop { + Prop::I32(i32_prop) => match_signed_num(num_filter, i64::from(*i32_prop)), + Prop::I64(i64_prop) => match_signed_num(num_filter, *i64_prop), + Prop::U8(u8_prop) => match_unsigned_num(num_filter, u64::from(*u8_prop)), + Prop::U16(u16_prop) => match_unsigned_num(num_filter, u64::from(*u16_prop)), + Prop::U32(u32_prop) => match_unsigned_num(num_filter, u64::from(*u32_prop)), + Prop::U64(u64_prop) => match_unsigned_num(num_filter, *u64_prop), + Prop::F32(f32_prop) => match_float(num_filter, f64::from(*f32_prop)), + Prop::F64(f64_prop) => match_float(num_filter, *f64_prop), + _ => false, + } +} + +fn match_signed_num(num_filter: &NumberFilter, signed_num: i64) -> bool { + if signed_num < 0 { + return false; + } + + let as_usize = signed_num as usize; + + if !num_filter.matches(as_usize) { + return true; + } + false +} + +fn match_unsigned_num(num_filter: &NumberFilter, unsigned_num: u64) -> bool { + let as_usize = unsigned_num as usize; + if !num_filter.matches(as_usize) { + return true; + } + false +} + +fn match_float(num_filter: &NumberFilter, float_num: f64) -> bool { + if float_num < 0.0 { + return false; + } + let rounded = float_num.round(); + let as_usize = rounded as usize; + if !num_filter.matches(as_usize) { + return true; + } + false +} diff --git a/raphtory-graphql/src/model/graph/edge.rs 
b/raphtory-graphql/src/model/graph/edge.rs new file mode 100644 index 0000000000..b1542880e3 --- /dev/null +++ b/raphtory-graphql/src/model/graph/edge.rs @@ -0,0 +1,57 @@ +use crate::model::graph::node::Node; +use dynamic_graphql::{ResolvedObject, ResolvedObjectFields}; +use itertools::Itertools; +use raphtory::db::{ + api::view::{ + internal::{DynamicGraph, IntoDynamic}, + EdgeViewOps, GraphViewOps, + }, + graph::edge::EdgeView, +}; + +#[derive(ResolvedObject)] +pub(crate) struct Edge { + pub(crate) ee: EdgeView, +} + +impl From> for Edge { + fn from(value: EdgeView) -> Self { + Self { + ee: EdgeView { + graph: value.graph.clone().into_dynamic(), + edge: value.edge, + }, + } + } +} + +#[ResolvedObjectFields] +impl Edge { + async fn earliest_time(&self) -> Option { + self.ee.earliest_time() + } + + async fn latest_time(&self) -> Option { + self.ee.latest_time() + } + + async fn src(&self) -> Node { + self.ee.src().into() + } + + async fn dst(&self) -> Node { + self.ee.dst().into() + } + + async fn property(&self, name: &str) -> Option { + self.ee.properties().get(name).map(|prop| prop.to_string()) + } + + async fn layers(&self) -> Vec { + self.ee.layer_names().map_into().collect() + } + + async fn history(&self) -> Vec { + self.ee.history() + } +} diff --git a/raphtory-graphql/src/model/graph/graph.rs b/raphtory-graphql/src/model/graph/graph.rs new file mode 100644 index 0000000000..7dcc19ddb3 --- /dev/null +++ b/raphtory-graphql/src/model/graph/graph.rs @@ -0,0 +1,222 @@ +use std::{ + collections::{HashMap, HashSet}, + ops::Deref, +}; + +use crate::model::{ + algorithm::Algorithms, + filters::{edge_filter::EdgeFilter, node_filter::NodeFilter}, + graph::{edge::Edge, get_expanded_edges, node::Node, property::Property}, + schema::graph_schema::GraphSchema, +}; +use dynamic_graphql::{ResolvedObject, ResolvedObjectFields}; +use itertools::Itertools; +use raphtory::{ + db::{ + api::view::{ + internal::{DynamicGraph, IntoDynamic}, + GraphViewOps, TimeOps, VertexViewOps, 
+ }, + graph::edge::EdgeView, + }, + prelude::EdgeViewOps, + search::IndexedGraph, +}; + +#[derive(ResolvedObject)] +pub(crate) struct GraphMeta { + name: String, + graph: DynamicGraph, +} + +impl GraphMeta { + pub fn new(name: String, graph: DynamicGraph) -> Self { + Self { name, graph } + } +} + +#[ResolvedObjectFields] +impl GraphMeta { + async fn name(&self) -> String { + self.name.clone() + } + + async fn static_properties(&self) -> Vec { + self.graph + .properties() + .constant() + .into_iter() + .map(|(k, v)| Property::new(k.into(), v)) + .collect() + } + + async fn node_names(&self) -> Vec { + self.graph + .vertices() + .into_iter() + .map(|v| v.name()) + .collect_vec() + } +} + +#[derive(ResolvedObject)] +pub(crate) struct GqlGraph { + graph: IndexedGraph, +} + +impl From> for GqlGraph { + fn from(value: IndexedGraph) -> Self { + Self { + graph: value.into_dynamic_indexed(), + } + } +} + +impl GqlGraph { + pub(crate) fn new(graph: IndexedGraph) -> Self { + Self { graph } + } +} + +#[ResolvedObjectFields] +impl GqlGraph { + /// Return a graph containing only the activity between `start` and `end` measured as milliseconds from epoch + async fn window(&self, start: i64, end: i64) -> GqlGraph { + let w = self.graph.window(start, end); + w.into_dynamic_indexed().into() + } + + async fn layer_names(&self) -> Vec { + self.graph.unique_layers().map_into().collect() + } + + async fn static_properties(&self) -> Vec { + self.graph + .properties() + .constant() + .into_iter() + .map(|(k, v)| Property::new(k.into(), v)) + .collect() + } + + async fn nodes(&self, filter: Option) -> Vec { + match filter { + Some(filter) => self + .graph + .vertices() + .iter() + .map(|vv| vv.into()) + .filter(|n| filter.matches(n)) + .collect(), + None => self.graph.vertices().iter().map(|vv| vv.into()).collect(), + } + } + + /// Returns the schema of this graph + async fn schema(&self) -> GraphSchema { + GraphSchema::new(&self.graph) + } + + async fn search(&self, query: String, limit: 
usize, offset: usize) -> Vec { + self.graph + .search(&query, limit, offset) + .into_iter() + .flat_map(|vv| vv) + .map(|vv| vv.into()) + .collect() + } + + async fn search_edges(&self, query: String, limit: usize, offset: usize) -> Vec { + self.graph + .search_edges(&query, limit, offset) + .into_iter() + .flat_map(|vv| vv) + .map(|vv| vv.into()) + .collect() + } + + async fn edges<'a>(&self, filter: Option) -> Vec { + match filter { + Some(filter) => self + .graph + .edges() + .into_iter() + .map(|ev| ev.into()) + .filter(|ev| filter.matches(ev)) + .collect(), + None => self.graph.edges().into_iter().map(|ev| ev.into()).collect(), + } + } + + async fn expanded_edges( + &self, + nodes_to_expand: Vec, + graph_nodes: Vec, + filter: Option, + ) -> Vec { + if nodes_to_expand.is_empty() { + return vec![]; + } + + let nodes: Vec = self + .graph + .vertices() + .iter() + .map(|vv| vv.into()) + .filter(|n| NodeFilter::new(nodes_to_expand.clone()).matches(n)) + .collect(); + + let mut all_graph_nodes: HashSet = graph_nodes.into_iter().collect(); + let mut all_expanded_edges: HashMap> = HashMap::new(); + + let mut maybe_layers: Option> = None; + if filter.is_some() { + maybe_layers = filter.clone().unwrap().layer_names.map(|l| l.contains); + } + + for node in nodes { + let expanded_edges = + get_expanded_edges(all_graph_nodes.clone(), node.vv, maybe_layers.clone()); + expanded_edges.clone().into_iter().for_each(|e| { + let src = e.src().name(); + let dst = e.dst().name(); + all_expanded_edges.insert(src.to_owned() + &dst, e); + all_graph_nodes.insert(src); + all_graph_nodes.insert(dst); + }); + } + + let fetched_edges = all_expanded_edges + .values() + .map(|ee| ee.clone().into()) + .collect_vec(); + + match filter { + Some(filter) => fetched_edges + .into_iter() + .filter(|ev| filter.matches(ev)) + .collect(), + None => fetched_edges, + } + } + + async fn node(&self, name: String) -> Option { + self.graph + .vertices() + .iter() + .find(|vv| &vv.name() == &name) + 
.map(|vv| vv.into()) + } + + async fn node_id(&self, id: u64) -> Option { + self.graph + .vertices() + .iter() + .find(|vv| vv.id() == id) + .map(|vv| vv.into()) + } + + async fn algorithms(&self) -> Algorithms { + self.graph.deref().clone().into() + } +} diff --git a/raphtory-graphql/src/model/graph/mod.rs b/raphtory-graphql/src/model/graph/mod.rs new file mode 100644 index 0000000000..d192304832 --- /dev/null +++ b/raphtory-graphql/src/model/graph/mod.rs @@ -0,0 +1,101 @@ +use itertools::Itertools; +use raphtory::{ + core::ArcStr, + db::{ + api::view::internal::DynamicGraph, + graph::{edge::EdgeView, vertex::VertexView}, + }, + prelude::{EdgeViewOps, VertexViewOps}, +}; +use std::collections::HashSet; + +pub(crate) mod edge; +pub(crate) mod graph; +pub(crate) mod node; +pub(crate) mod property; +pub(crate) mod property_update; + +fn get_expanded_edges( + graph_nodes: HashSet, + vv: VertexView, + maybe_layers: Option>, +) -> Vec> { + let node_found_in_graph_nodes = + |node_name: String| -> bool { graph_nodes.iter().contains(&node_name) }; + + let fetched_edges = vv.clone().edges().into_iter().map(|ee| ee.clone()); + + let mut filtered_fetched_edges = match maybe_layers { + Some(layers) => { + let layer_set: HashSet = layers.into_iter().map_into().collect(); + fetched_edges + .filter(|e| { + e.layer_names() + .into_iter() + .any(|name| layer_set.contains(&name)) + }) + .collect_vec() + } + None => fetched_edges.collect_vec(), + }; + + let first_hop_edges = filtered_fetched_edges + .clone() + .into_iter() + .filter(|e| { + !node_found_in_graph_nodes((*e).src().name()) + || !node_found_in_graph_nodes((*e).dst().name()) + }) + .collect_vec(); + + let mut first_hop_nodes: HashSet = HashSet::new(); + first_hop_edges.clone().into_iter().for_each(|e| { + first_hop_nodes.insert(e.src().name()); + first_hop_nodes.insert(e.dst().name()); + }); + + let first_hop_nodes = first_hop_nodes + .into_iter() + .filter(|e| e != &vv.name()) + .collect_vec(); + + let 
node_found_in_first_hop_nodes = + |node_name: String| -> bool { first_hop_nodes.contains(&node_name) }; + + let mut first_hop_node_edges: Vec> = vec![]; + + first_hop_edges.into_iter().for_each(|e| { + if node_found_in_graph_nodes(e.src().name()) { + // Return only those edges whose either src or dst already exist + let mut r = e + .dst() + .edges() + .filter(|e| { + (node_found_in_first_hop_nodes(e.src().name()) + && node_found_in_first_hop_nodes(e.dst().name())) + || node_found_in_graph_nodes(e.src().name()) + || node_found_in_graph_nodes(e.dst().name()) + }) + .collect_vec(); + + first_hop_node_edges.append(&mut r); + } else { + let mut r = e + .src() + .edges() + .filter(|e| { + (node_found_in_first_hop_nodes(e.src().name()) + && node_found_in_first_hop_nodes(e.dst().name())) + || node_found_in_graph_nodes(e.src().name()) + || node_found_in_graph_nodes(e.dst().name()) + }) + .collect_vec(); + + first_hop_node_edges.append(&mut r); + } + }); + + filtered_fetched_edges.append(&mut first_hop_node_edges); + + filtered_fetched_edges +} diff --git a/raphtory-graphql/src/model/graph/node.rs b/raphtory-graphql/src/model/graph/node.rs new file mode 100644 index 0000000000..739d5a1101 --- /dev/null +++ b/raphtory-graphql/src/model/graph/node.rs @@ -0,0 +1,265 @@ +use crate::model::{ + filters::edge_filter::EdgeFilter, + graph::{edge::Edge, get_expanded_edges, property::Property, property_update::PropertyUpdate}, +}; +use dynamic_graphql::{ResolvedObject, ResolvedObjectFields}; +use itertools::Itertools; +use raphtory::db::{ + api::view::{ + internal::{DynamicGraph, IntoDynamic}, + *, + }, + graph::vertex::VertexView, +}; +use std::collections::HashSet; + +use super::property_update::PropertyUpdateGroup; + +#[derive(ResolvedObject)] +pub(crate) struct Node { + pub(crate) vv: VertexView, +} + +impl From> for Node { + fn from(value: VertexView) -> Self { + Self { + vv: VertexView { + graph: value.graph.clone().into_dynamic(), + vertex: value.vertex, + }, + } + } +} + 
+#[ResolvedObjectFields] +impl Node { + async fn id(&self) -> u64 { + self.vv.id() + } + + pub async fn name(&self) -> String { + self.vv.name() + } + + pub async fn node_type(&self) -> String { + self.vv + .properties() + .get("type") + .map(|p| p.to_string()) + .unwrap_or("NONE".to_string()) + } + + /// Returns all the property names this node has a value for + async fn property_names(&self) -> Vec { + self.vv.properties().keys().map_into().collect() + } + + /// Returns all the properties of the node + async fn properties(&self) -> Option> { + Some( + self.vv + .properties() + .iter() + .map(|(k, v)| Property::new(k.into(), v)) + .collect(), + ) + } + + /// Returns the value for the property with name `name` + async fn property(&self, name: &str) -> Option { + self.vv.properties().get(name).map(|v| v.to_string()) + } + + /// Returns the history as a vector of updates for the property with name `name` + async fn property_history(&self, name: String) -> Vec { + self.vv + .properties() + .temporal() + .get(&name) + .into_iter() + .flat_map(|p| { + p.iter() + .map(|(time, prop)| PropertyUpdate::new(time, prop.to_string())) + }) + .collect() + } + + /// Returns the history as a vectory of updates for any properties which are included in param names + async fn properties_history(&self, names: Vec) -> Vec { + names + .iter() + .filter_map(|name| match self.vv.properties().temporal().get(name) { + Some(prop) => Option::Some(PropertyUpdateGroup::new( + name.to_string(), + prop.iter() + .map(|(time, prop)| PropertyUpdate::new(time, prop.to_string())) + .collect_vec(), + )), + None => None, + }) + .collect_vec() + } + + async fn in_neighbours<'a>(&self, layer: Option) -> Vec { + match layer.as_deref() { + None => self.vv.in_neighbours().iter().map(|vv| vv.into()).collect(), + Some(layer) => match self.vv.layer(layer) { + None => { + vec![] + } + Some(vvv) => vvv.in_neighbours().iter().map(|vv| vv.into()).collect(), + }, + } + } + + async fn out_neighbours(&self, layer: 
Option) -> Vec { + match layer.as_deref() { + None => self + .vv + .out_neighbours() + .iter() + .map(|vv| vv.into()) + .collect(), + Some(layer) => match self.vv.layer(layer) { + None => { + vec![] + } + Some(vvv) => vvv.out_neighbours().iter().map(|vv| vv.into()).collect(), + }, + } + } + + async fn neighbours<'a>(&self, layer: Option) -> Vec { + match layer.as_deref() { + None => self.vv.neighbours().iter().map(|vv| vv.into()).collect(), + Some(layer) => match self.vv.layer(layer) { + None => { + vec![] + } + Some(vvv) => vvv.neighbours().iter().map(|vv| vv.into()).collect(), + }, + } + } + + /// Returns the number of edges connected to this node + async fn degree(&self, layers: Option>) -> usize { + match layers { + None => self.vv.degree(), + Some(layers) => layers + .iter() + .map(|layer| { + let degree = match self.vv.layer(layer) { + None => 0, + Some(vvv) => vvv.degree(), + }; + degree + }) + .sum(), + } + } + + /// Returns the number edges with this node as the source + async fn out_degree(&self, layer: Option) -> usize { + match layer.as_deref() { + None => self.vv.out_degree(), + Some(layer) => match self.vv.layer(layer) { + None => 0, + Some(vvv) => vvv.out_degree(), + }, + } + } + + /// Returns the number edges with this node as the destination + async fn in_degree(&self, layer: Option) -> usize { + match layer.as_deref() { + None => self.vv.in_degree(), + Some(layer) => match self.vv.layer(layer) { + None => 0, + Some(vvv) => vvv.in_degree(), + }, + } + } + + async fn out_edges(&self, layer: Option) -> Vec { + match layer.as_deref() { + None => self.vv.out_edges().map(|ee| ee.into()).collect(), + Some(layer) => match self.vv.layer(layer) { + None => { + vec![] + } + Some(vvv) => vvv.out_edges().map(|ee| ee.into()).collect(), + }, + } + } + + async fn in_edges(&self, layer: Option) -> Vec { + match layer.as_deref() { + None => self.vv.in_edges().map(|ee| ee.into()).collect(), + Some(layer) => match self.vv.layer(layer) { + None => { + vec![] + } + 
Some(vvv) => vvv.in_edges().map(|ee| ee.into()).collect(), + }, + } + } + + async fn edges(&self, filter: Option) -> Vec { + match filter { + Some(filter) => self + .vv + .edges() + .map(|ev| ev.into()) + .filter(|ev| filter.matches(ev)) + .collect(), + None => self.vv.edges().map(|ee| ee.into()).collect(), + } + } + + async fn expanded_edges( + &self, + graph_nodes: Vec, + filter: Option, + ) -> Vec { + let all_graph_nodes: HashSet = graph_nodes.into_iter().collect(); + + match filter { + Some(edge_filter) => { + let maybe_layers = edge_filter.clone().layer_names.map(|l| l.contains); + let fetched_edges = + get_expanded_edges(all_graph_nodes, self.vv.clone(), maybe_layers) + .iter() + .map(|ee| ee.clone().into()) + .collect_vec(); + fetched_edges + .into_iter() + .filter(|ev| edge_filter.matches(ev)) + .collect() + } + None => get_expanded_edges(all_graph_nodes, self.vv.clone(), None) + .iter() + .map(|ee| ee.clone().into()) + .collect_vec(), + } + } + + async fn exploded_in_edges(&self) -> Vec { + self.vv.in_edges().explode().map(|ee| ee.into()).collect() + } + + async fn exploded_out_edges(&self) -> Vec { + self.vv.out_edges().explode().map(|ee| ee.into()).collect() + } + + async fn exploded_edges(&self) -> Vec { + self.vv.edges().explode().map(|ee| ee.into()).collect() + } + + async fn start_date(&self) -> Option { + self.vv.earliest_time() + } + + async fn end_date(&self) -> Option { + self.vv.latest_time() + } +} diff --git a/raphtory-graphql/src/model/graph/property.rs b/raphtory-graphql/src/model/graph/property.rs new file mode 100644 index 0000000000..f69e2eba19 --- /dev/null +++ b/raphtory-graphql/src/model/graph/property.rs @@ -0,0 +1,25 @@ +use dynamic_graphql::{ResolvedObject, ResolvedObjectFields}; +use raphtory::core::Prop; + +#[derive(ResolvedObject)] +pub(crate) struct Property { + key: String, + value: Prop, +} + +impl Property { + pub(crate) fn new(key: String, value: Prop) -> Self { + Self { key, value } + } +} + +#[ResolvedObjectFields] +impl 
Property { + async fn key(&self) -> String { + self.key.to_string() + } + + async fn value(&self) -> String { + self.value.to_string() + } +} diff --git a/raphtory-graphql/src/model/graph/property_update.rs b/raphtory-graphql/src/model/graph/property_update.rs new file mode 100644 index 0000000000..3a7dddd1e7 --- /dev/null +++ b/raphtory-graphql/src/model/graph/property_update.rs @@ -0,0 +1,30 @@ +use dynamic_graphql::SimpleObject; + +/// A single property at a given `time` with a given `value` +#[derive(SimpleObject)] +pub(crate) struct PropertyUpdate { + pub(crate) time: i64, + pub(crate) value: String, +} + +// A collection of `PropertyUpdate`s under their `propertyName` +#[derive(SimpleObject)] +pub(crate) struct PropertyUpdateGroup { + pub(crate) property_name: String, + pub(crate) property_updates: Vec, +} + +impl PropertyUpdate { + pub fn new(time: i64, value: String) -> Self { + Self { time, value } + } +} + +impl PropertyUpdateGroup { + pub fn new(property_name: String, property_updates: Vec) -> Self { + Self { + property_name, + property_updates, + } + } +} diff --git a/raphtory-graphql/src/model/mod.rs b/raphtory-graphql/src/model/mod.rs index d87e0bc979..4e2215bfff 100644 --- a/raphtory-graphql/src/model/mod.rs +++ b/raphtory-graphql/src/model/mod.rs @@ -1,19 +1,45 @@ -use crate::data::Data; +use crate::{ + data::Data, + model::graph::graph::{GqlGraph, GraphMeta}, +}; use async_graphql::Context; -use dynamic_graphql::{ResolvedObject, ResolvedObjectFields}; +use base64::{engine::general_purpose::URL_SAFE_NO_PAD, Engine}; +use chrono::Utc; +use dynamic_graphql::{ + App, Mutation, MutationFields, MutationRoot, ResolvedObject, ResolvedObjectFields, Result, + Upload, +}; use itertools::Itertools; -use raphtory::core::Prop; -use raphtory::db::edge::EdgeView; -use raphtory::db::vertex::VertexView; -use raphtory::db::view_api::internal::{GraphViewInternalOps, WrappedGraph}; -use raphtory::db::view_api::EdgeListOps; -use raphtory::db::view_api::EdgeViewOps; -use 
raphtory::db::view_api::{GraphViewOps, TimeOps, VertexViewOps}; -use std::sync::Arc; - -use crate::model::algorithm::Algorithms; +use raphtory::{ + core::{ArcStr, Prop}, + db::api::view::internal::{IntoDynamic, MaterializedGraph}, + prelude::{Graph, GraphViewOps, PropertyAdditionOps, VertexViewOps}, + search::IndexedGraph, +}; +use std::{ + collections::HashMap, + error::Error, + fmt::{Display, Formatter}, + io::BufReader, + ops::Deref, +}; +use uuid::Uuid; pub(crate) mod algorithm; +pub(crate) mod filters; +pub(crate) mod graph; +pub(crate) mod schema; + +#[derive(Debug)] +pub struct MissingGraph; + +impl Display for MissingGraph { + fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result { + write!(f, "Graph does not exist") + } +} + +impl Error for MissingGraph {} #[derive(ResolvedObject)] #[graphql(root)] @@ -25,219 +51,325 @@ impl QueryRoot { "Hello world from raphtory-graphql" } - /// Returns a view including all events between `t_start` (inclusive) and `t_end` (exclusive) + /// Returns a graph async fn graph<'a>(ctx: &Context<'a>, name: &str) -> Option { let data = ctx.data_unchecked::(); - let g = data.graphs.get(name)?; - Some(g.clone().into()) + let g = data.graphs.read().get(name).cloned()?; + Some(GqlGraph::new(g.into_dynamic_indexed())) } -} -#[derive(Clone)] -pub struct DynamicGraph(Arc); - -impl WrappedGraph for DynamicGraph { - type Internal = dyn GraphViewInternalOps + Send + Sync + 'static; - fn as_graph(&self) -> &(dyn GraphViewInternalOps + Send + Sync + 'static) { - &*self.0 - } -} - -#[derive(ResolvedObject)] -pub(crate) struct GqlGraph { - graph: DynamicGraph, -} - -impl From for GqlGraph { - fn from(value: G) -> Self { - let graph = DynamicGraph(Arc::new(value)); - Self { graph } - } -} - -#[ResolvedObjectFields] -impl GqlGraph { - async fn window(&self, t_start: i64, t_end: i64) -> GqlGraph { - let w = self.graph.window(t_start, t_end); - w.into() - } - - async fn nodes(&self) -> Vec { - self.graph.vertices().iter().map(|vv| 
vv.into()).collect() - } - - async fn edges<'a>(&self) -> Vec { - self.graph.edges().into_iter().map(|ev| ev.into()).collect() - } - - async fn node(&self, name: String) -> Option { - self.graph - .vertices() - .iter() - .find(|vv| &vv.name() == &name) - .map(|vv| vv.into()) + async fn subgraph<'a>(ctx: &Context<'a>, name: &str) -> Option { + let data = ctx.data_unchecked::(); + let g = data.graphs.read().get(name).cloned()?; + Some(GraphMeta::new( + name.to_string(), + g.deref().clone().into_dynamic(), + )) } - async fn node_id(&self, id: u64) -> Option { - self.graph - .vertices() + async fn subgraphs<'a>(ctx: &Context<'a>) -> Vec { + let data = ctx.data_unchecked::(); + data.graphs + .read() .iter() - .find(|vv| vv.id() == id) - .map(|vv| vv.into()) - } - - async fn algorithms(&self) -> Algorithms { - self.graph.clone().into() - } -} - -#[derive(ResolvedObject)] -pub(crate) struct Property { - key: String, - value: Prop, -} - -impl Property { - fn new(key: String, value: Prop) -> Self { - Self { key, value } - } -} - -#[ResolvedObjectFields] -impl Property { - async fn key(&self, _ctx: &Context<'_>) -> String { - self.key.to_string() - } - - async fn value(&self, _ctx: &Context<'_>) -> String { - self.value.to_string() - } -} - -#[derive(ResolvedObject)] -pub(crate) struct Node { - vv: VertexView, -} - -impl From> for Node { - fn from(vv: VertexView) -> Self { - Self { vv } - } -} - -#[ResolvedObjectFields] -impl Node { - async fn id(&self) -> u64 { - self.vv.id() - } - - async fn name(&self) -> String { - self.vv.name() + .map(|(name, g)| GraphMeta::new(name.clone(), g.deref().clone().into_dynamic())) + .collect_vec() } - async fn property_names<'a>(&self, _ctx: &Context<'a>) -> Vec { - self.vv.property_names(true) - } - - async fn properties(&self) -> Option> { + async fn receive_graph<'a>(ctx: &Context<'a>, name: &str) -> Result { + let data = ctx.data_unchecked::(); + let g = data + .graphs + .read() + .get(name) + .cloned() + .ok_or(MissingGraph)? 
+ .materialize()?; + let bincode = bincode::serialize(&g)?; + Ok(URL_SAFE_NO_PAD.encode(bincode)) + } + + async fn similarity_search<'a>( + ctx: &Context<'a>, + graph: &str, + query: &str, + init: Option, + min_nodes: Option, + min_edges: Option, + limit: Option, + window_start: Option, + window_end: Option, + ) -> Option> { + let init = init.unwrap_or(1); + let min_nodes = min_nodes.unwrap_or(0); + let min_edges = min_edges.unwrap_or(0); + let limit = limit.unwrap_or(1); + let data = ctx.data_unchecked::(); + let binding = data.vector_stores.read(); + let vec_store = binding.get(graph)?; + println!("running similarity search for {query}"); Some( - self.vv - .properties(true) - .into_iter() - .map(|(k, v)| Property::new(k, v)) - .collect_vec(), + vec_store + .similarity_search( + query, + init, + min_nodes, + min_edges, + limit, + window_start, + window_end, + ) + .await, ) } - - async fn property(&self, name: String) -> Option { - let prop = self.vv.property(name.clone(), true)?; - Some(Property::new(name, prop)) - } - - async fn in_neighbours<'a>(&self, _ctx: &Context<'a>) -> Vec { - self.vv.in_neighbours().iter().map(|vv| vv.into()).collect() - } - - async fn out_neighbours(&self) -> Vec { - self.vv - .out_neighbours() - .iter() - .map(|vv| vv.into()) - .collect() - } - - async fn neighbours<'a>(&self, _ctx: &Context<'a>) -> Vec { - self.vv.neighbours().iter().map(|vv| vv.into()).collect() - } - - async fn degree(&self) -> usize { - self.vv.degree() - } - - async fn out_degree(&self) -> usize { - self.vv.out_degree() - } - - async fn in_degree(&self) -> usize { - self.vv.in_degree() - } - - async fn out_edges(&self) -> Vec { - self.vv.out_edges().map(|ee| ee.clone().into()).collect() - } - - async fn in_edges(&self) -> Vec { - self.vv.in_edges().map(|ee| ee.into()).collect() - } - - async fn exploded_edges(&self) -> Vec { - self.vv.out_edges().explode().map(|ee| ee.into()).collect() - } - - async fn start_date(&self) -> Option { - self.vv.earliest_time() - } - - 
async fn end_date(&self) -> Option { - self.vv.latest_time() - } -} - -#[derive(ResolvedObject)] -pub(crate) struct Edge { - ee: EdgeView, } -impl From> for Edge { - fn from(ee: EdgeView) -> Self { - Self { ee } +#[derive(MutationRoot)] +pub(crate) struct MutRoot; + +#[derive(Mutation)] +pub(crate) struct Mut(MutRoot); + +#[MutationFields] +impl Mut { + /// Load graphs from a directory of bincode files (existing graphs with the same name are overwritten) + /// + /// # Returns: + /// list of names for newly added graphs + async fn load_graphs_from_path<'a>(ctx: &Context<'a>, path: String) -> Vec { + let new_graphs = Data::load_from_file(&path); + let keys: Vec<_> = new_graphs.keys().cloned().collect(); + let mut data = ctx.data_unchecked::().graphs.write(); + data.extend(new_graphs); + keys + } + + async fn rename_graph<'a>( + ctx: &Context<'a>, + parent_graph_name: String, + graph_name: String, + new_graph_name: String, + ) -> Result { + if new_graph_name.ne(&graph_name) && parent_graph_name.ne(&graph_name) { + let mut data = ctx.data_unchecked::().graphs.write(); + + let subgraph = data.get(&graph_name).ok_or("Graph not found")?; + let path = subgraph + .properties() + .constant() + .get("path") + .ok_or("Path is missing")? 
+ .to_string(); + + let parent_graph = data.get(&parent_graph_name).ok_or("Graph not found")?; + let new_subgraph = parent_graph + .subgraph(subgraph.vertices().iter().map(|v| v.name()).collect_vec()) + .materialize()?; + + let static_props_without_name: Vec<(ArcStr, Prop)> = subgraph + .properties() + .into_iter() + .filter(|(a, _)| a != "name") + .collect_vec(); + + new_subgraph.add_constant_properties(static_props_without_name)?; + new_subgraph + .add_constant_properties([("name", Prop::Str(new_graph_name.clone().into()))])?; + + let dt = Utc::now(); + let timestamp: i64 = dt.timestamp(); + new_subgraph.add_constant_properties([("lastUpdated", Prop::I64(timestamp * 1000))])?; + + new_subgraph.save_to_file(path)?; + + let gi: IndexedGraph = new_subgraph + .into_events() + .ok_or("Graph with deletions not supported")? + .into(); + + data.insert(new_graph_name, gi); + data.remove(&graph_name); + } + + Ok(true) + } + + async fn save_graph<'a>( + ctx: &Context<'a>, + parent_graph_name: String, + graph_name: String, + new_graph_name: String, + props: String, + graph_nodes: Vec, + ) -> Result { + let mut data = ctx.data_unchecked::().graphs.write(); + + let subgraph = data.get(&graph_name).ok_or("Graph not found")?; + let mut path = subgraph + .properties() + .constant() + .get("path") + .ok_or("Path is missing")? + .to_string(); + + if new_graph_name.ne(&graph_name) { + fn path_prefix(path: String) -> Result { + let elements: Vec<&str> = path.split('/').collect(); + let size = elements.len(); + return if size > 2 { + let delimiter = "/"; + let joined_string = elements + .iter() + .take(size - 1) + .copied() + .collect::>() + .join(delimiter); + Ok(joined_string) + } else { + Err("Invalid graph path".into()) + }; + } + + path = path_prefix(path)? 
+ "/" + &Uuid::new_v4().hyphenated().to_string(); + } + + let parent_graph = data.get(&parent_graph_name).ok_or("Graph not found")?; + + let new_subgraph = parent_graph.subgraph(graph_nodes).materialize()?; + + new_subgraph.add_constant_properties([("name", Prop::str(new_graph_name.clone()))])?; + + // parent_graph_name == graph_name, means its a graph created from UI + if parent_graph_name.ne(&graph_name) { + // graph_name == new_graph_name, means its a "save" and not "save as" action + if graph_name.ne(&new_graph_name) { + let static_props: Vec<(ArcStr, Prop)> = subgraph + .properties() + .into_iter() + .filter(|(a, _)| a != "name" && a != "creationTime" && a != "uiProps") + .collect_vec(); + new_subgraph.add_constant_properties(static_props)?; + } else { + let static_props: Vec<(ArcStr, Prop)> = subgraph + .properties() + .into_iter() + .filter(|(a, _)| a != "name" && a != "lastUpdated" && a != "uiProps") + .collect_vec(); + new_subgraph.add_constant_properties(static_props)?; + } + } + + let dt = Utc::now(); + let timestamp: i64 = dt.timestamp(); + + if parent_graph_name.eq(&graph_name) || graph_name.ne(&new_graph_name) { + new_subgraph + .add_constant_properties([("creationTime", Prop::I64(timestamp * 1000))])?; + } + + new_subgraph.add_constant_properties([("lastUpdated", Prop::I64(timestamp * 1000))])?; + new_subgraph.add_constant_properties([("uiProps", Prop::Str(props.into()))])?; + + new_subgraph.save_to_file(path)?; + + let gi: IndexedGraph = new_subgraph + .into_events() + .ok_or("Graph with deletions not supported")? 
+ .into(); + + data.insert(new_graph_name, gi); + + Ok(true) + } + + /// Load new graphs from a directory of bincode files (existing graphs will not be overwritten) + /// + /// # Returns: + /// list of names for newly added graphs + async fn load_new_graphs_from_path<'a>(ctx: &Context<'a>, path: String) -> Vec { + let mut data = ctx.data_unchecked::().graphs.write(); + let new_graphs: HashMap<_, _> = Data::load_from_file(&path) + .into_iter() + .filter(|(key, _)| !data.contains_key(key)) + .collect(); + let keys: Vec<_> = new_graphs.keys().cloned().collect(); + data.extend(new_graphs); + keys + } + + /// Use GQL multipart upload to send new graphs to server + /// + /// # Returns: + /// name of the new graph + async fn upload_graph<'a>(ctx: &Context<'a>, name: String, graph: Upload) -> Result { + let g: MaterializedGraph = + bincode::deserialize_from(BufReader::new(graph.value(ctx)?.content))?; + let gi: IndexedGraph = g + .into_events() + .ok_or("Graph with deletions not supported")? + .into(); + let mut data = ctx.data_unchecked::().graphs.write(); + data.insert(name.clone(), gi); + Ok(name) + } + + /// Send graph bincode as base64 encoded string + /// + /// # Returns: + /// name of the new graph + async fn send_graph<'a>(ctx: &Context<'a>, name: String, graph: String) -> Result { + let g: MaterializedGraph = bincode::deserialize(&URL_SAFE_NO_PAD.decode(graph)?)?; + let mut data = ctx.data_unchecked::().graphs.write(); + data.insert( + name.clone(), + g.into_events() + .ok_or("Graph with deletions not supported")? + .into(), + ); + Ok(name) + } + + async fn archive_graph<'a>( + ctx: &Context<'a>, + graph_name: String, + parent_graph_name: String, + is_archive: u8, + ) -> Result { + let mut data = ctx.data_unchecked::().graphs.write(); + + let subgraph = data.get(&graph_name).ok_or("Graph not found")?; + + let path = subgraph + .properties() + .constant() + .get("path") + .ok_or("Path is missing")? 
+ .to_string(); + + let parent_graph = data.get(&parent_graph_name).ok_or("Graph not found")?; + let new_subgraph = parent_graph + .subgraph(subgraph.vertices().iter().map(|v| v.name()).collect_vec()) + .materialize()?; + + let static_props_without_isactive: Vec<(ArcStr, Prop)> = subgraph + .properties() + .into_iter() + .filter(|(a, _)| a != "isArchive") + .collect_vec(); + new_subgraph.add_constant_properties(static_props_without_isactive)?; + new_subgraph.add_constant_properties([("isArchive", Prop::U8(is_archive))])?; + new_subgraph.save_to_file(path)?; + + let gi: IndexedGraph = new_subgraph + .into_events() + .ok_or("Graph with deletions not supported")? + .into(); + + data.insert(graph_name, gi); + + Ok(true) } } -#[ResolvedObjectFields] -impl Edge { - async fn earliest_time(&self) -> Option { - self.ee.earliest_time() - } - - async fn latest_time(&self) -> Option { - self.ee.latest_time() - } - - async fn src(&self) -> Node { - self.ee.src().into() - } - - async fn dst(&self) -> Node { - self.ee.dst().into() - } - - async fn property(&self, name: String) -> Option { - let prop = self.ee.property(name.clone(), true)?; - Some(Property::new(name, prop)) - } - - async fn history(&self) -> Vec { - self.ee.history() - } -} +#[derive(App)] +pub(crate) struct App(QueryRoot, MutRoot, Mut); diff --git a/raphtory-graphql/src/model/schema/edge_schema.rs b/raphtory-graphql/src/model/schema/edge_schema.rs new file mode 100644 index 0000000000..19cc277a39 --- /dev/null +++ b/raphtory-graphql/src/model/schema/edge_schema.rs @@ -0,0 +1,65 @@ +use crate::model::schema::{ + get_vertex_type, merge_schemas, property_schema::PropertySchema, SchemaAggregate, +}; +use dynamic_graphql::{ResolvedObject, ResolvedObjectFields}; +use itertools::Itertools; +use raphtory::{ + db::graph::edge::EdgeView, + prelude::{EdgeViewOps, GraphViewOps}, +}; +use std::collections::{HashMap, HashSet}; + +#[derive(ResolvedObject)] +pub(crate) struct EdgeSchema { + graph: G, + src_type: String, + 
dst_type: String, +} + +impl EdgeSchema { + pub fn new(graph: G, src_type: String, dst_type: String) -> Self { + Self { + graph, + src_type, + dst_type, + } + } +} + +#[ResolvedObjectFields] +impl EdgeSchema { + /// Returns the type of source for these edges + async fn src_type(&self) -> String { + self.src_type.clone() + } + + /// Returns the type of destination for these edges + async fn dst_type(&self) -> String { + self.dst_type.clone() + } + + /// Returns the list of property schemas for edges connecting these types of nodes + async fn properties(&self) -> Vec { + let filter_types = |edge: &EdgeView| { + let src_type = get_vertex_type(edge.src()); + let dst_type = get_vertex_type(edge.dst()); + src_type == self.src_type && dst_type == self.dst_type + }; + + let filtered_edges = self.graph.edges().filter(filter_types); + + let schema: SchemaAggregate = filtered_edges + .map(collect_edge_schema) + .reduce(merge_schemas) + .unwrap_or_else(|| HashMap::new()); + + schema.into_iter().map(|prop| prop.into()).collect_vec() + } +} + +fn collect_edge_schema(edge: EdgeView) -> SchemaAggregate { + edge.properties() + .iter() + .map(|(key, value)| (key.to_string(), HashSet::from([value.to_string()]))) + .collect() +} diff --git a/raphtory-graphql/src/model/schema/graph_schema.rs b/raphtory-graphql/src/model/schema/graph_schema.rs new file mode 100644 index 0000000000..8254872075 --- /dev/null +++ b/raphtory-graphql/src/model/schema/graph_schema.rs @@ -0,0 +1,32 @@ +use crate::model::schema::{layer_schema::LayerSchema, node_schema::NodeSchema}; +use dynamic_graphql::SimpleObject; +use itertools::Itertools; +use raphtory::{ + db::api::view::internal::DynamicGraph, + prelude::{GraphViewOps, LayerOps, VertexViewOps}, +}; + +#[derive(SimpleObject)] +pub(crate) struct GraphSchema { + nodes: Vec, + layers: Vec>, +} + +impl GraphSchema { + pub fn new(graph: &DynamicGraph) -> Self { + let nodes = graph + .vertices() + .iter() + .filter_map(|vertex| 
vertex.properties().get("type").map(|p| p.to_string())) + .unique() + .map(|node_type| NodeSchema::new(node_type, graph.clone())) + .collect_vec(); + + let layers = graph + .unique_layers() + .map(|layer_name| graph.layer(layer_name).unwrap().into()) + .collect_vec(); + + GraphSchema { nodes, layers } + } +} diff --git a/raphtory-graphql/src/model/schema/layer_schema.rs b/raphtory-graphql/src/model/schema/layer_schema.rs new file mode 100644 index 0000000000..5467b568d6 --- /dev/null +++ b/raphtory-graphql/src/model/schema/layer_schema.rs @@ -0,0 +1,46 @@ +use crate::model::schema::{edge_schema::EdgeSchema, get_vertex_type}; +use dynamic_graphql::{ResolvedObject, ResolvedObjectFields}; +use itertools::Itertools; +use raphtory::{ + db::graph::views::layer_graph::LayeredGraph, + prelude::{EdgeViewOps, GraphViewOps}, +}; + +#[derive(ResolvedObject)] +pub(crate) struct LayerSchema { + graph: LayeredGraph, +} + +impl From> for LayerSchema { + fn from(value: LayeredGraph) -> Self { + Self { graph: value } + } +} + +#[ResolvedObjectFields] +impl LayerSchema { + /// Returns the name of the layer with this schema + async fn name(&self) -> String { + let mut layers = self.graph.unique_layers(); + let layer = layers.next().expect("Layered graph has a layer"); + debug_assert!( + layers.next().is_none(), + "Layered graph outputted more than one layer name" + ); + layer.into() + } + /// Returns the list of edge schemas for this edge layer + async fn edges(&self) -> Vec>> { + self.graph + .edges() + .into_iter() + .map(|edge| { + let src_type = get_vertex_type(edge.src()); + let dst_type = get_vertex_type(edge.dst()); + (src_type, dst_type) + }) + .unique() + .map(|(src_type, dst_type)| EdgeSchema::new(self.graph.clone(), src_type, dst_type)) + .collect_vec() + } +} diff --git a/raphtory-graphql/src/model/schema/mod.rs b/raphtory-graphql/src/model/schema/mod.rs new file mode 100644 index 0000000000..5d10db0d79 --- /dev/null +++ b/raphtory-graphql/src/model/schema/mod.rs @@ -0,0 
+1,39 @@ +use raphtory::{ + db::graph::vertex::VertexView, + prelude::{GraphViewOps, VertexViewOps}, +}; +use std::collections::{HashMap, HashSet}; + +pub(crate) mod edge_schema; +pub(crate) mod graph_schema; +pub(crate) mod layer_schema; +pub(crate) mod node_schema; +pub(crate) mod property_schema; + +const ENUM_BOUNDARY: usize = 20; + +fn get_vertex_type(vertex: VertexView) -> String { + let prop = vertex.properties().get("type"); + prop.map(|prop| prop.to_string()) + .unwrap_or_else(|| "NONE".to_string()) +} + +type SchemaAggregate = HashMap>; + +fn merge_schemas(mut s1: SchemaAggregate, s2: SchemaAggregate) -> SchemaAggregate { + for (key, set2) in s2 { + if let Some(set1) = s1.get_mut(&key) { + // Here, an empty set means: too many values to be interpreted as an enumerated type + if set1.len() > 0 && set2.len() > 0 { + set1.extend(set2); + } + if set1.len() > ENUM_BOUNDARY { + set1.clear(); + } + } else { + s1.insert(key, set2); + } + } + + s1 +} diff --git a/raphtory-graphql/src/model/schema/node_schema.rs b/raphtory-graphql/src/model/schema/node_schema.rs new file mode 100644 index 0000000000..3516569f91 --- /dev/null +++ b/raphtory-graphql/src/model/schema/node_schema.rs @@ -0,0 +1,56 @@ +use crate::model::schema::{merge_schemas, property_schema::PropertySchema, SchemaAggregate}; +use dynamic_graphql::{ResolvedObject, ResolvedObjectFields}; +use itertools::Itertools; +use raphtory::{ + db::{api::view::internal::DynamicGraph, graph::vertex::VertexView}, + prelude::{GraphViewOps, VertexViewOps}, +}; +use std::collections::{HashMap, HashSet}; + +#[derive(ResolvedObject)] +pub(crate) struct NodeSchema { + type_name: String, + graph: DynamicGraph, +} + +impl NodeSchema { + pub fn new(node_type: String, graph: DynamicGraph) -> Self { + Self { + type_name: node_type, + graph, + } + } +} + +#[ResolvedObjectFields] +impl NodeSchema { + async fn type_name(&self) -> String { + self.type_name.clone() + } + + /// Returns the list of property schemas for this node + 
async fn properties(&self) -> Vec { + let filter_type = |vertex: &VertexView| match vertex.properties().get("type") + { + Some(node_type) => node_type.to_string() == self.type_name, + None => false, + }; + + let filtered_vertices = self.graph.vertices().iter().filter(filter_type); + + let schema: SchemaAggregate = filtered_vertices + .map(collect_vertex_schema) + .reduce(merge_schemas) + .unwrap_or_else(|| HashMap::new()); + + schema.into_iter().map(|prop| prop.into()).collect_vec() + } +} + +fn collect_vertex_schema(vertex: VertexView) -> SchemaAggregate { + vertex + .properties() + .iter() + .map(|(key, value)| (key.to_string(), HashSet::from([value.to_string()]))) + .collect() +} diff --git a/raphtory-graphql/src/model/schema/property_schema.rs b/raphtory-graphql/src/model/schema/property_schema.rs new file mode 100644 index 0000000000..edb40cfadf --- /dev/null +++ b/raphtory-graphql/src/model/schema/property_schema.rs @@ -0,0 +1,24 @@ +use dynamic_graphql::SimpleObject; +use std::collections::HashSet; + +#[derive(SimpleObject)] +pub(crate) struct PropertySchema { + key: String, + variants: Vec, +} + +// impl PropertySchema { +// pub fn new(key: String, values: Vec) -> Self { +// Self { key, values } +// } +// } + +impl From<(String, HashSet)> for PropertySchema { + fn from(value: (String, HashSet)) -> Self { + let (key, set) = value; + PropertySchema { + key, + variants: Vec::from_iter(set), + } + } +} diff --git a/raphtory-graphql/src/observability/tracing.rs b/raphtory-graphql/src/observability/tracing.rs index 7b4f1fb8c7..2e3986ede5 100644 --- a/raphtory-graphql/src/observability/tracing.rs +++ b/raphtory-graphql/src/observability/tracing.rs @@ -1,6 +1,10 @@ -use opentelemetry::sdk::trace::{self, Sampler}; use opentelemetry::{ - global, runtime::Tokio, sdk::propagation::TraceContextPropagator, sdk::trace::Tracer, + global, + runtime::Tokio, + sdk::{ + propagation::TraceContextPropagator, + trace::{self, Sampler, Tracer}, + }, }; use std::env; diff --git 
a/raphtory-graphql/src/routes.rs b/raphtory-graphql/src/routes.rs index 6669027a0c..22865da9c4 100644 --- a/raphtory-graphql/src/routes.rs +++ b/raphtory-graphql/src/routes.rs @@ -1,9 +1,11 @@ use async_graphql::http::{playground_source, GraphQLPlaygroundConfig}; -use poem::http::StatusCode; -use poem::web::{Html, Json}; -use poem::{handler, IntoResponse}; +use poem::{ + handler, + http::StatusCode, + web::{Html, Json}, + IntoResponse, +}; use serde::Serialize; -use tracing::{span, Instrument, Level}; #[derive(Serialize)] struct Health { diff --git a/raphtory-graphql/src/server.rs b/raphtory-graphql/src/server.rs index 12c2fabee0..d9410bde50 100644 --- a/raphtory-graphql/src/server.rs +++ b/raphtory-graphql/src/server.rs @@ -1,29 +1,86 @@ -use crate::data::Data; -use crate::model::algorithm::Algorithm; -use crate::model::QueryRoot; -use crate::observability::tracing::create_tracer_from_env; -use crate::routes::{graphql_playground, health}; +#![allow(dead_code)] + +use crate::{ + data::Data, + model::{algorithm::Algorithm, App}, + observability::tracing::create_tracer_from_env, + routes::{graphql_playground, health}, +}; use async_graphql_poem::GraphQL; -use dynamic_graphql::App; -use poem::listener::TcpListener; -use poem::middleware::Cors; -use poem::{get, EndpointExt, Route, Server}; -use tokio::io::Result as IoResult; -use tokio::signal; -use tracing_subscriber::layer::SubscriberExt; -use tracing_subscriber::util::SubscriberInitExt; -use tracing_subscriber::Registry; +use poem::{get, listener::TcpListener, middleware::Cors, EndpointExt, Route, Server}; +use raphtory::{ + db::graph::{edge::EdgeView, vertex::VertexView}, + prelude::Graph, + vectors::{Embedding, Vectorizable}, +}; +use std::{collections::HashMap, future::Future, ops::Deref, path::Path}; +use tokio::{io::Result as IoResult, signal}; +use tracing_subscriber::{layer::SubscriberExt, util::SubscriberInitExt, EnvFilter, Registry}; pub struct RaphtoryServer { data: Data, } impl RaphtoryServer { - pub fn 
new(graph_directory: &str) -> Self { - let data = Data::load(graph_directory); + pub fn from_map(graphs: HashMap) -> Self { + let data = Data::from_map(graphs); + Self { data } + } + + pub fn from_directory(graph_directory: &str) -> Self { + let data = Data::from_directory(graph_directory); Self { data } } + pub fn from_map_and_directory(graphs: HashMap, graph_directory: &str) -> Self { + let data = Data::from_map_and_directory(graphs, graph_directory); + Self { data } + } + + pub async fn with_vectorized( + self, + graph_names: Vec, + embedding: F, + cache_dir: &Path, + templates: Option<(N, E)>, + ) -> Self + where + F: Fn(Vec) -> U + Send + Sync + Copy + 'static, + U: Future> + Send + 'static, + N: Fn(&VertexView) -> String + Sync + Send + Copy + 'static, + E: Fn(&EdgeView) -> String + Sync + Send + Copy + 'static, + { + { + let graphs_map = self.data.graphs.read(); + let mut stores_map = self.data.vector_stores.write(); + + for graph_name in graph_names { + let graph_cache = cache_dir.join(&graph_name); + let graph = graphs_map.get(&graph_name).unwrap().deref().clone(); + + println!("Loading embeddings for {graph_name} using cache from {graph_cache:?}"); + let vectorized = match templates { + Some((node_template, edge_template)) => { + graph + .vectorize_with_templates( + Box::new(embedding), + &graph_cache, + node_template, + edge_template, + ) + .await + } + None => graph.vectorize(Box::new(embedding), &graph_cache).await, + }; + stores_map.insert(graph_name, vectorized); + } + } + + println!("Embeddings were loaded successfully"); + + self + } + pub fn register_algorithm(self, name: &str) -> Self { crate::model::algorithm::PLUGIN_ALGOS .lock() @@ -38,19 +95,16 @@ impl RaphtoryServer { pub async fn run_with_port(self, port: u16) -> IoResult<()> { let registry = Registry::default().with(tracing_subscriber::fmt::layer().pretty()); + let env_filter = EnvFilter::try_from_default_env().unwrap_or(EnvFilter::new("INFO")); match create_tracer_from_env() { 
Some(tracer) => registry .with(tracing_opentelemetry::layer().with_tracer(tracer)) - .try_init() - .expect("Failed to register tracer with registry"), - None => registry - .try_init() - .expect("Failed to register tracer with registry"), + .with(env_filter) + .try_init(), + None => registry.with(env_filter).try_init(), } - - #[derive(App)] - struct App(QueryRoot); + .unwrap_or(()); // it is important that this runs after algorithms have been pushed to PLUGIN_ALGOS static variable let schema_builder = App::create_schema(); diff --git a/raphtory-io/src/graph_loader/source/polars_loader.rs b/raphtory-io/src/graph_loader/source/polars_loader.rs deleted file mode 100644 index 1f38ce7052..0000000000 --- a/raphtory-io/src/graph_loader/source/polars_loader.rs +++ /dev/null @@ -1 +0,0 @@ -//! TBD: Provides functionality for loading graph data from Polars DataFrames. diff --git a/raphtory-io/src/lib.rs b/raphtory-io/src/lib.rs deleted file mode 100644 index 4f0a6bef78..0000000000 --- a/raphtory-io/src/lib.rs +++ /dev/null @@ -1,81 +0,0 @@ -//! # raphtory -//! -//! `raphtory-io` is a module for loading graphs into raphtory from various sources, like csv, neo4j, etc. -//! -//! ## Examples -//! -//! Load a pre-built graph -//! ```rust -//! use raphtory::algorithms::degree::average_degree; -//! use raphtory::db::graph::Graph; -//! use raphtory::db::view_api::*; -//! use raphtory_io::graph_loader::example::lotr_graph::lotr_graph; -//! -//! let graph = lotr_graph(3); -//! -//! // Get the in-degree, out-degree of Gandalf -//! // The graph.vertex option returns a result of an option, -//! // so we need to unwrap the result and the option or -//! // we can use this if let instead -//! if let Some(gandalf) = graph.vertex("Gandalf") { -//! println!("Gandalf in degree: {:?}", gandalf.in_degree()); -//! println!("Gandalf out degree: {:?}", gandalf.out_degree()); -//! } -//! -//! // Run an average degree algorithm on the graph -//! 
println!("Average degree: {:?}", average_degree(&graph)); -//! ``` -//! -//! Load a graph from csv -//! -//! ```no_run -//! use raphtory::db::graph::Graph; -//! use raphtory::core::Prop; -//! use std::time::Instant; -//! use raphtory_io::graph_loader::source::csv_loader::CsvLoader; -//! use serde::Deserialize; -//! -//! let data_dir = "/tmp/lotr.csv"; -//! -//! #[derive(Deserialize, std::fmt::Debug)] -//! pub struct Lotr { -//! src_id: String, -//! dst_id: String, -//! time: i64, -//! } -//! -//! let g = Graph::new(2); -//! let now = Instant::now(); -//! -//! CsvLoader::new(data_dir) -//! .load_into_graph(&g, |lotr: Lotr, g: &Graph| { -//! g.add_vertex( -//! lotr.time, -//! lotr.src_id.clone(), -//! &vec![("type".to_string(), Prop::Str("Character".to_string()))], -//! ) -//! .expect("Failed to add vertex"); -//! -//! g.add_vertex( -//! lotr.time, -//! lotr.dst_id.clone(), -//! &vec![("type".to_string(), Prop::Str("Character".to_string()))], -//! ) -//! .expect("Failed to add vertex"); -//! -//! g.add_edge( -//! lotr.time, -//! lotr.src_id.clone(), -//! lotr.dst_id.clone(), -//! &vec![( -//! "type".to_string(), -//! Prop::Str("Character Co-occurrence".to_string()), -//! )], -//! None, -//! ) -//! .expect("Failed to add edge"); -//! }) -//! .expect("Failed to load graph from CSV data files"); -//! ``` -//! 
-pub mod graph_loader; diff --git a/raphtory/Cargo.toml b/raphtory/Cargo.toml index 42bdc866ec..4d71034241 100644 --- a/raphtory/Cargo.toml +++ b/raphtory/Cargo.toml @@ -12,7 +12,6 @@ license.workspace = true readme.workspace = true homepage.workspace = true - # See more keys and their definitions at https://doc.rust-lang.org/cargo/reference/manifest.html [dependencies] @@ -23,7 +22,7 @@ futures = {version = "0.3", features = ["thread-pool"] } genawaiter = "0.99" itertools="0.10" num-traits = "0.2" -parking_lot = { version = "0.12" , features = ["serde", "arc_lock"] } +parking_lot = { version = "0.12" , features = ["serde", "arc_lock", "send_guard"] } quickcheck = "1" quickcheck_macros = "1" once_cell = "1" @@ -37,13 +36,55 @@ rustc-hash = "1.1.0" serde = { version = "1", features = ["derive","rc"] } sorted_vector_map = "0.1" tempdir = "0.3" -# tokio = { version = "1.27.0", features = ["full"] } thiserror = "1" twox-hash = "1.6.3" uuid = { version = "1.3.0", features = ["v4"] } +lock_api = { version = "0.4", features = ["arc_lock", "serde"] } +dashmap = {version ="5", features = ["serde"] } +serde_with = "3.3.0" +enum_dispatch = "0.3" +kdam = "0.4.1" + +# io optional dependencies +csv = {version="1.1.6", optional=true} +zip = {version ="0.6.6", optional=true} +neo4rs = {version="0.6.1", optional=true} +bzip2 = {version="0.4", optional=true} +flate2 = {version="1.0", optional=true} +serde_json = {version="1", optional=true} +reqwest = { version = "0.11.14", features = ["blocking"], optional=true} +tokio = { version = "1.27.0", features = ["full"], optional=true} + +# search optional dependencies +tantivy = {version="0.20", optional=true} # 0.21 does not work (see https://github.com/quickwit-oss/tantivy/issues/2175) + +# vectors optional dependencies +futures-util = {version="0.3.0", optional=true} +async-trait = {version="0.1.73", optional=true} + +# python binding optional dependencies +pyo3 = {version= "0.19.2", features=["multiple-pymethods", "chrono"], 
optional=true} +pyo3-asyncio = { version = "0.19.0", features = ["tokio-runtime"], optional=true } +num = {version="0.4.0", optional=true} +display-error-chain = {version= "0.2.0", optional=true} +arrow2 = {version="0.17", optional=true} +ordered-float = "3.7.0" + [dev-dependencies] csv = "1" pretty_assertions = "1" quickcheck = "1" quickcheck_macros = "1" +tempfile = "3.2" + +[features] +default = ["search"] +# Enables the graph loader io module +io = ["dep:zip", "dep:neo4rs", "dep:bzip2", "dep:flate2", "dep:csv", "dep:serde_json", "dep:reqwest", "dep:tokio"] +# Enables generating the pyo3 python bindings +python = ["io", "vectors", "dep:pyo3", "dep:pyo3-asyncio", "dep:num", "dep:display-error-chain", "dep:arrow2"] +# search +search = ["dep:tantivy"] +# vectors +vectors = ["dep:futures-util", "dep:async-trait"] diff --git a/raphtory/src/algorithms/algorithm_result.rs b/raphtory/src/algorithms/algorithm_result.rs new file mode 100644 index 0000000000..2f4d3577b8 --- /dev/null +++ b/raphtory/src/algorithms/algorithm_result.rs @@ -0,0 +1,508 @@ +use itertools::Itertools; +use num_traits::Float; +use ordered_float::OrderedFloat; +use std::{ + borrow::Borrow, + collections::{hash_map::Iter, HashMap}, + fmt, + fmt::Debug, + hash::Hash, + marker::PhantomData, +}; + +pub trait AsOrd { + /// Converts reference of this type into reference of an ordered Type. + /// + /// This is the same as AsRef (with the additional constraint that the target type needs to be ordered). + /// + /// Importantly, unlike AsRef, this blanket-implements the trivial conversion from a type to itself! + fn as_ord(&self) -> &T; +} + +impl AsOrd for T { + fn as_ord(&self) -> &T { + self + } +} + +impl AsOrd> for T { + fn as_ord(&self) -> &OrderedFloat { + self.into() + } +} + +impl AsOrd<(OrderedFloat, OrderedFloat)> for (T, T) { + fn as_ord(&self) -> &(OrderedFloat, OrderedFloat) { + // Safety: OrderedFloat is #[repr(transparent)] and has no invalid values, i.e. 
there is no physical difference between OrderedFloat and Float. + unsafe { &*(self as *const (T, T) as *const (OrderedFloat, OrderedFloat)) } + } +} + +/// A generic `AlgorithmResult` struct that represents the result of an algorithm computation. +/// +/// The `AlgorithmResult` contains a hashmap, where keys (`H`) are cloneable, hashable, and comparable, +/// and values (`Y`) are cloneable. The keys and values can be of any type that satisfies the specified +/// trait bounds. +/// +/// This `AlgorithmResult` is returned for all algorithms that return a HashMap +/// +pub struct AlgorithmResult { + /// The result hashmap that stores keys of type `H` and values of type `Y`. + pub result: HashMap, + marker: PhantomData, +} + +impl AlgorithmResult +where + K: Clone + Hash + Eq + Ord, + V: Clone, +{ + /// Creates a new instance of `AlgorithmResult` with the provided hashmap. + /// + /// # Arguments + /// + /// * `result`: A `HashMap` with keys of type `H` and values of type `Y`. + pub fn new(result: HashMap) -> Self { + Self { + result, + marker: PhantomData, + } + } + + /// Returns a reference to the entire `result` hashmap. + pub fn get_all(&self) -> &HashMap { + &self.result + } + + /// Returns the value corresponding to the provided key in the `result` hashmap. + /// + /// # Arguments + /// + /// * `key`: The key of type `H` for which the value is to be retrieved. + pub fn get(&self, key: &Q) -> Option<&V> + where + Q: Hash + Eq + ?Sized, + K: Borrow, + { + self.result.get(key) + } + + /// Sorts the `AlgorithmResult` by its keys in ascending or descending order. + /// + /// # Arguments + /// + /// * `reverse`: If `true`, sorts the result in descending order; otherwise, sorts in ascending order. + /// + /// # Returns + /// + /// A sorted vector of tuples containing keys of type `H` and values of type `Y`. 
+ pub fn sort_by_key(&self, reverse: bool) -> Vec<(K, V)> { + let mut sorted: Vec<(K, V)> = self.result.clone().into_iter().collect(); + sorted.sort_by(|(a, _), (b, _)| if reverse { b.cmp(a) } else { a.cmp(b) }); + sorted + } + + pub fn iter(&self) -> Iter<'_, K, V> { + self.result.iter() + } + + /// Sorts the `AlgorithmResult` by its values in ascending or descending order. + /// + /// # Arguments + /// + /// * `reverse`: If `true`, sorts the result in descending order; otherwise, sorts in ascending order. + /// + /// # Returns + /// + /// A sorted vector of tuples containing keys of type `H` and values of type `Y`. + pub fn sort_by std::cmp::Ordering>( + &self, + mut cmp: F, + reverse: bool, + ) -> Vec<(K, V)> { + let mut sorted: Vec<(K, V)> = self.result.clone().into_iter().collect(); + sorted.sort_by(|(_, a), (_, b)| if reverse { cmp(b, a) } else { cmp(a, b) }); + sorted + } + + /// Retrieves the top-k elements from the `AlgorithmResult` based on its values. + /// + /// # Arguments + /// + /// * `k`: The number of elements to retrieve. + /// * `percentage`: If `true`, the `k` parameter is treated as a percentage of total elements. + /// * `reverse`: If `true`, retrieves the elements in descending order; otherwise, in ascending order. + /// + /// # Returns + /// + /// An `a vector of tuples with keys of type `H` and values of type `Y`. + /// If `percentage` is `true`, the returned vector contains the top `k` percentage of elements. + /// If `percentage` is `false`, the returned vector contains the top `k` elements. + /// Returns empty vec if the result is empty or if `k` is 0. 
+ pub fn top_k_by std::cmp::Ordering>( + &self, + cmp: F, + k: usize, + percentage: bool, + reverse: bool, + ) -> Vec<(K, V)> { + let k = if percentage { + let total_count = self.result.len(); + (total_count as f64 * (k as f64 / 100.0)) as usize + } else { + k + }; + self.sort_by(cmp, reverse).into_iter().take(k).collect() + } + + pub fn min_by std::cmp::Ordering>(&self, mut cmp: F) -> Option<(K, V)> { + self.result + .iter() + .min_by(|a, b| cmp(a.1, b.1)) + .map(|(k, v)| (k.clone(), v.clone())) + } + + pub fn max_by std::cmp::Ordering>(&self, mut cmp: F) -> Option<(K, V)> { + self.result + .iter() + .max_by(|a, b| cmp(a.1, b.1)) + .map(|(k, v)| (k.clone(), v.clone())) + } + + pub fn median_by std::cmp::Ordering>(&self, mut cmp: F) -> Option<(K, V)> { + let mut items: Vec<_> = self.result.iter().collect(); + let len = items.len(); + if len == 0 { + return None; + } + items.sort_by(|(_, a), (_, b)| cmp(a, b)); + let median_index = len / 2; + Some((items[median_index].0.clone(), items[median_index].1.clone())) + } +} + +impl IntoIterator for AlgorithmResult +where + K: Clone + Hash + Eq + Ord, + V: Clone, + for<'a> &'a O: From<&'a V>, +{ + type Item = (K, V); + type IntoIter = std::collections::hash_map::IntoIter; + + fn into_iter(self) -> Self::IntoIter { + self.result.into_iter() + } +} + +impl<'a, K, V, O> IntoIterator for &'a AlgorithmResult +where + K: Clone + Hash + Ord, + V: Clone, +{ + type Item = (&'a K, &'a V); + type IntoIter = Iter<'a, K, V>; + + fn into_iter(self) -> Self::IntoIter { + self.iter() + } +} + +impl FromIterator<(K, V)> for AlgorithmResult { + fn from_iter>(iter: T) -> Self { + let result = iter.into_iter().collect(); + Self { + result, + marker: PhantomData, + } + } +} + +impl AlgorithmResult +where + K: Clone + Hash + Eq + Ord, + V: Clone, + O: Ord, + V: AsOrd, +{ + /// Sorts the `AlgorithmResult` by its values in ascending or descending order. 
+ /// + /// # Arguments + /// + /// * `reverse`: If `true`, sorts the result in descending order; otherwise, sorts in ascending order. + /// + /// # Returns + /// + /// A sorted vector of tuples containing keys of type `H` and values of type `Y`. + pub fn sort_by_value(&self, reverse: bool) -> Vec<(K, V)> { + self.sort_by(|a, b| O::cmp(a.as_ord(), b.as_ord()), reverse) + } + + /// Retrieves the top-k elements from the `AlgorithmResult` based on its values. + /// + /// # Arguments + /// + /// * `k`: The number of elements to retrieve. + /// * `percentage`: If `true`, the `k` parameter is treated as a percentage of total elements. + /// * `reverse`: If `true`, retrieves the elements in descending order; otherwise, in ascending order. + /// + /// # Returns + /// + /// An `a vector of tuples with keys of type `H` and values of type `Y`. + /// If `percentage` is `true`, the returned vector contains the top `k` percentage of elements. + /// If `percentage` is `false`, the returned vector contains the top `k` elements. + /// Returns empty vec if the result is empty or if `k` is 0. + pub fn top_k(&self, k: usize, percentage: bool, reverse: bool) -> Vec<(K, V)> { + self.top_k_by( + |a, b| O::cmp(a.as_ord(), b.as_ord()), + k, + percentage, + reverse, + ) + } + + pub fn min(&self) -> Option<(K, V)> { + self.min_by(|a, b| O::cmp(a.as_ord(), b.as_ord())) + } + + pub fn max(&self) -> Option<(K, V)> { + self.max_by(|a, b| O::cmp(a.as_ord(), b.as_ord())) + } + + pub fn median(&self) -> Option<(K, V)> { + self.median_by(|a, b| O::cmp(a.as_ord(), b.as_ord())) + } +} + +impl AlgorithmResult +where + K: Clone + Hash + Eq + Ord, + V: Clone + Hash + Eq, +{ + /// Groups the `AlgorithmResult` by its values. + /// + /// # Returns + /// + /// A `HashMap` where keys are unique values from the `AlgorithmResult` and values are vectors + /// containing keys of type `H` that share the same value. 
+ pub fn group_by(&self) -> HashMap> { + let mut grouped: HashMap> = HashMap::new(); + for (key, value) in &self.result { + grouped.entry(value.clone()).or_default().push(key.clone()); + } + grouped + } +} + +impl Debug for AlgorithmResult { + fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result { + let map_string = self + .result + .iter() + .map(|(key, value)| format!("{:?}: {:?}, ", key, value)) + .join(", "); + write!(f, "{{{}}}", map_string) + } +} + +/// Add tests for all functions +#[cfg(test)] +mod algorithm_result_test { + use crate::algorithms::algorithm_result::AlgorithmResult; + use ordered_float::OrderedFloat; + use std::collections::HashMap; + + fn create_algo_result_u64() -> AlgorithmResult { + let mut map: HashMap = HashMap::new(); + map.insert("A".to_string(), 10); + map.insert("B".to_string(), 20); + map.insert("C".to_string(), 30); + AlgorithmResult::new(map) + } + + fn group_by_test() -> AlgorithmResult { + let mut map: HashMap = HashMap::new(); + map.insert("A".to_string(), 10); + map.insert("B".to_string(), 20); + map.insert("C".to_string(), 30); + map.insert("D".to_string(), 10); + AlgorithmResult::new(map) + } + + fn create_algo_result_f64() -> AlgorithmResult> { + let mut map: HashMap = HashMap::new(); + map.insert("A".to_string(), 10.0); + map.insert("B".to_string(), 20.0); + map.insert("C".to_string(), 30.0); + AlgorithmResult::new(map) + } + + fn create_algo_result_tuple( + ) -> AlgorithmResult, OrderedFloat)> { + let mut map: HashMap = HashMap::new(); + map.insert("A".to_string(), (10.0, 20.0)); + map.insert("B".to_string(), (20.0, 30.0)); + map.insert("C".to_string(), (30.0, 40.0)); + AlgorithmResult::new(map) + } + + fn create_algo_result_hashmap_vec() -> AlgorithmResult> { + let mut map: HashMap> = HashMap::new(); + map.insert("A".to_string(), vec![(11, "H".to_string())]); + map.insert("B".to_string(), vec![]); + map.insert( + "C".to_string(), + vec![(22, "E".to_string()), (33, "F".to_string())], + ); + AlgorithmResult::new(map) 
+ } + + #[test] + fn test_min_max_value() { + let algo_result = create_algo_result_u64(); + assert_eq!(algo_result.min(), Some(("A".to_string(), 10u64))); + assert_eq!(algo_result.max(), Some(("C".to_string(), 30u64))); + assert_eq!(algo_result.median(), Some(("B".to_string(), 20u64))); + let algo_result = create_algo_result_f64(); + assert_eq!(algo_result.min(), Some(("A".to_string(), 10.0))); + assert_eq!(algo_result.max(), Some(("C".to_string(), 30.0))); + assert_eq!(algo_result.median(), Some(("B".to_string(), 20.0))); + } + + #[test] + fn test_get() { + let algo_result = create_algo_result_u64(); + assert_eq!(algo_result.get(&"C".to_string()), Some(&30)); + assert_eq!(algo_result.get(&"D".to_string()), None); + let algo_result = create_algo_result_f64(); + assert_eq!(algo_result.get(&"C".to_string()), Some(&30.0)); + let algo_result = create_algo_result_tuple(); + assert_eq!(algo_result.get(&"C".to_string()).unwrap().0, 30.0); + let algo_result = create_algo_result_hashmap_vec(); + assert_eq!(algo_result.get(&"C".to_string()).unwrap()[0].0, 22); + } + + #[test] + fn test_sort() { + let algo_result = create_algo_result_u64(); + let sorted = algo_result.sort_by_value(true); + assert_eq!(sorted[0].0, "C"); + let sorted = algo_result.sort_by_value(false); + assert_eq!(sorted[0].0, "A"); + + let algo_result = create_algo_result_f64(); + let sorted = algo_result.sort_by_value(true); + assert_eq!(sorted[0].0, "C"); + let sorted = algo_result.sort_by_value(false); + assert_eq!(sorted[0].0, "A"); + + let algo_result = create_algo_result_tuple(); + assert_eq!(algo_result.sort_by_value(true)[0].0, "C"); + + let algo_result = create_algo_result_hashmap_vec(); + assert_eq!(algo_result.sort_by_value(true)[0].0, "C"); + } + + #[test] + fn test_top_k() { + let algo_result = create_algo_result_u64(); + let top_k = algo_result.top_k(2, false, false); + assert_eq!(top_k[0].0, "A"); + let top_k = algo_result.top_k(2, false, true); + assert_eq!(top_k[0].0, "C"); + + let 
algo_result = create_algo_result_f64(); + let top_k = algo_result.top_k(2, false, false); + assert_eq!(top_k[0].0, "A"); + let top_k = algo_result.top_k(2, false, true); + assert_eq!(top_k[0].0, "C"); + + let algo_result = create_algo_result_tuple(); + assert_eq!(algo_result.top_k(2, false, false)[0].0, "A"); + + let algo_result = create_algo_result_hashmap_vec(); + assert_eq!(algo_result.top_k(2, false, false)[0].0, "B"); + } + + #[test] + fn test_group_by() { + let algo_result = group_by_test(); + let grouped = algo_result.group_by(); + assert_eq!(grouped.get(&10).unwrap().len(), 2); + assert!(grouped.get(&10).unwrap().contains(&"A".to_string())); + assert!(!grouped.get(&10).unwrap().contains(&"B".to_string())); + + let algo_result = create_algo_result_hashmap_vec(); + assert_eq!( + algo_result + .group_by() + .get(&vec![(11, "H".to_string())]) + .unwrap() + .len(), + 1 + ); + } + + #[test] + fn test_get_all() { + let algo_result = create_algo_result_u64(); + let all = algo_result.get_all(); + assert_eq!(all.len(), 3); + assert!(all.contains_key("A")); + + let algo_result = create_algo_result_f64(); + let all = algo_result.get_all(); + assert_eq!(all.len(), 3); + assert!(all.contains_key("A")); + + let algo_result = create_algo_result_tuple(); + assert_eq!(algo_result.get_all().get("A").unwrap().0, 10.0); + assert_eq!(algo_result.get_all().len(), 3); + + let algo_result = create_algo_result_hashmap_vec(); + assert_eq!(algo_result.get_all().get("A").unwrap()[0].0, 11); + assert_eq!(algo_result.get_all().len(), 3); + } + + #[test] + fn test_sort_by_key() { + let algo_result = create_algo_result_u64(); + let sorted = algo_result.sort_by_key(true); + let my_array: Vec<(String, u64)> = vec![ + ("C".to_string(), 30u64), + ("B".to_string(), 20u64), + ("A".to_string(), 10u64), + ]; + assert_eq!(my_array, sorted); + // + let algo_result = create_algo_result_f64(); + let sorted = algo_result.sort_by_key(true); + let my_array: Vec<(String, f64)> = vec![ + ("C".to_string(), 
30.0), + ("B".to_string(), 20.0), + ("A".to_string(), 10.0), + ]; + assert_eq!(my_array, sorted); + // + let algo_result = create_algo_result_tuple(); + let sorted = algo_result.sort_by_key(true); + let my_array: Vec<(String, (f32, f32))> = vec![ + ("C".to_string(), (30.0, 40.0)), + ("B".to_string(), (20.0, 30.0)), + ("A".to_string(), (10.0, 20.0)), + ]; + assert_eq!(my_array, sorted); + // + let algo_result = create_algo_result_hashmap_vec(); + let sorted = algo_result.sort_by_key(true); + let my_array: Vec<(String, Vec<(i64, String)>)> = vec![ + ( + "C".to_string(), + vec![(22, "E".to_string()), (33, "F".to_string())], + ), + ("B".to_string(), vec![]), + ("A".to_string(), vec![(11, "H".to_string())]), + ]; + assert_eq!(my_array, sorted); + } +} diff --git a/raphtory/src/algorithms/balance.rs b/raphtory/src/algorithms/balance.rs new file mode 100644 index 0000000000..f55ad66fe4 --- /dev/null +++ b/raphtory/src/algorithms/balance.rs @@ -0,0 +1,193 @@ +//! # Weight Accumulation +//! +//! This algorithm provides functionality to accumulate (or sum) weights on vertices +//! in a graph. +use crate::{ + algorithms::algorithm_result::AlgorithmResult, + core::{ + state::{ + accumulator_id::accumulators::sum, + compute_state::{ComputeState, ComputeStateVec}, + }, + Direction, + }, + db::{ + api::view::GraphViewOps, + task::{ + context::Context, + task::{ATask, Job, Step}, + task_runner::TaskRunner, + vertex::eval_vertex::EvalVertexView, + }, + }, + prelude::{EdgeListOps, PropUnwrap, VertexViewOps}, +}; +use ordered_float::OrderedFloat; + +/// Computes the net sum of weights for a given vertex based on edge direction. +/// +/// For every edge connected to the vertex, this function checks the source of the edge +/// against the vertex itself to determine the directionality. 
The weight can be treated +/// as negative or positive based on the edge's source and the specified direction: +/// +/// - If the edge's source is the vertex itself and the direction is either `OUT` or `BOTH`, +/// the weight is treated as negative. +/// - If the edge's source is not the vertex and the direction is either `IN` or `BOTH`, +/// the weight is treated as positive. +/// - In all other cases, the weight contribution is zero. +/// +/// # Parameters +/// - `v`: The vertex for which we want to compute the weight sum. +/// - `name`: The name of the property which holds the edge weight. +/// - `direction`: Specifies the direction of edges to consider (`IN`, `OUT`, or `BOTH`). +/// +/// # Returns +/// Returns a `f64` which is the net sum of weights for the vertex considering the specified direction. +fn balance_per_vertex( + v: &EvalVertexView, + name: &str, + direction: Direction, +) -> f64 { + // let in_result = v.in_edges().properties().get(name.clone()).sum(); + // in_result - out_result + match direction { + Direction::IN => v + .in_edges() + .properties() + .flat_map(|prop| { + prop.temporal().get(name).map(|val| { + val.values() + .into_iter() + .map(|valval| valval.into_f64().unwrap_or(0.0f64)) + .sum::() + }) + }) + .sum::(), + Direction::OUT => -v + .out_edges() + .properties() + .flat_map(|prop| { + prop.temporal().get(name).map(|val| { + val.values() + .into_iter() + .map(|valval| valval.into_f64().unwrap_or(0.0f64)) + .sum::() + }) + }) + .sum::(), + Direction::BOTH => { + let in_res = balance_per_vertex(v, name, Direction::IN); + let out_res = balance_per_vertex(v, name, Direction::OUT); + in_res + out_res + } + } +} + +/// Computes the sum of weights for all vertices in the graph. +/// +/// This function iterates over all vertices and calculates the net sum of weights. +/// Incoming edges have a positive sum and outgoing edges have a negative sum +/// It uses a compute context and tasks to achieve this. 
+/// +/// # Parameters +/// - `graph`: The graph on which the operation is to be performed. +/// - `name`: The name of the property which holds the edge weight. +/// - `threads`: An optional parameter to specify the number of threads to use. +/// If `None`, it defaults to a suitable number. +/// +/// # Returns +/// Returns an `AlgorithmResult` which maps each vertex to its corresponding net weight sum. +pub fn balance( + graph: &G, + name: String, + direction: Direction, + threads: Option, +) -> AlgorithmResult> { + let mut ctx: Context = graph.into(); + let min = sum(0); + ctx.agg(min); + let step1 = ATask::new(move |evv| { + let res = balance_per_vertex(evv, &name, direction); + evv.update(&min, res); + Step::Done + }); + let mut runner: TaskRunner = TaskRunner::new(ctx); + AlgorithmResult::new(runner.run( + vec![], + vec![Job::new(step1)], + None, + |_, ess, _, _| ess.finalize(&min, |min| min), + threads, + 1, + None, + None, + )) +} + +#[cfg(test)] +mod sum_weight_test { + use crate::{ + algorithms::balance::balance, + core::{Direction, Prop}, + db::{api::mutation::AdditionOps, graph::graph::Graph}, + }; + use pretty_assertions::assert_eq; + + #[test] + fn test_sum_float_weights() { + let graph = Graph::new(); + + let vs = vec![ + ("1", "2", 10.0, 1), + ("1", "4", 20.0, 2), + ("2", "3", 5.0, 3), + ("3", "2", 2.0, 4), + ("3", "1", 1.0, 5), + ("4", "3", 10.0, 6), + ("4", "1", 5.0, 7), + ("1", "5", 2.0, 8), + ]; + + for (src, dst, val, time) in &vs { + graph + .add_edge( + *time, + *src, + *dst, + [("value_dec".to_string(), Prop::F64(*val))], + None, + ) + .expect("Couldnt add edge"); + } + + let res = balance(&graph, "value_dec".to_string(), Direction::BOTH, None); + let expected = vec![ + ("1".to_string(), -26.0), + ("2".to_string(), 7.0), + ("3".to_string(), 12.0), + ("4".to_string(), 5.0), + ("5".to_string(), 2.0), + ]; + assert_eq!(res.sort_by_key(false), expected); + + let res = balance(&graph, "value_dec".to_string(), Direction::IN, None); + let expected = 
vec![ + ("1".to_string(), 6.0), + ("2".to_string(), 12.0), + ("3".to_string(), 15.0), + ("4".to_string(), 20.0), + ("5".to_string(), 2.0), + ]; + assert_eq!(res.sort_by_key(false), expected); + + let res = balance(&graph, "value_dec".to_string(), Direction::OUT, None); + let expected = vec![ + ("1".to_string(), -32.0), + ("2".to_string(), -5.0), + ("3".to_string(), -3.0), + ("4".to_string(), -15.0), + ("5".to_string(), 0.0), + ]; + assert_eq!(res.sort_by_key(false), expected); + } +} diff --git a/raphtory/src/algorithms/clustering_coefficient.rs b/raphtory/src/algorithms/clustering_coefficient.rs index d48a809ac1..af14872321 100644 --- a/raphtory/src/algorithms/clustering_coefficient.rs +++ b/raphtory/src/algorithms/clustering_coefficient.rs @@ -1,6 +1,7 @@ -use crate::algorithms::triangle_count::triangle_count; -use crate::algorithms::triplet_count::triplet_count; -use crate::db::view_api::GraphViewOps; +use crate::{ + algorithms::{triangle_count::triangle_count, triplet_count::triplet_count}, + db::api::view::GraphViewOps, +}; /// Computes the global clustering coefficient of a graph. The global clustering coefficient is /// defined as the number of triangles in the graph divided by the number of triplets in the graph. 
@@ -16,10 +17,9 @@ use crate::db::view_api::GraphViewOps; /// # Example /// /// ```rust -/// use raphtory::db::graph::Graph; +/// use raphtory::prelude::*; /// use raphtory::algorithms::clustering_coefficient::clustering_coefficient; -/// use raphtory::db::view_api::*; -/// let graph = Graph::new(2); +/// let graph = Graph::new(); /// let edges = vec![ /// (1, 2), /// (1, 3), @@ -29,7 +29,7 @@ use crate::db::view_api::GraphViewOps; /// (2, 7), /// ]; /// for (src, dst) in edges { -/// graph.add_edge(0, src, dst, &vec![], None).expect("Unable to add edge"); +/// graph.add_edge(0, src, dst, NO_PROPS, None).expect("Unable to add edge"); /// } /// let results = clustering_coefficient(&graph.at(1)); /// println!("global_clustering_coefficient: {}", results); @@ -49,14 +49,19 @@ pub fn clustering_coefficient(g: &G) -> f64 { #[cfg(test)] mod cc_test { use super::*; - use crate::db::graph::Graph; - use crate::db::view_api::*; + use crate::{ + db::{ + api::{mutation::AdditionOps, view::*}, + graph::graph::Graph, + }, + prelude::NO_PROPS, + }; use pretty_assertions::assert_eq; /// Test the global clustering coefficient #[test] fn test_global_cc() { - let graph = Graph::new(1); + let graph = Graph::new(); // Graph has 2 triangles and 20 triplets let edges = vec![ @@ -83,7 +88,7 @@ mod cc_test { ]; for (src, dst) in edges { - graph.add_edge(0, src, dst, &vec![], None).unwrap(); + graph.add_edge(0, src, dst, NO_PROPS, None).unwrap(); } let graph_at = graph.at(1); diff --git a/raphtory/src/algorithms/connected_components.rs b/raphtory/src/algorithms/connected_components.rs index 527b1841ec..a5bb674f96 100644 --- a/raphtory/src/algorithms/connected_components.rs +++ b/raphtory/src/algorithms/connected_components.rs @@ -1,32 +1,26 @@ -use std::cmp; -use crate::db::view_api::VertexViewOps; +use super::algorithm_result::AlgorithmResult; use crate::{ - core::state::{accumulator_id::accumulators, compute_state::ComputeStateVec}, + core::{ + entities::{vertices::vertex_ref::VertexRef, 
VID}, + state::compute_state::ComputeStateVec, + }, db::{ + api::view::{GraphViewOps, VertexViewOps}, task::{ context::Context, task::{ATask, Job, Step}, task_runner::TaskRunner, + vertex::eval_vertex::EvalVertexView, }, - view_api::GraphViewOps, }, }; -use std::collections::HashMap; -use crate::db::task::eval_vertex::EvalVertexView; +use std::{cmp, collections::HashMap}; -#[derive(Clone, Debug)] +#[derive(Clone, Debug, Default)] struct WccState { component: u64, } -impl WccState { - fn new() -> Self { - Self { - component: 0, - } - } -} - /// Computes the connected components of a graph using the Simple Connected Components algorithm /// /// # Arguments @@ -37,17 +31,17 @@ impl WccState { /// /// # Returns /// -/// A hash map containing the mapping from component ID to the number of vertices in the component +/// An AlgorithmResult containing the mapping from component ID to the number of vertices in the component /// pub fn weakly_connected_components( graph: &G, iter_count: usize, threads: Option, -) -> HashMap +) -> AlgorithmResult where G: GraphViewOps, { - let mut ctx: Context = graph.into(); + let ctx: Context = graph.into(); let step1 = ATask::new(move |vv| { let min_neighbour_id = vv.neighbours().id().min(); @@ -57,31 +51,42 @@ where Step::Continue }); - let step2 = ATask::new(move |vv: &mut EvalVertexView<'_, G,ComputeStateVec, WccState>| { - let prev:u64 = vv.prev().component; - let current = vv.neighbours().into_iter().map(|n|n.prev().component).min().unwrap_or(prev); - let state: &mut WccState = vv.get_mut(); - if current| { + let prev: u64 = vv.prev().component; + let current = vv + .neighbours() + .into_iter() + .map(|n| n.prev().component) + .min() + .unwrap_or(prev); + let state: &mut WccState = vv.get_mut(); + if current < prev { + state.component = current; + Step::Continue + } else { + Step::Done + } + }, + ); let mut runner: TaskRunner = TaskRunner::new(ctx); - runner.run( + let res = runner.run( vec![Job::new(step1)], 
vec![Job::read_only(step2)], - WccState::new(), - |g, _, _, local| { + None, + |_, _, _, local| { + let layers = graph.layer_ids(); + let edge_filter = graph.edge_filter(); local .iter() - .filter_map(|line| { - line.as_ref() - .map(|(v_ref, state)| (v_ref.clone(), state.component)) + .enumerate() + .filter_map(|(v_ref, state)| { + let v_ref = VID(v_ref); + graph + .has_vertex_ref(VertexRef::Internal(v_ref), &layers, edge_filter) + .then_some((graph.vertex_name(v_ref), state.component)) }) .collect::>() }, @@ -89,22 +94,22 @@ where iter_count, None, None, - ).into_iter() - .map(|(k, v)| (graph.vertex_name(k), v)) - .collect() + ); + AlgorithmResult::new(res) } #[cfg(test)] mod cc_test { - use crate::db::graph::Graph; + use crate::prelude::*; use super::*; + use crate::db::api::mutation::AdditionOps; use itertools::*; use std::{cmp::Reverse, iter::once}; #[test] fn run_loop_simple_connected_components() { - let graph = Graph::new(2); + let graph = Graph::new(); let edges = vec![ (1, 2, 1), @@ -117,12 +122,12 @@ mod cc_test { ]; for (src, dst, ts) in edges { - graph.add_edge(ts, src, dst, &vec![], None).unwrap(); + graph.add_edge(ts, src, dst, NO_PROPS, None).unwrap(); } - let results: HashMap = weakly_connected_components(&graph, usize::MAX, None); - + let results: AlgorithmResult = + weakly_connected_components(&graph, usize::MAX, None); assert_eq!( - results, + *results.get_all(), vec![ ("1".to_string(), 1), ("2".to_string(), 1), @@ -140,7 +145,7 @@ mod cc_test { #[test] fn simple_connected_components_2() { - let graph = Graph::new(2); + let graph = Graph::new(); let edges = vec![ (1, 2, 1), @@ -169,13 +174,14 @@ mod cc_test { ]; for (src, dst, ts) in edges { - graph.add_edge(ts, src, dst, &vec![], None).unwrap(); + graph.add_edge(ts, src, dst, NO_PROPS, None).unwrap(); } - let results: HashMap = weakly_connected_components(&graph, usize::MAX, None); + let results: AlgorithmResult = + weakly_connected_components(&graph, usize::MAX, None); assert_eq!( - results, + 
*results.get_all(), vec![ ("1".to_string(), 1), ("2".to_string(), 1), @@ -197,24 +203,58 @@ mod cc_test { // connected components on a graph with 1 node and a self loop #[test] fn simple_connected_components_3() { - let graph = Graph::new(2); + let graph = Graph::new(); let edges = vec![(1, 1, 1)]; for (src, dst, ts) in edges { - graph.add_edge(ts, src, dst, &vec![], None).unwrap(); + graph.add_edge(ts, src, dst, NO_PROPS, None).unwrap(); } - let results: HashMap = weakly_connected_components(&graph, usize::MAX, None); + let results: AlgorithmResult = + weakly_connected_components(&graph, usize::MAX, None); assert_eq!( - results, - vec![("1".to_string(), 1),] + *results.get_all(), + vec![("1".to_string(), 1)] .into_iter() .collect::>() ); } + #[test] + fn windowed_connected_components() { + let graph = Graph::new(); + graph.add_edge(0, 1, 2, NO_PROPS, None).expect("add edge"); + graph.add_edge(0, 2, 1, NO_PROPS, None).expect("add edge"); + graph.add_edge(9, 3, 4, NO_PROPS, None).expect("add edge"); + graph.add_edge(9, 4, 3, NO_PROPS, None).expect("add edge"); + + let results: AlgorithmResult = + weakly_connected_components(&graph, usize::MAX, None); + let expected = vec![ + ("1".to_string(), 1), + ("2".to_string(), 1), + ("3".to_string(), 3), + ("4".to_string(), 3), + ] + .into_iter() + .collect::>(); + + assert_eq!(*results.get_all(), expected); + + let wg = graph.window(0, 2); + let results: AlgorithmResult = + weakly_connected_components(&wg, usize::MAX, None); + + let expected = vec![("1", 1), ("2", 1)] + .into_iter() + .map(|(k, v)| (k.to_string(), v)) + .collect::>(); + + assert_eq!(*results.get_all(), expected); + } + #[quickcheck] fn circle_graph_the_smallest_value_is_the_cc(vs: Vec) { if !vs.is_empty() { @@ -233,18 +273,19 @@ mod cc_test { assert_eq!(edges[0].0, first); assert_eq!(edges.last().unwrap().1, first); - let graph = Graph::new(2); + let graph = Graph::new(); for (src, dst) in edges.iter() { - graph.add_edge(0, *src, *dst, &vec![], 
None).unwrap(); + graph.add_edge(0, *src, *dst, NO_PROPS, None).unwrap(); } // now we do connected components over window 0..1 - let components: HashMap = + let res: AlgorithmResult = weakly_connected_components(&graph, usize::MAX, None); - let actual = components + let actual = res + .get_all() .iter() .group_by(|(_, cc)| *cc) .into_iter() diff --git a/raphtory/src/algorithms/degree.rs b/raphtory/src/algorithms/degree.rs index 5b90aed4a5..ce0192cda1 100644 --- a/raphtory/src/algorithms/degree.rs +++ b/raphtory/src/algorithms/degree.rs @@ -17,10 +17,9 @@ //! //! ```rust //! use raphtory::algorithms::degree::{max_out_degree, max_in_degree, min_out_degree, min_in_degree, average_degree}; -//! use raphtory::db::graph::Graph; -//! use raphtory::db::view_api::*; +//! use raphtory::prelude::*; //! -//! let g = Graph::new(1); +//! let g = Graph::new(); //! let windowed_graph = g.window(0, 7); //! let vs = vec![ //! (1, 1, 2), @@ -32,7 +31,7 @@ //! ]; //! //! for (t, src, dst) in &vs { -//! g.add_edge(*t, *src, *dst, &vec![], None); +//! g.add_edge(*t, *src, *dst, NO_PROPS, None); //! } //! //! print!("Max out degree: {:?}", max_out_degree(&windowed_graph)); @@ -42,7 +41,7 @@ //! print!("Average degree: {:?}", average_degree(&windowed_graph)); //! ``` //! -use crate::db::view_api::*; +use crate::db::api::view::*; /// The maximum out degree of any vertex in the graph. 
pub fn max_out_degree(graph: &G) -> usize { @@ -104,14 +103,15 @@ pub fn average_degree(graph: &G) -> f64 { mod degree_test { use crate::{ algorithms::degree::{average_degree, max_in_degree, min_in_degree, min_out_degree}, - db::graph::Graph, + db::{api::mutation::AdditionOps, graph::graph::Graph}, + prelude::NO_PROPS, }; use super::max_out_degree; #[test] fn degree_test() { - let g = Graph::new(1); + let g = Graph::new(); let vs = vec![ (1, 1, 2), (2, 1, 3), @@ -122,7 +122,7 @@ mod degree_test { ]; for (t, src, dst) in &vs { - g.add_edge(*t, *src, *dst, &vec![], None).unwrap(); + g.add_edge(*t, *src, *dst, NO_PROPS, None).unwrap(); } let expected_max_out_degree = 3; diff --git a/raphtory/src/algorithms/directed_graph_density.rs b/raphtory/src/algorithms/directed_graph_density.rs index b292c6af5f..888336a856 100644 --- a/raphtory/src/algorithms/directed_graph_density.rs +++ b/raphtory/src/algorithms/directed_graph_density.rs @@ -11,10 +11,9 @@ //! //! ```rust //! use raphtory::algorithms::directed_graph_density::directed_graph_density; -//! use raphtory::db::graph::Graph; -//! use raphtory::db::view_api::*; +//! use raphtory::prelude::*; //! -//! let g = Graph::new(1); +//! let g = Graph::new(); //! let windowed_graph = g.window(0, 7); //! let vs = vec![ //! (1, 1, 2), @@ -26,27 +25,31 @@ //! ]; //! //! for (t, src, dst) in &vs { -//! g.add_edge(*t, *src, *dst, &vec![], None); +//! g.add_edge(*t, *src, *dst, NO_PROPS, None); //! } //! //! println!("graph density: {:?}", directed_graph_density(&windowed_graph)); //! ``` //! 
-use crate::db::view_api::*; +use crate::db::api::view::*; /// Measures how dense or sparse a graph is pub fn directed_graph_density(graph: &G) -> f32 { - graph.num_edges() as f32 / (graph.num_vertices() as f32 * (graph.num_vertices() as f32 - 1.0)) + graph.count_edges() as f32 + / (graph.count_vertices() as f32 * (graph.count_vertices() as f32 - 1.0)) } #[cfg(test)] mod directed_graph_density_tests { use super::*; - use crate::db::graph::Graph; + use crate::{ + db::{api::mutation::AdditionOps, graph::graph::Graph}, + prelude::NO_PROPS, + }; #[test] fn low_graph_density() { - let g = Graph::new(1); + let g = Graph::new(); let windowed_graph = g.window(0, 7); let vs = vec![ (1, 1, 2), @@ -58,7 +61,7 @@ mod directed_graph_density_tests { ]; for (t, src, dst) in &vs { - g.add_edge(*t, *src, *dst, &vec![], None).unwrap(); + g.add_edge(*t, *src, *dst, NO_PROPS, None).unwrap(); } let actual = directed_graph_density(&windowed_graph); @@ -69,12 +72,12 @@ mod directed_graph_density_tests { #[test] fn complete_graph_has_graph_density_of_one() { - let g = Graph::new(1); + let g = Graph::new(); let windowed_graph = g.window(0, 3); let vs = vec![(1, 1, 2), (2, 2, 1)]; for (t, src, dst) in &vs { - g.add_edge(*t, *src, *dst, &vec![], None).unwrap(); + g.add_edge(*t, *src, *dst, NO_PROPS, None).unwrap(); } let actual = directed_graph_density(&windowed_graph); diff --git a/raphtory/src/algorithms/hits.rs b/raphtory/src/algorithms/hits.rs index a1d6cb6f98..81cd1c7952 100644 --- a/raphtory/src/algorithms/hits.rs +++ b/raphtory/src/algorithms/hits.rs @@ -1,20 +1,25 @@ -use crate::core::state::accumulator_id::accumulators::{max, sum}; -use crate::db::task::eval_vertex::EvalVertexView; use crate::{ - core::state::compute_state::ComputeStateVec, + algorithms::algorithm_result::AlgorithmResult, + core::{ + entities::vertices::vertex_ref::VertexRef, + state::{ + accumulator_id::accumulators::{max, sum}, + compute_state::ComputeStateVec, + }, + }, db::{ + api::view::{GraphViewOps, 
VertexViewOps}, task::{ context::Context, task::{ATask, Job, Step}, task_runner::TaskRunner, + vertex::eval_vertex::EvalVertexView, }, - view_api::{GraphViewOps, VertexViewOps}, }, }; use num_traits::abs; -use rustc_hash::FxHashMap; +use ordered_float::OrderedFloat; use std::collections::HashMap; -use std::ops::Range; #[derive(Debug, Clone)] struct Hits { @@ -22,20 +27,31 @@ struct Hits { auth_score: f32, } -// HITS (Hubs and Authority) Algorithm: -// AuthScore of a vertex (A) = Sum of HubScore of all vertices pointing at vertex (A) from previous iteration / -// Sum of HubScore of all vertices in the current iteration -// -// HubScore of a vertex (A) = Sum of AuthScore of all vertices pointing away from vertex (A) from previous iteration / -// Sum of AuthScore of all vertices in the current iteration +impl Default for Hits { + fn default() -> Self { + Self { + hub_score: 1f32, + auth_score: 1f32, + } + } +} +/// HITS (Hubs and Authority) Algorithm: +/// AuthScore of a vertex (A) = Sum of HubScore of all vertices pointing at vertex (A) from previous iteration / +/// Sum of HubScore of all vertices in the current iteration +/// +/// HubScore of a vertex (A) = Sum of AuthScore of all vertices pointing away from vertex (A) from previous iteration / +/// Sum of AuthScore of all vertices in the current iteration +/// +/// Returns +/// +/// * An AlgorithmResult object containing the mapping from vertex ID to the hub and authority score of the vertex #[allow(unused_variables)] pub fn hits( g: &G, - window: Range, iter_count: usize, threads: Option, -) -> FxHashMap { +) -> AlgorithmResult, OrderedFloat)> { let mut ctx: Context = g.into(); let recv_hub_score = sum::(2); @@ -96,8 +112,8 @@ pub fn hits( let md_hub_score = abs(prev_hub_score - curr_hub_score); evv.global_update(&max_diff_hub_score, md_hub_score); - let prev_auth_score = evv.prev().auth_score; - let curr_auth_score = evv.get().auth_score; + let prev_auth_score = evv.prev().auth_score; + let curr_auth_score = 
evv.get().auth_score; let md_auth_score = abs(prev_auth_score - curr_auth_score); evv.global_update(&max_diff_auth_score, md_auth_score); @@ -122,16 +138,15 @@ pub fn hits( let (hub_scores, auth_scores) = runner.run( vec![], vec![Job::new(step2), Job::new(step3), Job::new(step4), step5], - Hits { - hub_score: 1f32, - auth_score: 1f32, - }, + None, |_, _, els, local| { let mut hubs = HashMap::new(); let mut auths = HashMap::new(); - for line in local.iter() { - if let Some((v_ref, hit)) = line { - let v_gid = g.vertex_name(v_ref.clone()); + let layers = g.layer_ids(); + let edge_filter = g.edge_filter(); + for (v_ref, hit) in local.iter().enumerate() { + if g.has_vertex_ref(VertexRef::Internal(v_ref.into()), &layers, edge_filter) { + let v_gid = g.vertex_name(v_ref.into()); hubs.insert(v_gid.clone(), hit.hub_score); auths.insert(v_gid, hit.auth_score); } @@ -144,7 +159,7 @@ pub fn hits( None, ); - let mut results: FxHashMap = FxHashMap::default(); + let mut results: HashMap = HashMap::new(); hub_scores.into_iter().for_each(|(k, v)| { results.insert(k, (v, 0.0)); @@ -155,52 +170,47 @@ pub fn hits( results.insert(k, (*a, v)); }); - results + AlgorithmResult::new(results) } #[cfg(test)] mod hits_tests { use super::*; - use crate::db::graph::Graph; - use itertools::Itertools; + use crate::{ + db::{api::mutation::AdditionOps, graph::graph::Graph}, + prelude::NO_PROPS, + }; - fn load_graph(n_shards: usize, edges: Vec<(u64, u64)>) -> Graph { - let graph = Graph::new(n_shards); + fn load_graph(edges: Vec<(u64, u64)>) -> Graph { + let graph = Graph::new(); for (src, dst) in edges { - graph.add_edge(0, src, dst, &vec![], None).unwrap(); + graph.add_edge(0, src, dst, NO_PROPS, None).unwrap(); } graph } - fn test_hits(n_shards: usize) { - let graph = load_graph( - n_shards, - vec![ - (1, 4), - (2, 3), - (2, 5), - (3, 1), - (4, 2), - (4, 3), - (5, 2), - (5, 3), - (5, 4), - (5, 6), - (6, 3), - (6, 8), - (7, 1), - (7, 3), - (8, 1), - ], - ); - - let window = 0..10; - - let mut 
results: Vec<(String, (f32, f32))> = - hits(&graph, window, 20, None).into_iter().collect_vec(); - - results.sort_by_key(|k| (*k).0.clone()); + #[test] + fn test_hits() { + let graph = load_graph(vec![ + (1, 4), + (2, 3), + (2, 5), + (3, 1), + (4, 2), + (4, 3), + (5, 2), + (5, 3), + (5, 4), + (5, 6), + (6, 3), + (6, 8), + (7, 1), + (7, 3), + (8, 1), + ]); + + let results = hits(&graph, 20, None); // NetworkX results // >>> G = nx.DiGraph() @@ -232,7 +242,7 @@ mod hits_tests { // ) assert_eq!( - results, + results.sort_by_key(false), vec![ ("1".to_string(), (0.0431365, 0.096625775)), ("2".to_string(), (0.14359662, 0.18366566)), @@ -245,9 +255,4 @@ mod hits_tests { ] ); } - - #[test] - fn test_hits_11() { - test_hits(1); - } } diff --git a/raphtory/src/algorithms/k_core.rs b/raphtory/src/algorithms/k_core.rs new file mode 100644 index 0000000000..b8f3e0e2c4 --- /dev/null +++ b/raphtory/src/algorithms/k_core.rs @@ -0,0 +1,174 @@ +use crate::{ + core::{ + entities::{vertices::vertex_ref::VertexRef, VID}, + state::compute_state::ComputeStateVec, + }, + db::{ + api::view::{GraphViewOps, VertexViewOps}, + graph::views::vertex_subgraph::VertexSubgraph, + task::{ + context::Context, + task::{ATask, Job, Step}, + task_runner::TaskRunner, + vertex::eval_vertex::EvalVertexView, + }, + }, +}; +use std::collections::HashSet; + +#[derive(Clone, Debug)] +struct KCoreState { + alive: bool, +} + +impl Default for KCoreState { + fn default() -> Self { + Self { alive: true } + } +} + +/// Determines which nodes are in the k-core for a given value of k +/// +/// # Arguments +/// +/// * `g` - A reference to the graph +/// * `k` - Value of k such that the returned vertices have degree > k (recursively) +/// * `iter_count` - The number of iterations to run +/// * `threads` - number of threads to run on +/// +/// # Returns +/// +/// A hash set of vertices in the k core +/// +pub fn k_core_set(graph: &G, k: usize, iter_count: usize, threads: Option) -> HashSet +where + G: GraphViewOps, +{ + 
let ctx: Context = graph.into(); + + let step1 = ATask::new(move |vv| { + let deg = vv.degree(); + let state: &mut KCoreState = vv.get_mut(); + state.alive = deg >= k; + Step::Continue + }); + + let step2 = ATask::new( + move |vv: &mut EvalVertexView<'_, G, ComputeStateVec, KCoreState>| { + let prev: bool = vv.prev().alive; + if prev == true { + let current = vv + .neighbours() + .into_iter() + .filter(|n| n.prev().alive) + .count() + >= k; + let state: &mut KCoreState = vv.get_mut(); + if current != prev { + state.alive = current; + Step::Continue + } else { + Step::Done + } + } else { + Step::Done + } + }, + ); + + let mut runner: TaskRunner = TaskRunner::new(ctx); + + runner.run( + vec![Job::new(step1)], + vec![Job::read_only(step2)], + None, + |_, _, _, local| { + let layers = graph.layer_ids(); + let edge_filter = graph.edge_filter(); + local + .iter() + .enumerate() + .filter(|(v_ref, state)| { + state.alive + && graph.has_vertex_ref( + VertexRef::Internal((*v_ref).into()), + &layers, + edge_filter, + ) + }) + .map(|(v_ref, _)| v_ref.into()) + .collect::>() + }, + threads, + iter_count, + None, + None, + ) +} + +pub fn k_core( + graph: &G, + k: usize, + iter_count: usize, + threads: Option, +) -> VertexSubgraph +where + G: GraphViewOps, +{ + let v_set = k_core_set(graph, k, iter_count, threads); + graph.subgraph(v_set) +} + +#[cfg(test)] +mod k_core_test { + use std::collections::HashSet; + + use crate::{algorithms::k_core::k_core_set, prelude::*}; + + #[test] + fn k_core_2() { + let graph = Graph::new(); + + let edges = vec![ + (1, 2, 1), + (1, 3, 2), + (1, 4, 3), + (3, 1, 4), + (3, 4, 5), + (3, 5, 6), + (4, 5, 7), + (5, 6, 8), + (5, 8, 9), + (7, 5, 10), + (8, 5, 11), + (1, 9, 12), + (9, 1, 13), + (6, 3, 14), + (4, 8, 15), + (8, 3, 16), + (5, 10, 17), + (10, 5, 18), + (10, 8, 19), + (1, 11, 20), + (11, 1, 21), + (9, 11, 22), + (11, 9, 23), + ]; + + for (src, dst, ts) in edges { + graph.add_edge(ts, src, dst, NO_PROPS, None).unwrap(); + } + + let result = 
k_core_set(&graph, 2, usize::MAX, None); + let subgraph = graph.subgraph(result.clone()); + let actual = vec!["1", "3", "4", "5", "6", "8", "9", "10", "11"] + .into_iter() + .map(|k| k.to_string()) + .collect::>(); + + assert_eq!( + actual, + subgraph.vertices().name().collect::>() + ); + } +} diff --git a/raphtory/src/algorithms/local_clustering_coefficient.rs b/raphtory/src/algorithms/local_clustering_coefficient.rs index 79b268d123..becc916fac 100644 --- a/raphtory/src/algorithms/local_clustering_coefficient.rs +++ b/raphtory/src/algorithms/local_clustering_coefficient.rs @@ -24,10 +24,9 @@ //! //! ```rust //! use raphtory::algorithms::local_clustering_coefficient::{local_clustering_coefficient}; -//! use raphtory::db::graph::Graph; -//! use raphtory::db::view_api::*; +//! use raphtory::prelude::*; //! -//! let g = Graph::new(1); +//! let g = Graph::new(); //! let windowed_graph = g.window(0, 7); //! let vs = vec![ //! (1, 1, 2), @@ -39,7 +38,7 @@ //! ]; //! //! for (t, src, dst) in &vs { -//! g.add_edge(*t, *src, *dst, &vec![], None); +//! g.add_edge(*t, *src, *dst, NO_PROPS, None); //! } //! //! let actual = (1..=5) @@ -49,9 +48,10 @@ //! println!("local clustering coefficient of all nodes: {:?}", actual); //! 
``` -use crate::algorithms::local_triangle_count::local_triangle_count; -use crate::core::vertex_ref::VertexRef; -use crate::db::view_api::*; +use crate::{ + algorithms::local_triangle_count::local_triangle_count, + core::entities::vertices::vertex_ref::VertexRef, db::api::view::*, +}; /// measures the degree to which nodes in a graph tend to cluster together pub fn local_clustering_coefficient>( @@ -79,12 +79,17 @@ pub fn local_clustering_coefficient>( #[cfg(test)] mod clustering_coefficient_tests { use super::local_clustering_coefficient; - use crate::db::graph::Graph; - use crate::db::view_api::*; + use crate::{ + db::{ + api::{mutation::AdditionOps, view::*}, + graph::graph::Graph, + }, + prelude::NO_PROPS, + }; #[test] fn clusters_of_triangles() { - let g = Graph::new(1); + let g = Graph::new(); let windowed_graph = g.window(0, 7); let vs = vec![ (1, 1, 2), @@ -96,7 +101,7 @@ mod clustering_coefficient_tests { ]; for (t, src, dst) in &vs { - g.add_edge(*t, *src, *dst, &vec![], None).unwrap(); + g.add_edge(*t, *src, *dst, NO_PROPS, None).unwrap(); } let expected = vec![0.33333334, 1.0, 1.0, 0.0, 0.0]; diff --git a/raphtory/src/algorithms/local_triangle_count.rs b/raphtory/src/algorithms/local_triangle_count.rs index 8286e1ab0a..1b40dff856 100644 --- a/raphtory/src/algorithms/local_triangle_count.rs +++ b/raphtory/src/algorithms/local_triangle_count.rs @@ -18,14 +18,13 @@ //! //! ```rust //! use raphtory::algorithms::local_triangle_count::{local_triangle_count}; -//! use raphtory::db::graph::Graph; -//! use raphtory::db::view_api::*; +//! use raphtory::prelude::*; //! -//! let g = Graph::new(1); +//! let g = Graph::new(); //! let vs = vec![(1, 1, 2), (2, 1, 3), (3, 2, 1), (4, 3, 2)]; //! //! for (t, src, dst) in &vs { -//! g.add_edge(*t, *src, *dst, &vec![], None); +//! g.add_edge(*t, *src, *dst, NO_PROPS, None); //! } //! //! let windowed_graph = g.window(0, 5); @@ -38,28 +37,27 @@ //! println!("local_triangle_count: {:?}", result); //! ``` //! 
-use crate::core::vertex_ref::VertexRef; -use crate::db::view_api::*; +use crate::{core::entities::vertices::vertex_ref::VertexRef, db::api::view::*}; use itertools::Itertools; /// calculates the number of triangles (a cycle of length 3) for a node. pub fn local_triangle_count>(graph: &G, v: V) -> Option { if let Some(vertex) = graph.vertex(v) { if vertex.degree() >= 2 { - let x: Vec = vertex + let len = vertex .neighbours() .id() .into_iter() .combinations(2) - .filter_map(|nb| match graph.has_edge(nb[0], nb[1], None) { + .filter_map(|nb| match graph.has_edge(nb[0], nb[1], Layer::All) { true => Some(1), - false => match graph.has_edge(nb[1], nb[0], None) { + false => match graph.has_edge(nb[1], nb[0], Layer::All) { true => Some(1), false => None, }, }) - .collect(); - Some(x.len()) + .count(); + Some(len) } else { Some(0) } @@ -72,16 +70,21 @@ pub fn local_triangle_count>(graph: &G, v: V mod triangle_count_tests { use super::local_triangle_count; - use crate::db::graph::Graph; - use crate::db::view_api::*; + use crate::{ + db::{ + api::{mutation::AdditionOps, view::*}, + graph::graph::Graph, + }, + prelude::NO_PROPS, + }; #[test] fn counts_triangles() { - let g = Graph::new(1); + let g = Graph::new(); let vs = vec![(1, 1, 2), (2, 1, 3), (3, 2, 1), (4, 3, 2)]; for (t, src, dst) in &vs { - g.add_edge(*t, *src, *dst, &vec![], None).unwrap(); + g.add_edge(*t, *src, *dst, NO_PROPS, None).unwrap(); } let windowed_graph = g.window(0, 5); diff --git a/raphtory/src/algorithms/mod.rs b/raphtory/src/algorithms/mod.rs index ff7ca93079..4b54f5dc4a 100644 --- a/raphtory/src/algorithms/mod.rs +++ b/raphtory/src/algorithms/mod.rs @@ -8,9 +8,9 @@ //! //! ```rust //! use raphtory::algorithms::degree::{average_degree}; -//! use raphtory::db::graph::Graph; +//! use raphtory::prelude::*; //! -//! let g = Graph::new(1); +//! let g = Graph::new(); //! let vs = vec![ //! (1, 1, 2), //! (2, 1, 3), @@ -21,21 +21,24 @@ //! ]; //! //! for (t, src, dst) in &vs { -//! 
g.add_edge(*t, *src, *dst, &vec![], None); +//! g.add_edge(*t, *src, *dst, NO_PROPS, None); //! }; //! println!("average_degree: {:?}", average_degree(&g)); //! ``` +pub mod algorithm_result; +pub mod balance; pub mod clustering_coefficient; pub mod connected_components; pub mod degree; pub mod directed_graph_density; -pub mod generic_taint; pub mod hits; +pub mod k_core; pub mod local_clustering_coefficient; pub mod local_triangle_count; pub mod motifs; pub mod pagerank; pub mod reciprocity; +pub mod temporal_reachability; pub mod triangle_count; pub mod triplet_count; diff --git a/raphtory/src/algorithms/motifs/mod.rs b/raphtory/src/algorithms/motifs/mod.rs index 7180cd10ef..73bd75ec28 100644 --- a/raphtory/src/algorithms/motifs/mod.rs +++ b/raphtory/src/algorithms/motifs/mod.rs @@ -1,2 +1,3 @@ -pub mod three_node_local; +pub mod three_node_local_single_thread; pub mod three_node_motifs; +pub mod three_node_temporal_motifs; diff --git a/raphtory/src/algorithms/motifs/three_node_local.rs b/raphtory/src/algorithms/motifs/three_node_local.rs deleted file mode 100644 index 3ef5aa4868..0000000000 --- a/raphtory/src/algorithms/motifs/three_node_local.rs +++ /dev/null @@ -1,523 +0,0 @@ -use std::collections::HashMap; -use std::slice::Iter; - -use crate::core::agg::ValDef; -use crate::core::state::accumulator_id::AccId; -use crate::db::view_api::*; - -use crate::algorithms::motifs::three_node_motifs::*; -use crate::core::state::accumulator_id::accumulators::val; -use crate::core::state::compute_state::ComputeStateVec; -use crate::db::task::context::Context; -use crate::db::task::eval_vertex::EvalVertexView; -use crate::db::task::task::{ATask, Job, Step}; -use crate::db::task::task_runner::TaskRunner; -use crate::db::view_api::{GraphViewOps, VertexViewOps}; -use num_traits::Zero; -use std::ops::Add; - -pub fn star_motif_count( - evv: &EvalVertexView, - delta: i64, -) -> [usize; 24] { - let neigh_map: HashMap = evv - .neighbours() - .into_iter() - .enumerate() - 
.map(|(num, nb)| (nb.id(), num)) - .into_iter() - .collect(); - let mut exploded_edges = evv - .edges() - .explode() - .map(|edge| { - if edge.src().id() == evv.id() { - star_event(neigh_map[&edge.dst().id()], 1, edge.time().unwrap()) - } else { - star_event(neigh_map[&edge.src().id()], 0, edge.time().unwrap()) - } - }) - .collect::>(); - exploded_edges.sort_by_key(|e| e.time); - let mut star_count = init_star_count(neigh_map.len()); - star_count.execute(&exploded_edges, delta); - star_count.return_counts() -} - -pub fn twonode_motif_count( - graph: &G, - evv: &EvalVertexView, - delta: i64, -) -> [usize; 8] { - let mut counts = [0; 8]; - for nb in evv.neighbours().into_iter() { - let nb_id = nb.id(); - let out = graph.edge(evv.id(), nb_id, None); - let inc = graph.edge(nb_id, evv.id(), None); - let mut all_exploded = match (out, inc) { - (Some(o), Some(i)) => o - .explode() - .chain(i.explode()) - .map(|e| { - two_node_event( - if e.src().id() == evv.id() { 1 } else { 0 }, - e.time().unwrap(), - ) - }) - .collect::>(), - (Some(o), None) => o - .explode() - .map(|e| two_node_event(1, e.time().unwrap())) - .collect::>(), - (None, Some(i)) => i - .explode() - .map(|e| two_node_event(0, e.time().unwrap())) - .collect::>(), - (None, None) => Vec::new(), - }; - all_exploded.sort_by_key(|e| e.time); - let mut two_node_counter = init_two_node_count(); - two_node_counter.execute(&all_exploded, delta); - let two_node_result = two_node_counter.return_counts(); - for i in 0..8 { - counts[i] += two_node_result[i]; - } - } - counts -} - -pub fn triangle_motif_count( - graph: &G, - evv: &EvalVertexView, - delta: i64, - motif_counter: AccId>, -) { - let u: u64 = evv.id(); - for v in evv.neighbours().into_iter().filter(|x| x.id() > u) { - let mut nb_ct = 0; - for nb in evv.neighbours().into_iter().filter(|x| x.id() > v.id()) { - let u_to_v = match graph.edge(u, v.id(), None) { - Some(edge) => { - let r = edge - .explode() - .map(|e| new_triangle_edge(true, 1, 0, 1, 
e.time().unwrap())) - .collect::>(); - r.into_iter() - } - None => vec![].into_iter(), - }; - let v_to_u = match graph.edge(v.id(), u, None) { - Some(edge) => { - let r = edge - .explode() - .map(|e| new_triangle_edge(true, 0, 0, 0, e.time().unwrap())) - .collect::>(); - r.into_iter() - } - None => vec![].into_iter(), - }; - let mut tri_edges: Vec = Vec::new(); - let out = graph.edge(v.id(), nb.id(), None); - let inc = graph.edge(nb.id(), v.id(), None); - // The following code checks for triangles - match (out, inc) { - (Some(o), Some(i)) => { - tri_edges.append( - &mut o - .explode() - .map(|e| new_triangle_edge(false, 1, nb_ct, 1, e.time().unwrap())) - .collect::>(), - ); - tri_edges.append( - &mut i - .explode() - .map(|e| new_triangle_edge(false, 1, nb_ct, 0, e.time().unwrap())) - .collect::>(), - ); - } - (Some(o), None) => { - tri_edges.append( - &mut o - .explode() - .map(|e| new_triangle_edge(false, 1, nb_ct, 1, e.time().unwrap())) - .collect::>(), - ); - } - (None, Some(i)) => { - tri_edges.append( - &mut i - .explode() - .map(|e| new_triangle_edge(false, 1, nb_ct, 0, e.time().unwrap())) - .collect::>(), - ); - } - (None, None) => { - continue; - } - } - if !tri_edges.is_empty() { - let uout = graph.edge(u, nb.id(), None); - let uin = graph.edge(nb.id(), u, None); - match (uout, uin) { - (Some(o), Some(i)) => { - tri_edges.append( - &mut o - .explode() - .map(|e| new_triangle_edge(false, 0, nb_ct, 1, e.time().unwrap())) - .collect::>(), - ); - tri_edges.append( - &mut i - .explode() - .map(|e| new_triangle_edge(false, 0, nb_ct, 0, e.time().unwrap())) - .collect::>(), - ); - } - (Some(o), None) => { - tri_edges.append( - &mut o - .explode() - .map(|e| new_triangle_edge(false, 0, nb_ct, 1, e.time().unwrap())) - .collect::>(), - ); - } - (None, Some(i)) => { - tri_edges.append( - &mut i - .explode() - .map(|e| new_triangle_edge(false, 0, nb_ct, 0, e.time().unwrap())) - .collect::>(), - ); - } - (None, None) => { - continue; - } - } - nb_ct += 1; - // found 
triangle at this point!! - tri_edges.append(&mut u_to_v.collect::>()); - tri_edges.append(&mut v_to_u.collect::>()); - tri_edges.sort_by_key(|e| e.time); - - let mut tri_count = init_tri_count(nb_ct); - tri_count.execute(&tri_edges, delta); - let tmp_counts: Iter = tri_count.return_counts().iter(); - - update_counter(vec![evv, &v, &nb], motif_counter, tmp_counts); - } - } - } -} - -// works fine for 1 shard but breaks on more shard -// v1 - shard1, v2,v3 - shard2 -// distributed acc -// v1 -> v2 (sending new count v2/) -// v2 -> v1 (sending new count v1) 5, 6 (motif 3 c) - -// per vertex (motif counts) -// every iteration (sum them up) -// A -> B -> C-> A (motif 3) - -// A: [1, 2, 3(1), 4, 5, 6, 7, 8], B: [1, 2, 3(1), 4, 5, 6, 7, 8], C: [1, 2, 3(1), 4, 5, 6, 7, 8] - shard1 -// A: [1, 2, 3(0), 4, 5, 6, 7, 8], B: [1, 2, 3(0), 4, 5, 6, 7, 8], C: [1, 2, 3(0), 4, 5, 6, 7, 8] - shard2 -// A: [1, 2, 3(0), 4, 5, 6, 7, 8], B: [1, 2, 3(0), 4, 5, 6, 7, 8], C: [1, 2, 3(0), 4, 5, 6, 7, 8] - shard3 - -// global acc -// 1, 2, 3, 4, 5, 6, 7, 8 - -fn update_counter( - vs: Vec<&EvalVertexView>, - motif_counter: AccId>, - tmp_counts: Iter, -) { - for v in vs { - let mc = v.read(&motif_counter); - let triangle: [usize; 8] = mc - .triangle - .iter() - .zip(tmp_counts.clone()) - .map(|(&i1, &i2)| i1 + i2) - .collect::>() - .try_into() - .unwrap(); - v.update( - &motif_counter, - MotifCounter::from_triangle_counter(triangle), - ); - } -} - -#[derive(Eq, PartialEq, Clone, Debug, Default)] -pub struct MotifCounter { - pub two_nodes: [usize; 8], - pub star_nodes: [usize; 24], - pub triangle: [usize; 8], -} - -impl MotifCounter { - fn new(two_nodes: [usize; 8], star_nodes: [usize; 24], triangle: [usize; 8]) -> Self { - Self { - two_nodes, - star_nodes, - triangle, - } - } - - pub(crate) fn from_triangle_counter(triangle: [usize; 8]) -> Self { - Self { - two_nodes: [0; 8], - star_nodes: [0; 24], - triangle, - } - } -} - -impl Add for MotifCounter { - type Output = MotifCounter; - - fn 
add(self, rhs: Self) -> Self::Output { - rhs - } -} - -impl Zero for MotifCounter { - fn zero() -> Self { - MotifCounter { - two_nodes: [0; 8], - star_nodes: [0; 24], - triangle: [0; 8], - } - } - - fn set_zero(&mut self) { - *self = Zero::zero(); - } - - fn is_zero(&self) -> bool { - self.two_nodes == [0; 8] && self.star_nodes == [0; 24] && self.triangle == [0; 8] - } -} - -pub fn global_temporal_three_node_motif( - graph: &G, - threads: Option, - delta: i64, -) -> Vec { - let counts = temporal_three_node_motif(graph, threads, delta); - let mut tmp_counts = counts.values().fold(vec![0; 40], |acc, x| { - acc.iter().zip(x.iter()).map(|(x1, x2)| x1 + x2).collect() - }); - for ind in 31..40 { - tmp_counts[ind] = tmp_counts[ind] / 3; - } - tmp_counts -} - -pub fn global_temporal_three_node_motif_from_local( - counts: HashMap>, -) -> Vec { - let mut tmp_counts = counts.values().fold(vec![0; 40], |acc, x| { - acc.iter().zip(x.iter()).map(|(x1, x2)| x1 + x2).collect() - }); - for ind in 31..40 { - tmp_counts[ind] = tmp_counts[ind] / 3; - } - tmp_counts -} - -pub fn temporal_three_node_motif( - g: &G, - threads: Option, - delta: i64, -) -> HashMap> { - let mut ctx: Context = g.into(); - let motifs_counter = val::(0); - - ctx.agg(motifs_counter); - - let step1 = ATask::new( - move |evv: &mut EvalVertexView| { - let g = evv.graph; - - triangle_motif_count(g, evv, delta, motifs_counter); - let two_nodes = twonode_motif_count(g, evv, delta); - let star_nodes = star_motif_count(evv, delta); - - *evv.get_mut() = MotifCounter::new( - two_nodes, - star_nodes, - evv.get().triangle, - ); - - Step::Continue - }, - ); - - let mut runner: TaskRunner = TaskRunner::new(ctx); - - runner.run( - vec![], - vec![Job::new(step1)], - MotifCounter::zero(), - |_, _, els, _| { - els.finalize(&motifs_counter, |motifs_counter| { - let triangles = motifs_counter.triangle.to_vec(); - let two_nodes = motifs_counter.two_nodes.to_vec(); - let tmp_stars = motifs_counter.star_nodes.to_vec(); - let stars: 
Vec = tmp_stars - .iter() - .zip(two_nodes.iter().cycle().take(24)) - .map(|(&x1, &x2)| x1 - x2) - .collect(); - let mut final_cts = Vec::new(); - final_cts.extend(stars.into_iter()); - final_cts.extend(two_nodes.into_iter()); - final_cts.extend(triangles.into_iter()); - - final_cts - }) - }, - threads, - 1, - None, - None, - ) -} - -#[cfg(test)] -mod motifs_test { - use super::*; - use crate::db::graph::Graph; - - fn load_graph(n_shards: usize, edges: Vec<(i64, u64, u64)>) -> Graph { - let graph = Graph::new(n_shards); - - for (t, src, dst) in edges { - graph.add_edge(t, src, dst, &vec![], None).unwrap(); - } - graph - } - - #[test] - #[ignore = "This is not correct, it needs a rethink of the algorithm to be parallel"] - fn test_two_node_motif() { - let g = load_graph( - 1, - vec![ - (1, 1, 2), - (2, 1, 3), - (3, 1, 4), - (4, 3, 1), - (5, 3, 4), - (6, 3, 5), - (7, 4, 5), - (8, 5, 6), - (9, 5, 8), - (10, 7, 5), - (11, 8, 5), - (12, 1, 9), - (13, 9, 1), - (14, 6, 3), - (15, 4, 8), - (16, 8, 3), - (17, 5, 10), - (18, 10, 5), - (19, 10, 8), - (20, 1, 11), - (21, 11, 1), - (22, 9, 11), - (23, 11, 9), - ], - ); - - let actual = temporal_three_node_motif(&g, None, 10); - - let expected: HashMap> = HashMap::from([ - ( - "1".to_string(), - vec![ - 0, 0, 0, 0, 1, 2, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 2, 0, 0, 0, 3, 0, 0, 0, - 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 2, 0, - ], - ), - ( - "10".to_string(), - vec![ - 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, - 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, - ], - ), - ( - "11".to_string(), - vec![ - 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, - 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, - ], - ), - ( - "2".to_string(), - vec![ - 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, - 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, - ], - ), - ( - "3".to_string(), - vec![ - 0, 0, 0, 2, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 
- 0, 0, 0, 0, 0, 0, 0, 1, 0, 2, 0, 1, 2, 0, - ], - ), - ( - "4".to_string(), - vec![ - 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, - 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 2, 0, - ], - ), - ( - "5".to_string(), - vec![ - 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 4, 0, 0, 0, 3, 0, 0, 0, - 0, 0, 0, 0, 0, 0, 1, 2, 1, 3, 0, 1, 1, 1, - ], - ), - ( - "6".to_string(), - vec![ - 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, - 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, - ], - ), - ( - "7".to_string(), - vec![ - 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, - 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, - ], - ), - ( - "8".to_string(), - vec![ - 0, 0, 2, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, - 0, 0, 0, 0, 0, 0, 1, 2, 1, 2, 0, 1, 0, 1, - ], - ), - ( - "9".to_string(), - vec![ - 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, - 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, - ], - ), - ]); - - for ind in 1..12 { - assert_eq!( - actual.get(&ind.to_string()).unwrap(), - expected.get(&ind.to_string()).unwrap() - ); - } - } -} diff --git a/raphtory/src/algorithms/motifs/three_node_local_single_thread.rs b/raphtory/src/algorithms/motifs/three_node_local_single_thread.rs new file mode 100644 index 0000000000..2cad41bb5a --- /dev/null +++ b/raphtory/src/algorithms/motifs/three_node_local_single_thread.rs @@ -0,0 +1,445 @@ +use crate::algorithms::algorithm_result::AlgorithmResult; +/// This class regards the counting of the number of three edge, up-to-three node delta-temporal motifs in the graph, using the algorithm of Paranjape et al, Motifs in Temporal Networks (2017). +/// We point the reader to this reference for more information on the algorithm and background, but provide a short summary below. 
+/// +/// ## Motifs included +/// +/// ### Stars +/// +/// There are three classes (in the order they are outputted) of star motif on three nodes based on the switching behaviour of the edges between the two leaf nodes. +/// +/// - PRE: Stars of the form i<->j, i<->j, i<->k (ie two interactions with leaf j followed by one with leaf k) +/// - MID: Stars of the form i<->j, i<->k, i<->j (ie switching interactions from leaf j to leaf k, back to j again) +/// - POST: Stars of the form i<->j, i<->k, i<->k (ie one interaction with leaf j followed by two with leaf k) +/// +/// Within each of these classes is 8 motifs depending on the direction of the first to the last edge -- incoming "I" or outgoing "O". +/// These are enumerated in the order III, IIO, IOI, IOO, OII, OIO, OOI, OOO (like binary with "I"-0 and "O"-1). +/// +/// ### Two node motifs +/// +/// Also included are two node motifs, of which there are 8 when counted from the perspective of each vertex. These are characterised by the direction of each edge, enumerated +/// in the above order. Note that for the global graph counts, each motif is counted in both directions (a single III motif for one vertex is an OOO motif for the other vertex). +/// +/// ### Triangles +/// +/// There are 8 triangle motifs: +/// +/// 1. i --> j, k --> j, i --> k +/// 2. i --> j, k --> i, j --> k +/// 3. i --> j, j --> k, i --> k +/// 4. i --> j, i --> k, j --> k +/// 5. i --> j, k --> j, k --> i +/// 6. i --> j, k --> i, k --> j +/// 7. i --> j, j --> k, k --> i +/// 8. 
i --> j, i --> k, k --> j +/// +use crate::{algorithms::motifs::three_node_motifs::*, db::api::view::*}; +use std::collections::HashMap; + +/// Counts the 24 star motifs centred on vertex `v` within the time window `delta`. +/// +/// Each neighbour of `v` is indexed by its position in the neighbour iteration, and every exploded edge of `v` +/// becomes a star event (neighbour index, direction 1 when `v` is the source and 0 otherwise, edge time). +/// The events are sorted by time and fed to a star counter sized by the number of neighbours. +/// Returns all zeros when `v` is not in the graph. Panics if `time()` yields no value for an exploded edge. +fn star_motif_count(graph: &G, v: u64, delta: i64) -> [usize; 24] { + if let Some(vertex) = graph.vertex(v) { + let neigh_map: HashMap = vertex + .neighbours() + .iter() + .enumerate() + .map(|(num, nb)| (nb.id(), num)) + .into_iter() + .collect(); + let mut exploded_edges = vertex + .edges() + .explode() + .map(|edge| { + if edge.src().id() == v { + star_event(neigh_map[&edge.dst().id()], 1, edge.time().unwrap()) + } else { + star_event(neigh_map[&edge.src().id()], 0, edge.time().unwrap()) + } + }) + .collect::>(); + exploded_edges.sort_by_key(|e| e.time); + let mut star_count = init_star_count(neigh_map.len()); + star_count.execute(&exploded_edges, delta); + star_count.return_counts() + } else { + [0; 24] + } +} + +/// Counts the 8 two-node motifs that vertex `v` takes part in within the time window `delta`. +/// +/// For every neighbour, the exploded edges in both directions between `v` and that neighbour are turned into +/// two-node events (direction 1 for edges leaving `v`, 0 for edges arriving at `v`), sorted by time and counted; +/// the per-neighbour counts are summed. Returns all zeros when `v` is not in the graph. +fn twonode_motif_count(graph: &G, v: u64, delta: i64) -> [usize; 8] { + let mut counts = [0; 8]; + if let Some(vertex) = graph.vertex(v) { + for nb in vertex.neighbours().iter() { + let nb_id = nb.id(); + let out = graph.edge(vertex.id(), nb_id); + let inc = graph.edge(nb_id, vertex.id()); + let mut all_exploded = match (out, inc) { + (Some(o), Some(i)) => o + .explode() + .chain(i.explode()) + .map(|e| { + two_node_event(if e.src().id() == v { 1 } else { 0 }, e.time().unwrap()) + }) + .collect::>(), + (Some(o), None) => o + .explode() + .map(|e| two_node_event(1, e.time().unwrap())) + .collect::>(), + (None, Some(i)) => i + .explode() + .map(|e| two_node_event(0, e.time().unwrap())) + .collect::>(), + (None, None) => Vec::new(), + }; + all_exploded.sort_by_key(|e| e.time); + let mut two_node_counter = init_two_node_count(); + two_node_counter.execute(&all_exploded, delta); + let two_node_result = two_node_counter.return_counts(); + for i in 0..8 { + counts[i] += two_node_result[i]; + } + } + } + counts +} + +/// Counts, for every vertex, the 8 triangle motifs it takes part in within the time window `delta`. +/// +/// Every vertex starts with eight zero counts. Candidate triples are enumerated as a vertex `u`, a neighbour `v` +/// of `u` with a larger id, and a neighbour `nb` of `u` with an id larger than `v`'s; a triple is skipped unless +/// an edge exists between `v` and `nb` and between `u` and `nb`. The exploded edges among the three vertices +/// are sorted by time and counted, and the resulting 8 counts are added to `u`, `v` and `nb` alike. +fn triangle_motif_count( + graph: &G, + delta: i64, +) -> AlgorithmResult> { + let mut counts: HashMap> = 
HashMap::new(); + for u in graph.vertices() { + counts.insert(u.id(), vec![0; 8]); + } + for u in graph.vertices() { + let uid = u.id(); + for v in u.neighbours().iter().filter(|x| x.id() > uid) { + for nb in u.neighbours().iter().filter(|x| x.id() > v.id()) { + let mut tri_edges: Vec = Vec::new(); + let out = graph.edge(v.id(), nb.id()); + let inc = graph.edge(nb.id(), v.id()); + // The following code checks for triangles + match (out, inc) { + (Some(o), Some(i)) => { + tri_edges.append( + &mut o + .explode() + .map(|e| new_triangle_edge(false, 1, 0, 1, e.time().unwrap())) + .collect::>(), + ); + tri_edges.append( + &mut i + .explode() + .map(|e| new_triangle_edge(false, 1, 0, 0, e.time().unwrap())) + .collect::>(), + ); + } + (Some(o), None) => { + tri_edges.append( + &mut o + .explode() + .map(|e| new_triangle_edge(false, 1, 0, 1, e.time().unwrap())) + .collect::>(), + ); + } + (None, Some(i)) => { + tri_edges.append( + &mut i + .explode() + .map(|e| new_triangle_edge(false, 1, 0, 0, e.time().unwrap())) + .collect::>(), + ); + } + (None, None) => { + continue; + } + } + if !tri_edges.is_empty() { + let uout = graph.edge(uid, nb.id()); + let uin = graph.edge(nb.id(), uid); + match (uout, uin) { + (Some(o), Some(i)) => { + tri_edges.append( + &mut o + .explode() + .map(|e| new_triangle_edge(false, 0, 0, 1, e.time().unwrap())) + .collect::>(), + ); + tri_edges.append( + &mut i + .explode() + .map(|e| new_triangle_edge(false, 0, 0, 0, e.time().unwrap())) + .collect::>(), + ); + } + (Some(o), None) => { + tri_edges.append( + &mut o + .explode() + .map(|e| new_triangle_edge(false, 0, 0, 1, e.time().unwrap())) + .collect::>(), + ); + } + (None, Some(i)) => { + tri_edges.append( + &mut i + .explode() + .map(|e| new_triangle_edge(false, 0, 0, 0, e.time().unwrap())) + .collect::>(), + ); + } + (None, None) => { + continue; + } + } + // found triangle at this point!! 
+ let u_to_v = match graph.edge(uid, v.id()) { + Some(edge) => { + let r = edge + .explode() + .map(|e| new_triangle_edge(true, 1, 0, 1, e.time().unwrap())) + .collect::>(); + r.into_iter() + } + None => vec![].into_iter(), + }; + let v_to_u = match graph.edge(v.id(), uid) { + Some(edge) => { + let r = edge + .explode() + .map(|e| new_triangle_edge(true, 0, 0, 0, e.time().unwrap())) + .collect::>(); + r.into_iter() + } + None => vec![].into_iter(), + }; + tri_edges.append(&mut u_to_v.collect::>()); + tri_edges.append(&mut v_to_u.collect::>()); + tri_edges.sort_by_key(|e| e.time); + + let mut tri_count = init_tri_count(1); + tri_count.execute(&tri_edges, delta); + let tmp_counts = tri_count.return_counts().iter(); + for id in [uid, v.id(), nb.id()] { + counts.insert( + id, + counts + .get(&id) + .unwrap() + .iter() + .zip(tmp_counts.clone()) + .map(|(&i1, &i2)| i1 + i2) + .collect::>(), + ); + } + } + } + } + } + AlgorithmResult::new(counts) +} + +/// Computes the number of each type of motif that each node participates in. +/// +/// # Arguments +/// +/// * `graph` - A reference to the graph +/// * `delta` - Maximum time difference between the first and last edge of the +/// motif. NB if time for edges was given as a UNIX epoch, this should be given in seconds, otherwise +/// milliseconds should be used (if edge times were given as string) +/// +/// # Returns +/// +/// A dictionary with vertex ids (u64) as keys and a 40 dimensional array of motif counts as a value. The first 24 elements are star counts, +/// the next 8 are two-node motif counts and the final 8 are triangle counts. +/// +/// # Notes +/// +/// For this local count, a node is counted as participating in a motif in the following way. For star motifs, only the centre node counts +/// the motif. For two node motifs, both constituent nodes count the motif. For triangles, all three constituent nodes count the motif. 
+/// +/// +pub fn local_temporal_three_node_motifs( + graph: &G, + delta: i64, +) -> AlgorithmResult> { + let mut counts = triangle_motif_count(graph, delta).get_all().to_owned(); + for v in graph.vertices() { + let vid = v.id(); + let two_nodes = twonode_motif_count(graph, vid, delta).to_vec(); + let tmp_stars = star_motif_count(graph, vid, delta); + // Subtract the two-node counts from the raw star counts; the 8 two-node entries are repeated three times to line up with the 24 star entries. + // NOTE(review): presumably the star counter also picks up patterns confined to a single neighbour -- confirm. + let stars: Vec = tmp_stars + .iter() + .zip(two_nodes.iter().cycle().take(24)) + .map(|(&x1, &x2)| x1 - x2) + .collect(); + // Output layout: 24 star counts, then 8 two-node counts, then the 8 triangle counts already stored for this vertex. + let mut final_cts = Vec::new(); + final_cts.extend(stars.into_iter()); + final_cts.extend(two_nodes.into_iter()); + final_cts.extend(counts.get(&vid).unwrap().into_iter()); + counts.insert(vid, final_cts); + } + AlgorithmResult::new(counts) +} + +/// Computes the number of each type of motif there is in the graph. +/// +/// # Arguments +/// +/// * `graph` - A reference to the graph +/// * `delta` - Maximum time difference between the first and last edge of the +/// motif. NB if time for edges was given as a UNIX epoch, this should be given in seconds, otherwise +/// milliseconds should be used (if edge times were given as string) +/// +/// # Returns +/// +/// A 40 dimensional array with the counts of each motif, given in the same order as described in the module documentation. Note that the two-node motif counts are symmetrical so it may be more useful just to consider the first four elements. +/// +/// # Notes +/// +/// This is achieved by calling the local motif counting algorithm, summing the resulting arrays and correcting the overcounted triangles by dividing each triangle count by three. The two-node motif counts are not halved, so each two-node motif is counted once from each of its two vertices. 
+/// +/// +pub fn global_temporal_three_node_motifs(graph: &G, delta: i64) -> Vec { + let counts = local_temporal_three_node_motifs(graph, delta) + .get_all() + .to_owned(); + let mut tmp_counts = counts.values().fold(vec![0; 40], |acc, x| { + acc.iter().zip(x.iter()).map(|(x1, x2)| x1 + x2).collect() + }); + for ind in 32..40 { + tmp_counts[ind] /= 3; + } + tmp_counts +} + +#[cfg(test)] +mod local_motif_test { + use crate::{ + algorithms::motifs::three_node_local_single_thread::*, + db::{api::mutation::AdditionOps, graph::graph::Graph}, + prelude::NO_PROPS, + }; + + #[test] + fn test_init() { + let graph = Graph::new(); + + let vs = vec![ + (1, 2, 1), + (1, 3, 2), + (1, 4, 3), + (3, 1, 4), + (3, 4, 5), + (3, 5, 6), + (4, 5, 7), + (5, 6, 8), + (5, 8, 9), + (7, 5, 10), + (8, 5, 11), + (1, 9, 12), + (9, 1, 13), + (6, 3, 14), + (4, 8, 15), + (8, 3, 16), + (5, 10, 17), + (10, 5, 18), + (10, 8, 19), + (1, 11, 20), + (11, 1, 21), + (9, 11, 22), + (11, 9, 23), + ]; + + for (src, dst, time) in &vs { + graph.add_edge(*time, *src, *dst, NO_PROPS, None).unwrap(); + } + + // let counts = star_motif_count(&graph, 1, 100); + let counts = local_temporal_three_node_motifs(&graph, 10); + // FIXME: Should test this + let _global_counts = global_temporal_three_node_motifs(&graph, 10); + let expected: HashMap> = HashMap::from([ + ( + 1, + vec![ + 0, 0, 0, 0, 1, 2, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 2, 0, 0, 0, 3, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 2, 0, + ], + ), + ( + 10, + vec![ + 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, + ], + ), + ( + 11, + vec![ + 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, + ], + ), + ( + 2, + vec![ + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, + ], + ), + ( + 3, + vec![ + 0, 0, 0, 2, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 1, 0, 2, 0, 1, 2, 0, + ], + ), + ( + 4, + vec![ + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 2, 0, + ], + ), + ( + 5, + vec![ + 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 4, 0, 0, 0, 3, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 1, 2, 1, 3, 0, 1, 1, 1, + ], + ), + ( + 6, + vec![ + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, + ], + ), + ( + 7, + vec![ + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, + ], + ), + ( + 8, + vec![ + 0, 0, 2, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 1, 2, 1, 2, 0, 1, 0, 1, + ], + ), + ( + 9, + vec![ + 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, + ], + ), + ]); + for ind in 1..12 { + assert_eq!(counts.get(&ind).unwrap(), expected.get(&ind).unwrap()); + } + // print!("{:?}", global_counts); + } +} diff --git a/raphtory/src/algorithms/motifs/three_node_motifs.rs b/raphtory/src/algorithms/motifs/three_node_motifs.rs index c55262a735..fa5e5fc445 100644 --- a/raphtory/src/algorithms/motifs/three_node_motifs.rs +++ b/raphtory/src/algorithms/motifs/three_node_motifs.rs @@ -72,7 +72,7 @@ pub fn init_two_node_count() -> TwoNodeCounter { // Star Motifs pub struct StarEvent { nb: usize, - dir: usize, + pub dir: usize, pub time: i64, } @@ -81,7 +81,7 @@ pub fn star_event(nb: usize, dir: usize, time: i64) -> StarEvent { } pub struct StarCounter { - N: usize, + n: usize, pre_nodes: Vec, post_nodes: Vec, pre_sum: [usize; 8], @@ -94,41 +94,41 @@ pub struct StarCounter { impl StarCounter { fn push_pre(&mut self, cur_edge: &StarEvent) { self.pre_sum[map2d(INCOMING, cur_edge.dir)] += - self.pre_nodes[INCOMING * self.N + cur_edge.nb]; + self.pre_nodes[INCOMING * 
self.n + cur_edge.nb]; self.pre_sum[map2d(OUTGOING, cur_edge.dir)] += - self.pre_nodes[OUTGOING * self.N + cur_edge.nb]; - self.pre_nodes[cur_edge.dir * self.N + cur_edge.nb] += 1; + self.pre_nodes[OUTGOING * self.n + cur_edge.nb]; + self.pre_nodes[cur_edge.dir * self.n + cur_edge.nb] += 1; } fn push_post(&mut self, cur_edge: &StarEvent) { self.post_sum[map2d(INCOMING, cur_edge.dir)] += - self.post_nodes[INCOMING * self.N + cur_edge.nb]; + self.post_nodes[INCOMING * self.n + cur_edge.nb]; self.post_sum[map2d(OUTGOING, cur_edge.dir)] += - self.post_nodes[OUTGOING * self.N + cur_edge.nb]; - self.post_nodes[cur_edge.dir * self.N + cur_edge.nb] += 1; + self.post_nodes[OUTGOING * self.n + cur_edge.nb]; + self.post_nodes[cur_edge.dir * self.n + cur_edge.nb] += 1; } fn pop_pre(&mut self, cur_edge: &StarEvent) { - self.pre_nodes[cur_edge.dir * self.N + cur_edge.nb] -= 1; + self.pre_nodes[cur_edge.dir * self.n + cur_edge.nb] -= 1; self.pre_sum[map2d(cur_edge.dir, INCOMING)] -= - self.pre_nodes[INCOMING * self.N + cur_edge.nb]; + self.pre_nodes[INCOMING * self.n + cur_edge.nb]; self.pre_sum[map2d(cur_edge.dir, OUTGOING)] -= - self.pre_nodes[OUTGOING * self.N + cur_edge.nb]; + self.pre_nodes[OUTGOING * self.n + cur_edge.nb]; } fn pop_post(&mut self, cur_edge: &StarEvent) { - self.post_nodes[cur_edge.dir * self.N + cur_edge.nb] -= 1; + self.post_nodes[cur_edge.dir * self.n + cur_edge.nb] -= 1; self.post_sum[map2d(cur_edge.dir, INCOMING)] -= - self.post_nodes[INCOMING * self.N + cur_edge.nb]; + self.post_nodes[INCOMING * self.n + cur_edge.nb]; self.post_sum[map2d(cur_edge.dir, OUTGOING)] -= - self.post_nodes[OUTGOING * self.N + cur_edge.nb]; + self.post_nodes[OUTGOING * self.n + cur_edge.nb]; } fn process_current(&mut self, cur_edge: &StarEvent) { self.mid_sum[map2d(INCOMING, cur_edge.dir)] -= - self.pre_nodes[INCOMING * self.N + cur_edge.nb]; + self.pre_nodes[INCOMING * self.n + cur_edge.nb]; self.mid_sum[map2d(OUTGOING, cur_edge.dir)] -= - self.pre_nodes[OUTGOING * self.N + 
cur_edge.nb]; + self.pre_nodes[OUTGOING * self.n + cur_edge.nb]; for (d1, d2) in DIRS2D { self.count_pre[map3d(d1, d2, cur_edge.dir)] += self.pre_sum[map2d(d1, d2)]; @@ -137,24 +137,24 @@ impl StarCounter { } self.mid_sum[map2d(cur_edge.dir, INCOMING)] += - self.post_nodes[INCOMING * self.N + cur_edge.nb]; + self.post_nodes[INCOMING * self.n + cur_edge.nb]; self.mid_sum[map2d(cur_edge.dir, OUTGOING)] += - self.post_nodes[OUTGOING * self.N + cur_edge.nb]; + self.post_nodes[OUTGOING * self.n + cur_edge.nb]; } pub fn execute(&mut self, edges: &Vec, delta: i64) { - let L = edges.len(); - if L < 3 { + let l = edges.len(); + if l < 3 { return; } let mut start = 0; let mut end = 0; - for j in 0..L { - while start < L && edges[start].time + delta < edges[j].time { + for j in 0..l { + while start < l && edges[start].time + delta < edges[j].time { self.pop_pre(&edges[start]); start += 1; } - while (end < L) && edges[end].time <= edges[j].time + delta { + while (end < l) && edges[end].time <= edges[j].time + delta { self.push_post(&edges[end]); end += 1; } @@ -174,11 +174,11 @@ impl StarCounter { counts } } -pub fn init_star_count(N: usize) -> StarCounter { +pub fn init_star_count(n: usize) -> StarCounter { StarCounter { - N: N, - pre_nodes: vec![0; 2 * N], - post_nodes: vec![0; 2 * N], + n, + pre_nodes: vec![0; 2 * n], + post_nodes: vec![0; 2 * n], pre_sum: [0; 8], mid_sum: [0; 8], post_sum: [0; 8], @@ -214,7 +214,7 @@ pub fn new_triangle_edge( } pub struct TriangleCounter { - N: usize, + n: usize, pre_nodes: Vec, post_nodes: Vec, pre_sum: [usize; 8], @@ -224,18 +224,18 @@ pub struct TriangleCounter { } impl TriangleCounter { pub fn execute(&mut self, edges: &Vec, delta: i64) { - let L = edges.len(); - if L < 3 { + let l = edges.len(); + if l < 3 { return; } let mut start = 0; let mut end = 0; - for j in 0..L { - while start < L && edges[start].time + delta < edges[j].time { + for j in 0..l { + while start < l && edges[start].time + delta < edges[j].time { 
self.pop_pre(&edges[start]); start += 1; } - while (end < L) && edges[end].time <= edges[j].time + delta { + while (end < l) && edges[end].time <= edges[j].time + delta { self.push_post(&edges[end]); end += 1; } @@ -249,10 +249,10 @@ impl TriangleCounter { let (is_uor_v, nb, dir) = (cur_edge.uorv, cur_edge.nb, cur_edge.dir); if !cur_edge.uv_edge { self.pre_sum[map3d(1 - is_uor_v, INCOMING, dir)] += - self.pre_nodes[self.N * map2d(INCOMING, 1 - is_uor_v) + nb]; + self.pre_nodes[self.n * map2d(INCOMING, 1 - is_uor_v) + nb]; self.pre_sum[map3d(1 - is_uor_v, OUTGOING, dir)] += - self.pre_nodes[self.N * map2d(OUTGOING, 1 - is_uor_v) + nb]; - self.pre_nodes[self.N * map2d(dir, is_uor_v) + nb] += 1; + self.pre_nodes[self.n * map2d(OUTGOING, 1 - is_uor_v) + nb]; + self.pre_nodes[self.n * map2d(dir, is_uor_v) + nb] += 1; } } @@ -260,32 +260,32 @@ impl TriangleCounter { let (is_uor_v, nb, dir) = (cur_edge.uorv, cur_edge.nb, cur_edge.dir); if !cur_edge.uv_edge { self.post_sum[map3d(1 - is_uor_v, INCOMING, dir)] += - self.post_nodes[self.N * map2d(INCOMING, 1 - is_uor_v) + nb]; + self.post_nodes[self.n * map2d(INCOMING, 1 - is_uor_v) + nb]; self.post_sum[map3d(1 - is_uor_v, OUTGOING, dir)] += - self.post_nodes[self.N * map2d(OUTGOING, 1 - is_uor_v) + nb]; - self.post_nodes[self.N * map2d(dir, is_uor_v) + nb] += 1; + self.post_nodes[self.n * map2d(OUTGOING, 1 - is_uor_v) + nb]; + self.post_nodes[self.n * map2d(dir, is_uor_v) + nb] += 1; } } fn pop_pre(&mut self, cur_edge: &TriangleEdge) { let (is_uor_v, nb, dir) = (cur_edge.uorv, cur_edge.nb, cur_edge.dir); if !cur_edge.uv_edge { - self.pre_nodes[self.N * map2d(dir, is_uor_v) + nb] -= 1; + self.pre_nodes[self.n * map2d(dir, is_uor_v) + nb] -= 1; self.pre_sum[map3d(is_uor_v, dir, INCOMING)] -= - self.pre_nodes[self.N * map2d(INCOMING, 1 - is_uor_v)]; + self.pre_nodes[self.n * map2d(INCOMING, 1 - is_uor_v)]; self.pre_sum[map3d(is_uor_v, dir, OUTGOING)] -= - self.pre_nodes[self.N * map2d(OUTGOING, 1 - is_uor_v)]; + 
self.pre_nodes[self.n * map2d(OUTGOING, 1 - is_uor_v)]; } } fn pop_post(&mut self, cur_edge: &TriangleEdge) { let (is_uor_v, nb, dir) = (cur_edge.uorv, cur_edge.nb, cur_edge.dir); if !cur_edge.uv_edge { - self.post_nodes[self.N * map2d(dir, is_uor_v) + nb] -= 1; + self.post_nodes[self.n * map2d(dir, is_uor_v) + nb] -= 1; self.post_sum[map3d(is_uor_v, dir, INCOMING)] -= - self.post_nodes[self.N * map2d(INCOMING, 1 - is_uor_v)]; + self.post_nodes[self.n * map2d(INCOMING, 1 - is_uor_v)]; self.post_sum[map3d(is_uor_v, dir, OUTGOING)] -= - self.post_nodes[self.N * map2d(OUTGOING, 1 - is_uor_v)]; + self.post_nodes[self.n * map2d(OUTGOING, 1 - is_uor_v)]; } } @@ -293,13 +293,13 @@ impl TriangleCounter { let (is_uor_v, nb, dir) = (cur_edge.uorv, cur_edge.nb, cur_edge.dir); if !cur_edge.uv_edge { self.mid_sum[map3d(1 - is_uor_v, INCOMING, dir)] -= - self.pre_nodes[self.N * map2d(INCOMING, 1 - is_uor_v) + nb]; + self.pre_nodes[self.n * map2d(INCOMING, 1 - is_uor_v) + nb]; self.mid_sum[map3d(1 - is_uor_v, OUTGOING, dir)] -= - self.pre_nodes[self.N * map2d(OUTGOING, 1 - is_uor_v) + nb]; + self.pre_nodes[self.n * map2d(OUTGOING, 1 - is_uor_v) + nb]; self.mid_sum[map3d(is_uor_v, dir, INCOMING)] += - self.post_nodes[self.N * map2d(INCOMING, 1 - is_uor_v) + nb]; + self.post_nodes[self.n * map2d(INCOMING, 1 - is_uor_v) + nb]; self.mid_sum[map3d(is_uor_v, dir, OUTGOING)] += - self.post_nodes[self.N * map2d(OUTGOING, 1 - is_uor_v) + nb]; + self.post_nodes[self.n * map2d(OUTGOING, 1 - is_uor_v) + nb]; } else { self.final_counts[0] += self.mid_sum[map3d(dir, 0, 0)] + self.post_sum[map3d(dir, 0, 1)] @@ -334,7 +334,7 @@ impl TriangleCounter { } pub fn init_tri_count(n: usize) -> TriangleCounter { TriangleCounter { - N: n, + n: n, pre_nodes: vec![0; 4 * n], post_nodes: vec![0; 4 * n], pre_sum: [0; 8], diff --git a/raphtory/src/algorithms/motifs/three_node_temporal_motifs.rs b/raphtory/src/algorithms/motifs/three_node_temporal_motifs.rs new file mode 100644 index 0000000000..d1cbd35711 --- 
/dev/null +++ b/raphtory/src/algorithms/motifs/three_node_temporal_motifs.rs @@ -0,0 +1,632 @@ +// Imports /////////////////////////////////////////// +use crate::{ + algorithms::{k_core::k_core_set, motifs::three_node_motifs::*}, + core::state::{ + accumulator_id::{ + accumulators::{self, val}, + AccId, + }, + agg::ValDef, + compute_state::ComputeStateVec, + }, + db::{ + api::view::{GraphViewOps, VertexViewOps, *}, + graph::{edge::EdgeView, views::vertex_subgraph::VertexSubgraph}, + task::{ + context::Context, + edge::eval_edge::EvalEdgeView, + task::{ATask, Job, Step}, + task_runner::TaskRunner, + vertex::eval_vertex::EvalVertexView, + }, + }, +}; + +use crate::core::entities::vertices::vertex_ref::VertexRef; +use itertools::{enumerate, Itertools}; +use num_traits::Zero; +use rand::{rngs::StdRng, Rng, SeedableRng}; +use rustc_hash::FxHashSet; +use std::{cmp::Ordering, collections::HashMap, ops::Add, slice::Iter}; +/////////////////////////////////////////////////////// + +// State objects for three node motifs +#[derive(Eq, PartialEq, Clone, Debug)] +pub struct MotifCounter { + pub two_nodes: Vec<[usize; 8]>, + pub star_nodes: Vec<[usize; 24]>, + pub triangle: Vec<[usize; 8]>, +} + +impl MotifCounter { + fn new( + size: usize, + two_nodes: Vec<[usize; 8]>, + star_nodes: Vec<[usize; 24]>, + triangle: Vec<[usize; 8]>, + ) -> Self { + let _ = size; + Self { + two_nodes: two_nodes, + star_nodes: star_nodes, + triangle: triangle, + } + } +} + +impl Default for MotifCounter { + fn default() -> Self { + Self::zero() + } +} + +impl Add for MotifCounter { + type Output = MotifCounter; + + fn add(self, rhs: Self) -> Self::Output { + rhs + } +} + +impl Zero for MotifCounter { + fn zero() -> Self { + MotifCounter { + two_nodes: vec![], + star_nodes: vec![], + triangle: vec![], + } + } + + fn set_zero(&mut self) { + *self = Zero::zero(); + } + + fn is_zero(&self) -> bool { + self.two_nodes.is_empty() && self.star_nodes.is_empty() && self.triangle.is_empty() + } +} + 
+/////////////////////////////////////////////////////// + +/// Counts the 24 star motifs centred on the vertex `evv`, once for each time window in `deltas`. +/// +/// Neighbours are indexed by their position in `evv.neighbours()`, and the exploded edges of `evv`, ordered by +/// `time_and_index()`, become star events with direction 1 when `evv` is the source and 0 otherwise. +/// A fresh star counter sized by `evv.degree()` is run per delta; the returned vector holds one `[usize; 24]` +/// per entry of `deltas`, in the same order. +pub fn star_motif_count( + evv: &EvalVertexView, + deltas: Vec, +) -> Vec<[usize; 24]> +where + G: GraphViewOps, +{ + let neigh_map: HashMap = evv + .neighbours() + .into_iter() + .enumerate() + .map(|(num, nb)| (nb.id(), num)) + .collect(); + let mut events = evv + .edges() + .explode() + .sorted_by_key(|e| e.time_and_index()) + .map(|edge| { + if edge.src().id() == evv.id() { + star_event(neigh_map[&edge.dst().id()], 1, edge.time().unwrap()) + } else { + star_event(neigh_map[&edge.src().id()], 0, edge.time().unwrap()) + } + }) + .collect::>(); + + deltas + .into_iter() + .map(|delta| { + let mut star_count = init_star_count(evv.degree()); + star_count.execute(&events, delta); + star_count.return_counts() + }) + .collect::>() +} + +/////////////////////////////////////////////////////// + +/// Counts the 8 two-node motifs that the vertex `evv` takes part in, once for each time window in `deltas`. +/// +/// For every neighbour, the exploded edges in both directions between `evv` and that neighbour are ordered by +/// `time_and_index()` and turned into two-node events (direction 1 when `evv` is the source, 0 otherwise). +/// A fresh two-node counter is run per delta and its 8 counts are added to that delta's running total; +/// the returned vector holds one `[usize; 8]` per entry of `deltas`, in the same order. +pub fn twonode_motif_count( + graph: &G, + evv: &EvalVertexView, + deltas: Vec, +) -> Vec<[usize; 8]> +where + G: GraphViewOps, +{ + let mut results = deltas.iter().map(|_| [0; 8]).collect::>(); + + // Define a closure for sorting by time_and_index() + // NOTE(review): this closure is not referenced anywhere else in this function; the ordering below is done with sorted_by_key. + let sort_by_time_and_index = |e1: &EdgeView, e2: &EdgeView| -> Ordering { + Ord::cmp(&e1.time_and_index(), &e2.time_and_index()) + }; + + for nb in evv.neighbours().into_iter() { + let nb_id = nb.id(); + let out = graph.edge(evv.id(), nb_id); + let inc = graph.edge(nb_id, evv.id()); + let mut events: Vec = out + .iter() + .flat_map(|e| e.explode()) + .chain(inc.iter().flat_map(|e| e.explode())) + .sorted_by_key(|e| e.time_and_index()) + .map(|e| { + two_node_event( + if e.src().id() == evv.id() { 1 } else { 0 }, + e.time().unwrap(), + ) + }) + .collect(); + for j in 0..deltas.len() { + let mut two_node_counter = init_two_node_count(); + two_node_counter.execute(&events, deltas[j]); + let two_node_result = two_node_counter.return_counts(); + for i in 0..8 { + results[j][i] += two_node_result[i]; + } + } + } + results +} + 
+/////////////////////////////////////////////////////// + +pub fn triangle_motifs( + graph: &G, + deltas: Vec, + _motifs_count_id: AccId>, + threads: Option, +) -> HashMap> +where + G: GraphViewOps, +{ + let delta_len = deltas.len(); + + // Define a closure for sorting by time_and_index() + let sort_by_time_and_index = + |e1: &EdgeView>, e2: &EdgeView>| -> Ordering { + Ord::cmp(&e1.time_and_index(), &e2.time_and_index()) + }; + + // Define a closure for sorting by time() + let vertex_set = k_core_set(graph, 2, usize::MAX, None); + let g: VertexSubgraph = graph.subgraph(vertex_set); + let mut ctx: Context, ComputeStateVec> = Context::from(&g); + + let neighbours_set = accumulators::hash_set::(1); + + ctx.agg(neighbours_set); + + let step1 = ATask::new( + move |u: &mut EvalVertexView, ComputeStateVec, MotifCounter>| { + for v in u.neighbours() { + if u.id() > v.id() { + v.update(&neighbours_set, u.id()); + } + } + Step::Continue + }, + ); + + let step2 = ATask::new( + move |u: &mut EvalVertexView, ComputeStateVec, MotifCounter>| { + let uu = u.get_mut(); + if uu.triangle.len() == 0 { + uu.triangle = vec![[0 as usize; 8]; delta_len]; + } + for v in u.neighbours() { + // Find triangles on the UV edge + if u.id() > v.id() { + let intersection_nbs = { + match ( + u.entry(&neighbours_set) + .read_ref() + .unwrap_or(&FxHashSet::default()), + v.entry(&neighbours_set) + .read_ref() + .unwrap_or(&FxHashSet::default()), + ) { + (u_set, v_set) => { + let intersection = + u_set.intersection(v_set).cloned().collect::>(); + intersection + } + } + }; + + if intersection_nbs.is_empty() { + continue; + } + // let mut nb_ct = 0; + intersection_nbs.iter().for_each(|w| { + // For each triangle, run the triangle count. 
+ + let mut all_exploded = vec![u.id(), v.id(), *w] + .into_iter() + .sorted() + .permutations(2) + .flat_map(|e| { + g.edge(e.get(0).unwrap().clone(), e.get(1).unwrap().clone()) + .iter() + .flat_map(|edge| edge.explode()) + .collect::>() + }) + .sorted_by_key(|e| e.time_and_index()) + .map(|e| { + let (src_id, dst_id) = (e.src().id(), e.dst().id()); + let (uid, vid) = (u.id(), v.id()); + if src_id == w.clone() { + new_triangle_edge( + false, + if dst_id == uid { 0 } else { 1 }, + 0, + 0, + e.time().unwrap(), + ) + } else if dst_id == w.clone() { + new_triangle_edge( + false, + if src_id == uid { 0 } else { 1 }, + 0, + 1, + e.time().unwrap(), + ) + } else if src_id == uid { + new_triangle_edge(true, 1, 0, 1, e.time().unwrap()) + } else { + new_triangle_edge(true, 0, 0, 0, e.time().unwrap()) + } + }) + .collect::>(); + + for i in 0..deltas.len() { + let delta = deltas[i]; + let mut tri_count = init_tri_count(2); + tri_count.execute(&all_exploded, delta); + let tmp_counts: Iter = tri_count.return_counts().iter(); + + // Triangle counts are going to be WRONG without w + // update_counter(&mut vec![u, &v], motifs_count_id, tmp_counts); + + let mc_u = u.get_mut(); + let triangle_u = mc_u.triangle[i] + .iter() + .zip(tmp_counts.clone()) + .map(|(&i1, &i2)| i1 + i2) + .collect::>() + .try_into() + .unwrap(); + mc_u.triangle[i] = triangle_u; + } + }) + } + } + Step::Continue + }, + ); + + let mut runner: TaskRunner, _> = TaskRunner::new(ctx); + + runner.run( + vec![Job::new(step1)], + vec![Job::read_only(step2)], + None, + |_, _, _els, local| { + let mut tri_motifs = HashMap::new(); + let layers = graph.layer_ids(); + let edge_filter = graph.edge_filter(); + for (vref, mc) in enumerate(local) { + if graph.has_vertex_ref(VertexRef::Internal(vref.into()), &layers, edge_filter) { + let v_gid = graph.vertex_name(vref.into()); + if mc.triangle.is_empty() { + tri_motifs.insert(v_gid.clone(), vec![[0; 8]; delta_len]); + } else { + tri_motifs.insert(v_gid.clone(), mc.triangle); + 
} + } + } + tri_motifs + }, + threads, + 1, + None, + None, + ) +} + +/////////////////////////////////////////////////////// + +pub fn temporal_three_node_motif( + g: &G, + deltas: Vec, + threads: Option, +) -> HashMap>> +where + G: GraphViewOps, +{ + let mut ctx: Context = g.into(); + let motifs_counter = val::(0); + let delta_len = deltas.len(); + + ctx.agg(motifs_counter); + + let out1 = triangle_motifs(g, deltas.clone(), motifs_counter, threads); + + let step1 = ATask::new( + move |evv: &mut EvalVertexView| { + let g = evv.graph; + + let two_nodes = twonode_motif_count(g, evv, deltas.clone()); + let star_nodes = star_motif_count(evv, deltas.clone()); + + *evv.get_mut() = MotifCounter::new( + deltas.len(), + two_nodes, + star_nodes, + evv.get().triangle.clone(), + ); + + Step::Continue + }, + ); + + let mut runner: TaskRunner = TaskRunner::new(ctx); + + let out2 = runner.run( + vec![Job::new(step1)], + vec![], + None, + |_, _, _els, local| { + let mut motifs = HashMap::new(); + for (vref, mc) in enumerate(local) { + let v_gid = g.vertex_name(vref.into()); + let triangles = out1 + .get(&v_gid) + .map(|v| v.clone()) + .unwrap_or_else(|| vec![[0 as usize; 8]; delta_len]); + let run_counts = (0..delta_len) + .map(|i| { + let two_nodes = mc.two_nodes[i].to_vec(); + let tmp_stars = mc.star_nodes[i].to_vec(); + let stars: Vec = tmp_stars + .iter() + .zip(two_nodes.iter().cycle().take(24)) + .map(|(&x1, &x2)| x1 - x2) + .collect(); + let mut final_cts = Vec::new(); + final_cts.extend(stars.into_iter()); + final_cts.extend(two_nodes.into_iter()); + final_cts.extend(triangles[i].into_iter()); + final_cts + }) + .collect::>>(); + motifs.insert(v_gid.clone(), run_counts); + } + motifs + }, + threads, + 1, + None, + None, + ); + out2 +} + +pub fn global_temporal_three_node_motif_from_local( + counts: HashMap>, +) -> Vec { + let tmp_counts = counts.values().fold(vec![0; 40], |acc, x| { + acc.iter().zip(x.iter()).map(|(x1, x2)| x1 + x2).collect() + }); + tmp_counts +} + +pub 
fn global_temporal_three_node_motif( + graph: &G, + delta: i64, + threads: Option, +) -> Vec { + let counts = global_temporal_three_node_motif_general(graph, vec![delta], threads); + counts[0].clone() +} + +pub fn global_temporal_three_node_motif_general( + graph: &G, + deltas: Vec, + threads: Option, +) -> Vec> { + let counts = temporal_three_node_motif(graph, deltas.clone(), threads); + + let mut result: Vec> = vec![vec![0; 40]; deltas.len()]; + for (_, values) in counts.iter() { + for i in 0..deltas.len() { + for j in 0..40 { + result[i][j] += values[i][j] + } + } + } + result +} + +#[cfg(test)] +mod motifs_test { + use super::*; + use crate::{ + db::{api::mutation::AdditionOps, graph::graph::Graph}, + prelude::NO_PROPS, + }; + + fn load_graph(edges: Vec<(i64, u64, u64)>) -> Graph { + let graph = Graph::new(); + + for (t, src, dst) in edges { + graph.add_edge(t, src, dst, NO_PROPS, None).unwrap(); + } + graph + } + + #[test] + #[ignore = "This is not correct, local version does not work"] + fn test_two_node_motif() { + let g = load_graph(vec![ + (1, 1, 2), + (2, 1, 3), + (3, 1, 4), + (4, 3, 1), + (5, 3, 4), + (6, 3, 5), + (7, 4, 5), + (8, 5, 6), + (9, 5, 8), + (10, 7, 5), + (11, 8, 5), + (12, 1, 9), + (13, 9, 1), + (14, 6, 3), + (15, 4, 8), + (16, 8, 3), + (17, 5, 10), + (18, 10, 5), + (19, 10, 8), + (20, 1, 11), + (21, 11, 1), + (22, 9, 11), + (23, 11, 9), + ]); + + let binding = temporal_three_node_motif(&g, Vec::from([10]), None); + let actual = binding + .iter() + .map(|(k, v)| (k, v[0].clone())) + .into_iter() + .collect::>>(); + + let expected: HashMap> = HashMap::from([ + ( + "1".to_string(), + vec![ + 0, 0, 0, 0, 1, 2, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 2, 0, 0, 0, 3, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 2, 0, + ], + ), + ( + "10".to_string(), + vec![ + 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, + ], + ), + ( + "11".to_string(), + vec![ + 0, 0, 1, 1, 0, 0, 0, 0, 0, 
0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, + ], + ), + ( + "2".to_string(), + vec![ + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, + ], + ), + ( + "3".to_string(), + vec![ + 0, 0, 0, 2, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 1, 0, 2, 0, 1, 2, 0, + ], + ), + ( + "4".to_string(), + vec![ + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 2, 0, + ], + ), + ( + "5".to_string(), + vec![ + 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 4, 0, 0, 0, 3, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 1, 2, 1, 3, 0, 1, 1, 1, + ], + ), + ( + "6".to_string(), + vec![ + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, + ], + ), + ( + "7".to_string(), + vec![ + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, + ], + ), + ( + "8".to_string(), + vec![ + 0, 0, 2, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 1, 2, 1, 2, 0, 1, 0, 1, + ], + ), + ( + "9".to_string(), + vec![ + 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, + ], + ), + ]); + + for ind in 3..12 { + assert_eq!( + actual.get(&ind.to_string()).unwrap(), + expected.get(&ind.to_string()).unwrap() + ); + } + } + + #[test] + fn test_global() { + let g = load_graph(vec![ + (1, 1, 2), + (2, 1, 3), + (3, 1, 4), + (4, 3, 1), + (5, 3, 4), + (6, 3, 5), + (7, 4, 5), + (8, 5, 6), + (9, 5, 8), + (10, 7, 5), + (11, 8, 5), + (12, 1, 9), + (13, 9, 1), + (14, 6, 3), + (15, 4, 8), + (16, 8, 3), + (17, 5, 10), + (18, 10, 5), + (19, 10, 8), + (20, 1, 11), + (21, 11, 1), + (22, 9, 11), + (23, 11, 9), + ]); + + let global_motifs = 
&global_temporal_three_node_motif(&g, 10, None); + assert_eq!( + *global_motifs, + vec![ + 0, 0, 3, 6, 2, 3, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 6, 0, 0, 1, 7, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 2, 3, 2, 4, 1, 2, 3, 1 + ] + .into_iter() + .map(|x| x as usize) + .collect::>() + ); + } +} diff --git a/raphtory/src/algorithms/pagerank.rs b/raphtory/src/algorithms/pagerank.rs index a04ac8a43d..828620afee 100644 --- a/raphtory/src/algorithms/pagerank.rs +++ b/raphtory/src/algorithms/pagerank.rs @@ -1,21 +1,23 @@ -use num_traits::abs; - -use crate::core::vertex_ref::LocalVertexRef; -use crate::db::view_api::VertexViewOps; use crate::{ - core::state::{accumulator_id::accumulators, compute_state::ComputeStateVec} , + algorithms::algorithm_result::AlgorithmResult, + core::{ + entities::{vertices::vertex_ref::VertexRef, VID}, + state::{accumulator_id::accumulators, compute_state::ComputeStateVec}, + }, db::{ + api::view::{GraphViewOps, VertexViewOps}, task::{ context::Context, task::{ATask, Job, Step}, task_runner::TaskRunner, }, - view_api::GraphViewOps, }, }; +use num_traits::abs; +use ordered_float::OrderedFloat; use std::collections::HashMap; -#[derive(Clone, Debug)] +#[derive(Clone, Debug, Default)] struct PageRankState { score: f64, out_degree: usize, @@ -34,6 +36,21 @@ impl PageRankState { } } +/// PageRank Algorithm: +/// PageRank shows how important a vertex is in a graph. 
+/// +/// Arguments: +/// +/// * `g`: A GraphView object +/// * `iter_count`: Number of iterations to run the algorithm for +/// * `threads`: Number of threads to use for parallel execution +/// * `tol`: The tolerance value for convergence +/// * `use_l2_norm`: Whether to use L2 norm for convergence +/// +/// Result: +/// +/// * An AlgorithmResult object containing the mapping from vertex ID to the PageRank score of the vertex +/// #[allow(unused_variables)] pub fn unweighted_page_rank( g: &G, @@ -41,9 +58,9 @@ pub fn unweighted_page_rank( threads: Option, tol: Option, use_l2_norm: bool, -) -> HashMap { - let n = g.num_vertices(); - let total_edges = g.num_edges(); +) -> AlgorithmResult> { + let n = g.count_vertices(); + let total_edges = g.count_edges(); let mut ctx: Context = g.into(); @@ -139,20 +156,23 @@ pub fn unweighted_page_rank( let mut runner: TaskRunner = TaskRunner::new(ctx); - let num_vertices = g.num_vertices(); + let num_vertices = g.count_vertices(); - let out: HashMap = runner.run( + let out: HashMap = runner.run( vec![Job::new(step1)], vec![Job::new(step2), Job::new(step3), Job::new(step4), step5], - PageRankState::new(num_vertices), - |g, _, _, local| { + Some(vec![PageRankState::new(num_vertices); num_vertices]), + |_, _, _, local| { + let layers = g.layer_ids(); + let edge_filter = g.edge_filter(); local .iter() - .filter_map(|line| { - line.as_ref() - .map(|(v_ref, state)| (v_ref.clone(), state.score)) + .enumerate() + .filter_map(|(v_ref, score)| { + g.has_vertex_ref(VertexRef::Internal(v_ref.into()), &layers, edge_filter) + .then_some((v_ref.into(), score.score)) }) - .collect::>() + .collect::>() }, threads, iter_count, @@ -160,9 +180,12 @@ pub fn unweighted_page_rank( None, ); - out.into_iter() + let res = out + .into_iter() .map(|(k, v)| (g.vertex_name(k), v)) - .collect() + .collect(); + + AlgorithmResult::new(res) } #[cfg(test)] @@ -172,27 +195,29 @@ mod page_rank_tests { use itertools::Itertools; use pretty_assertions::assert_eq; - use 
crate::db::graph::Graph; + use crate::{ + db::{api::mutation::AdditionOps, graph::graph::Graph}, + prelude::NO_PROPS, + }; use super::*; - fn load_graph(n_shards: usize) -> Graph { - let graph = Graph::new(n_shards); + fn load_graph() -> Graph { + let graph = Graph::new(); let edges = vec![(1, 2), (1, 4), (2, 3), (3, 1), (4, 1)]; for (src, dst) in edges { - graph.add_edge(0, src, dst, &vec![], None).unwrap(); + graph.add_edge(0, src, dst, NO_PROPS, None).unwrap(); } graph } - fn test_page_rank(n_shards: usize) { - let graph = load_graph(n_shards); + #[test] + fn test_page_rank() { + let graph = load_graph(); - let results: HashMap = unweighted_page_rank(&graph, 1000, Some(1), None, true) - .into_iter() - .collect(); + let results = unweighted_page_rank(&graph, 1000, Some(1), None, true); assert_eq_f64(results.get("1"), Some(&0.38694), 5); assert_eq_f64(results.get("2"), Some(&0.20195), 5); @@ -200,26 +225,6 @@ mod page_rank_tests { assert_eq_f64(results.get("3"), Some(&0.20916), 5); } - #[test] - fn test_page_rank_1() { - test_page_rank(1); - } - - #[test] - fn test_page_rank_2() { - test_page_rank(2); - } - - #[test] - fn test_page_rank_3() { - test_page_rank(3); - } - - #[test] - fn test_page_rank_4() { - test_page_rank(4); - } - #[test] fn motif_page_rank() { let edges = vec![ @@ -248,15 +253,13 @@ mod page_rank_tests { (11, 9, 23), ]; - let graph = Graph::new(4); + let graph = Graph::new(); for (src, dst, t) in edges { - graph.add_edge(t, src, dst, &vec![], None).unwrap(); + graph.add_edge(t, src, dst, NO_PROPS, None).unwrap(); } - let results: HashMap = unweighted_page_rank(&graph, 1000, Some(4), None, true) - .into_iter() - .collect(); + let results = unweighted_page_rank(&graph, 1000, Some(4), None, true); assert_eq_f64(results.get("10"), Some(&0.072082), 5); assert_eq_f64(results.get("8"), Some(&0.136473), 5); @@ -275,15 +278,13 @@ mod page_rank_tests { fn two_nodes_page_rank() { let edges = vec![(1, 2), (2, 1)]; - let graph = Graph::new(4); + let graph = 
Graph::new(); for (t, (src, dst)) in edges.into_iter().enumerate() { - graph.add_edge(t as i64, src, dst, &vec![], None).unwrap(); + graph.add_edge(t as i64, src, dst, NO_PROPS, None).unwrap(); } - let results: HashMap = unweighted_page_rank(&graph, 1000, Some(4), None, false) - .into_iter() - .collect(); + let results = unweighted_page_rank(&graph, 1000, Some(4), None, false); assert_eq_f64(results.get("1"), Some(&0.5), 3); assert_eq_f64(results.get("2"), Some(&0.5), 3); @@ -293,15 +294,13 @@ mod page_rank_tests { fn three_nodes_page_rank_one_dangling() { let edges = vec![(1, 2), (2, 1), (2, 3)]; - let graph = Graph::new(4); + let graph = Graph::new(); for (t, (src, dst)) in edges.into_iter().enumerate() { - graph.add_edge(t as i64, src, dst, &vec![], None).unwrap(); + graph.add_edge(t as i64, src, dst, NO_PROPS, None).unwrap(); } - let results: HashMap = unweighted_page_rank(&graph, 10, Some(4), None, false) - .into_iter() - .collect(); + let results = unweighted_page_rank(&graph, 10, Some(4), None, false); assert_eq_f64(results.get("1"), Some(&0.303), 3); assert_eq_f64(results.get("2"), Some(&0.393), 3); @@ -331,15 +330,13 @@ mod page_rank_tests { .map(|(t, (src, dst))| (src, dst, t as i64)) .collect_vec(); - let graph = Graph::new(4); + let graph = Graph::new(); for (src, dst, t) in edges { - graph.add_edge(t, src, dst, &vec![], None).unwrap(); + graph.add_edge(t, src, dst, NO_PROPS, None).unwrap(); } - let results: HashMap = unweighted_page_rank(&graph, 1000, Some(4), None, true) - .into_iter() - .collect(); + let results = unweighted_page_rank(&graph, 1000, Some(4), None, true); assert_eq_f64(results.get("1"), Some(&0.055), 3); assert_eq_f64(results.get("2"), Some(&0.079), 3); @@ -367,10 +364,7 @@ mod page_rank_tests { (Some(a), Some(b)) => { let left = (a.borrow() * factor).round(); let right = (b.borrow() * factor).round(); - assert_eq!( - left, - right, - ); + assert_eq!(left, right,); } _ => unreachable!(), } diff --git 
a/raphtory/src/algorithms/reciprocity.rs b/raphtory/src/algorithms/reciprocity.rs index 46bc7b8fa2..e03ca5b647 100644 --- a/raphtory/src/algorithms/reciprocity.rs +++ b/raphtory/src/algorithms/reciprocity.rs @@ -23,9 +23,8 @@ //! //! ```rust //! use raphtory::algorithms::reciprocity::{all_local_reciprocity, global_reciprocity}; -//! use raphtory::db::graph::Graph; -//! use raphtory::db::view_api::*; -//! let g = Graph::new(1); +//! use raphtory::prelude::*; +//! let g = Graph::new(); //! let vs = vec![ //! (1, 1, 2), //! (1, 1, 4), @@ -38,20 +37,30 @@ //! ]; //! //! for (t, src, dst) in &vs { -//! g.add_edge(*t, *src, *dst, &vec![], None); +//! g.add_edge(*t, *src, *dst, NO_PROPS, None).unwrap(); //! } //! //! println!("all_local_reciprocity: {:?}", all_local_reciprocity(&g, None)); //! println!("global_reciprocity: {:?}", global_reciprocity(&g, None)); //! ``` -use crate::core::state::accumulator_id::accumulators::sum; -use crate::core::state::compute_state::{ComputeState, ComputeStateVec}; -use crate::db::task::context::Context; -use crate::db::task::eval_vertex::EvalVertexView; -use crate::db::task::task::{ATask, Job, Step}; -use crate::db::task::task_runner::TaskRunner; -use crate::db::view_api::{GraphViewOps, VertexViewOps}; -use std::collections::{HashMap, HashSet}; +use crate::{ + algorithms::algorithm_result::AlgorithmResult, + core::state::{ + accumulator_id::accumulators::sum, + compute_state::{ComputeState, ComputeStateVec}, + }, + db::{ + api::view::{GraphViewOps, VertexViewOps}, + task::{ + context::Context, + task::{ATask, Job, Step}, + task_runner::TaskRunner, + vertex::eval_vertex::EvalVertexView, + }, + }, +}; +use ordered_float::OrderedFloat; +use std::collections::HashSet; /// Gets the unique edge counts excluding cycles for a vertex. 
Returns a tuple of usize /// (out neighbours, in neighbours, the intersection of the out and in neighbours) @@ -90,7 +99,7 @@ pub fn global_reciprocity(g: &G, threads: Option) -> f64 runner.run( vec![], vec![Job::new(step1)], - (), + None, |egs, _, _, _| { (egs.finalize(&total_out_inter_in) as f64) / (egs.finalize(&total_out_neighbours) as f64) @@ -103,17 +112,18 @@ pub fn global_reciprocity(g: &G, threads: Option) -> f64 } /// returns the reciprocity of every vertex in the graph as a tuple of +/// vector id and the reciprocity pub fn all_local_reciprocity( g: &G, threads: Option, -) -> HashMap { +) -> AlgorithmResult> { let mut ctx: Context = g.into(); let min = sum(0); ctx.agg(min); let step1 = ATask::new(move |evv| { - let edge_counts = get_reciprocal_edge_count(&evv); + let edge_counts = get_reciprocal_edge_count(evv); let res = (2.0 * edge_counts.2 as f64) / (edge_counts.1 as f64 + edge_counts.0 as f64); if res.is_nan() { evv.global_update(&min, 0.0); @@ -125,28 +135,31 @@ pub fn all_local_reciprocity( let mut runner: TaskRunner = TaskRunner::new(ctx); - runner.run( + AlgorithmResult::new(runner.run( vec![], vec![Job::new(step1)], - (), + None, |_, ess, _, _| ess.finalize(&min, |min| min), threads, 1, None, None, - ) + )) } #[cfg(test)] mod reciprocity_test { - use crate::algorithms::reciprocity::{all_local_reciprocity, global_reciprocity}; - use crate::db::graph::Graph; + use crate::{ + algorithms::reciprocity::{all_local_reciprocity, global_reciprocity}, + db::{api::mutation::AdditionOps, graph::graph::Graph}, + prelude::NO_PROPS, + }; use pretty_assertions::assert_eq; use std::collections::HashMap; #[test] fn test_global_recip() { - let graph = Graph::new(2); + let graph = Graph::new(); let vs = vec![ (1, 2), @@ -160,26 +173,20 @@ mod reciprocity_test { ]; for (src, dst) in &vs { - graph.add_edge(0, *src, *dst, &vec![], None).unwrap(); + graph.add_edge(0, *src, *dst, NO_PROPS, None).unwrap(); } let actual = global_reciprocity(&graph, None); 
assert_eq!(actual, 0.5); - let expected_vec: Vec<(String, f64)> = vec![ - ("1".to_string(), 0.4), - ("2".to_string(), 2.0 / 3.0), - ("3".to_string(), 0.5), - ("4".to_string(), 2.0 / 3.0), - ("5".to_string(), 0.0), - ]; - - let map_names_by_id: HashMap = expected_vec - .iter() - .map(|x| (x.0.to_string(), x.1)) - .collect(); + let mut hash_map_result: HashMap = HashMap::new(); + hash_map_result.insert("1".to_string(), 0.4); + hash_map_result.insert("2".to_string(), 2.0 / 3.0); + hash_map_result.insert("3".to_string(), 0.5); + hash_map_result.insert("4".to_string(), 2.0 / 3.0); + hash_map_result.insert("5".to_string(), 0.0); - let actual = all_local_reciprocity(&graph, None); - assert_eq!(actual, map_names_by_id); + let res = all_local_reciprocity(&graph, None); + assert_eq!(res.get("1"), hash_map_result.get("1")); } } diff --git a/raphtory/src/algorithms/generic_taint.rs b/raphtory/src/algorithms/temporal_reachability.rs similarity index 60% rename from raphtory/src/algorithms/generic_taint.rs rename to raphtory/src/algorithms/temporal_reachability.rs index 5ad7cbb043..971ddd91ab 100644 --- a/raphtory/src/algorithms/generic_taint.rs +++ b/raphtory/src/algorithms/temporal_reachability.rs @@ -1,14 +1,22 @@ -use crate::core::state::accumulator_id::accumulators::{hash_set, min, or}; -use crate::core::state::compute_state::ComputeStateVec; -use crate::core::vertex::InputVertex; -use crate::db::task::context::Context; -use crate::db::task::task::{ATask, Job, Step}; -use crate::db::task::task_runner::TaskRunner; -use crate::db::view_api::edge::EdgeViewOps; -use crate::db::view_api::{GraphViewOps, TimeOps, VertexViewOps}; +use crate::{ + algorithms::algorithm_result::AlgorithmResult, + core::{ + entities::vertices::input_vertex::InputVertex, + state::{ + accumulator_id::accumulators::{hash_set, min, or}, + compute_state::ComputeStateVec, + }, + }, + db::task::{ + context::Context, + task::{ATask, Job, Step}, + task_runner::TaskRunner, + vertex::eval_vertex::EvalVertexView, 
+ }, + prelude::*, +}; use itertools::Itertools; use num_traits::Zero; -use std::collections::HashMap; use std::ops::Add; #[derive(Eq, Hash, PartialEq, Clone, Debug, Default)] @@ -46,18 +54,31 @@ impl Zero for TaintMessage { } } -pub fn generic_taint( +/// Temporal Reachability starts from a set of seed nodes and propagates the taint to all nodes that are reachable +/// from the seed nodes within a given time window. The algorithm stops when all nodes that are reachable from the +/// seed nodes have been tainted or when the taint has propagated to all nodes in the graph. +/// +/// Returns +/// +/// * An AlgorithmResult object containing the mapping from vertex ID to a vector of tuples containing the time at which +/// the vertex was tainted and the ID of the vertex that tainted it +/// +pub fn temporally_reachable_nodes( g: &G, threads: Option, - iter_count: usize, + max_hops: usize, start_time: i64, - infected_nodes: Vec, - stop_nodes: Vec, -) -> HashMap> { + seed_nodes: Vec, + stop_nodes: Option>, +) -> AlgorithmResult> { let mut ctx: Context = g.into(); - let infected_nodes = infected_nodes.into_iter().map(|n| n.id()).collect_vec(); - let stop_nodes = stop_nodes.into_iter().map(|n| n.id()).collect_vec(); + let infected_nodes = seed_nodes.into_iter().map(|n| n.id()).collect_vec(); + let stop_nodes = stop_nodes + .unwrap_or(vec![]) + .into_iter() + .map(|n| n.id()) + .collect_vec(); let taint_status = or(0); ctx.global_agg(taint_status); @@ -74,36 +95,38 @@ pub fn generic_taint( let tainted_vertices = hash_set::(4); ctx.global_agg(tainted_vertices); - let step1 = ATask::new(move |evv| { - if infected_nodes.contains(&evv.id()) { - evv.global_update(&tainted_vertices, evv.id()); - evv.update(&taint_status, true); - evv.update(&earliest_taint_time, start_time); - evv.update( - &taint_history, - TaintMessage { - event_time: start_time, - src_vertex: "start".to_string(), - }, - ); - evv.window(start_time, i64::MAX) - .out_edges() - .for_each(|eev| { - let dst = 
eev.dst(); - eev.history().into_iter().for_each(|t| { - dst.update(&earliest_taint_time, t); - dst.update( - &recv_tainted_msgs, - TaintMessage { - event_time: t, - src_vertex: evv.name(), - }, - ) + let step1 = ATask::new( + move |evv: &mut EvalVertexView<'_, G, ComputeStateVec, ()>| { + if infected_nodes.contains(&evv.id()) { + evv.global_update(&tainted_vertices, evv.id()); + evv.update(&taint_status, true); + evv.update(&earliest_taint_time, start_time); + evv.update( + &taint_history, + TaintMessage { + event_time: start_time, + src_vertex: "start".to_string(), + }, + ); + evv.window(start_time, i64::MAX) + .out_edges() + .for_each(|eev| { + let dst = eev.dst(); + eev.history().into_iter().for_each(|t| { + dst.update(&earliest_taint_time, t); + dst.update( + &recv_tainted_msgs, + TaintMessage { + event_time: t, + src_vertex: evv.name(), + }, + ) + }); }); - }); - } - Step::Continue - }); + } + Step::Continue + }, + ); let step2 = ATask::new(move |evv| { let msgs = evv.read(&recv_tainted_msgs); @@ -158,10 +181,10 @@ pub fn generic_taint( let mut runner: TaskRunner = TaskRunner::new(ctx); - runner.run( + AlgorithmResult::new(runner.run( vec![Job::new(step1)], vec![Job::new(step2), step3], - (), + None, |_, ess, _, _| { ess.finalize(&taint_history, |taint_history| { taint_history @@ -171,22 +194,22 @@ pub fn generic_taint( }) }, threads, - iter_count, + max_hops, None, None, - ) + )) } #[cfg(test)] mod generic_taint_tests { use super::*; - use crate::db::graph::Graph; + use crate::db::{api::mutation::AdditionOps, graph::graph::Graph}; - fn load_graph(n_shards: usize, edges: Vec<(i64, u64, u64)>) -> Graph { - let graph = Graph::new(n_shards); + fn load_graph(edges: Vec<(i64, u64, u64)>) -> Graph { + let graph = Graph::new(); for (t, src, dst) in edges { - graph.add_edge(t, src, dst, &vec![], None).unwrap(); + graph.add_edge(t, src, dst, NO_PROPS, None).unwrap(); } graph } @@ -196,9 +219,9 @@ mod generic_taint_tests { iter_count: usize, start_time: i64, 
infected_nodes: Vec, - stop_nodes: Vec, + stop_nodes: Option>, ) -> Vec<(String, Vec<(i64, String)>)> { - let mut results: Vec<(String, Vec<(i64, String)>)> = generic_taint( + let results: Vec<(String, Vec<(i64, String)>)> = temporally_reachable_nodes( &graph, None, iter_count, @@ -206,6 +229,7 @@ mod generic_taint_tests { infected_nodes, stop_nodes, ) + .sort_by_key(false) .into_iter() .map(|(k, mut v)| { v.sort(); @@ -213,29 +237,25 @@ mod generic_taint_tests { }) .collect_vec(); - results.sort(); results } #[test] fn test_generic_taint_1() { - let graph = load_graph( - 1, - vec![ - (10, 1, 3), - (11, 1, 2), - (12, 2, 4), - (13, 2, 5), - (14, 5, 5), - (14, 5, 4), - (5, 4, 6), - (15, 4, 7), - (10, 4, 7), - (10, 5, 8), - ], - ); - - let results = test_generic_taint(graph, 20, 11, vec![2], vec![]); + let graph = load_graph(vec![ + (10, 1, 3), + (11, 1, 2), + (12, 2, 4), + (13, 2, 5), + (14, 5, 5), + (14, 5, 4), + (5, 4, 6), + (15, 4, 7), + (10, 4, 7), + (10, 5, 8), + ]); + + let results = test_generic_taint(graph, 20, 11, vec![2], None); assert_eq!( results, @@ -253,29 +273,27 @@ mod generic_taint_tests { ), ("6".to_string(), vec![]), ("7".to_string(), vec![(15, "4".to_string())]), + ("8".to_string(), vec![]), ]) ); } #[test] fn test_generic_taint_1_multiple_start() { - let graph = load_graph( - 1, - vec![ - (10, 1, 3), - (11, 1, 2), - (12, 2, 4), - (13, 2, 5), - (14, 5, 5), - (14, 5, 4), - (5, 4, 6), - (15, 4, 7), - (10, 4, 7), - (10, 5, 8), - ], - ); - - let results = test_generic_taint(graph, 20, 11, vec![1, 2], vec![]); + let graph = load_graph(vec![ + (10, 1, 3), + (11, 1, 2), + (12, 2, 4), + (13, 2, 5), + (14, 5, 5), + (14, 5, 4), + (5, 4, 6), + (15, 4, 7), + (10, 4, 7), + (10, 5, 8), + ]); + + let results = test_generic_taint(graph, 20, 11, vec![1, 2], None); assert_eq!( results, @@ -296,29 +314,27 @@ mod generic_taint_tests { ), ("6".to_string(), vec![]), ("7".to_string(), vec![(15, "4".to_string())]), + ("8".to_string(), vec![]), ]) ); } #[test] fn 
test_generic_taint_1_stop_nodes() { - let graph = load_graph( - 1, - vec![ - (10, 1, 3), - (11, 1, 2), - (12, 2, 4), - (13, 2, 5), - (14, 5, 5), - (14, 5, 4), - (5, 4, 6), - (15, 4, 7), - (10, 4, 7), - (10, 5, 8), - ], - ); - - let results = test_generic_taint(graph, 20, 11, vec![1, 2], vec![4, 5]); + let graph = load_graph(vec![ + (10, 1, 3), + (11, 1, 2), + (12, 2, 4), + (13, 2, 5), + (14, 5, 5), + (14, 5, 4), + (5, 4, 6), + (15, 4, 7), + (10, 4, 7), + (10, 5, 8), + ]); + + let results = test_generic_taint(graph, 20, 11, vec![1, 2], Some(vec![4, 5])); assert_eq!( results, @@ -331,31 +347,31 @@ mod generic_taint_tests { ("3".to_string(), vec![]), ("4".to_string(), vec![(12, "2".to_string())]), ("5".to_string(), vec![(13, "2".to_string())]), + ("6".to_string(), vec![]), + ("7".to_string(), vec![]), + ("8".to_string(), vec![]), ]) ); } #[test] fn test_generic_taint_1_multiple_history_points() { - let graph = load_graph( - 1, - vec![ - (10, 1, 3), - (11, 1, 2), - (12, 1, 2), - (9, 1, 2), - (12, 2, 4), - (13, 2, 5), - (14, 5, 5), - (14, 5, 4), - (5, 4, 6), - (15, 4, 7), - (10, 4, 7), - (10, 5, 8), - ], - ); - - let results = test_generic_taint(graph, 20, 11, vec![1, 2], vec![4, 5]); + let graph = load_graph(vec![ + (10, 1, 3), + (11, 1, 2), + (12, 1, 2), + (9, 1, 2), + (12, 2, 4), + (13, 2, 5), + (14, 5, 5), + (14, 5, 4), + (5, 4, 6), + (15, 4, 7), + (10, 4, 7), + (10, 5, 8), + ]); + + let results = test_generic_taint(graph, 20, 11, vec![1, 2], Some(vec![4, 5])); assert_eq!( results, @@ -372,6 +388,9 @@ mod generic_taint_tests { ("3".to_string(), vec![]), ("4".to_string(), vec![(12, "2".to_string())]), ("5".to_string(), vec![(13, "2".to_string())]), + ("6".to_string(), vec![]), + ("7".to_string(), vec![]), + ("8".to_string(), vec![]), ]) ); } diff --git a/raphtory/src/algorithms/triangle_count.rs b/raphtory/src/algorithms/triangle_count.rs index e9748edf58..f7454c1680 100644 --- a/raphtory/src/algorithms/triangle_count.rs +++ 
b/raphtory/src/algorithms/triangle_count.rs @@ -1,9 +1,17 @@ -use crate::core::state::accumulator_id::accumulators; -use crate::core::state::compute_state::ComputeStateVec; -use crate::db::task::context::Context; -use crate::db::task::task::{ATask, Job, Step}; -use crate::db::task::task_runner::TaskRunner; -use crate::db::view_api::*; +use crate::{ + algorithms::k_core::k_core_set, + core::state::{accumulator_id::accumulators, compute_state::ComputeStateVec}, + db::{ + api::view::*, + graph::views::vertex_subgraph::VertexSubgraph, + task::{ + context::Context, + task::{ATask, Job, Step}, + task_runner::TaskRunner, + vertex::eval_vertex::EvalVertexView, + }, + }, +}; use rustc_hash::FxHashSet; /// Computes the number of triangles in a graph using a fast algorithm @@ -21,10 +29,10 @@ use rustc_hash::FxHashSet; /// # Example /// ```rust /// use std::{cmp::Reverse, iter::once}; -/// use raphtory::db::graph::Graph; /// use raphtory::algorithms::triangle_count::triangle_count; +/// use raphtory::prelude::*; /// -/// let graph = Graph::new(2); +/// let graph = Graph::new(); /// /// let edges = vec![ /// // triangle 1 @@ -44,29 +52,34 @@ use rustc_hash::FxHashSet; /// ]; /// /// for (src, dst, ts) in edges { -/// graph.add_edge(ts, src, dst, &vec![], None); +/// graph.add_edge(ts, src, dst, NO_PROPS, None); /// } /// /// let actual_tri_count = triangle_count(&graph, None); /// ``` /// -pub fn triangle_count(g: &G, threads: Option) -> usize { - let mut ctx: Context = g.into(); +pub fn triangle_count(graph: &G, threads: Option) -> usize { + let vertex_set = k_core_set(graph, 2, usize::MAX, None); + let g = graph.subgraph(vertex_set); + let mut ctx: Context, ComputeStateVec> = Context::from(&g); + // let mut ctx: Context = graph.into(); let neighbours_set = accumulators::hash_set::(0); let count = accumulators::sum::(1); ctx.agg(neighbours_set); ctx.global_agg(count); - let step1 = ATask::new(move |s| { - for t in s.neighbours() { - if s.id() > t.id() { - 
t.update(&neighbours_set, s.id()); + let step1 = ATask::new( + move |s: &mut EvalVertexView<'_, VertexSubgraph, ComputeStateVec, ()>| { + for t in s.neighbours() { + if s.id() > t.id() { + t.update(&neighbours_set, s.id()); + } } - } - Step::Continue - }); + Step::Continue + }, + ); let step2 = ATask::new(move |s| { for t in s.neighbours() { @@ -98,12 +111,12 @@ pub fn triangle_count(g: &G, threads: Option) -> usize { let init_tasks = vec![Job::new(step1)]; let tasks = vec![Job::new(step2)]; - let mut runner: TaskRunner = TaskRunner::new(ctx); + let mut runner: TaskRunner, _> = TaskRunner::new(ctx); runner.run( init_tasks, tasks, - (), + None, |egs, _, _, _| egs.finalize(&count), threads, 1, @@ -115,11 +128,14 @@ pub fn triangle_count(g: &G, threads: Option) -> usize { #[cfg(test)] mod triangle_count_tests { use super::*; - use crate::db::graph::Graph; + use crate::{ + db::{api::mutation::AdditionOps, graph::graph::Graph}, + prelude::NO_PROPS, + }; #[test] fn triangle_count_1() { - let graph = Graph::new(2); + let graph = Graph::new(); let edges = vec![ // triangle 1 @@ -139,7 +155,7 @@ mod triangle_count_tests { ]; for (src, dst, ts) in edges { - graph.add_edge(ts, src, dst, &vec![], None).unwrap(); + graph.add_edge(ts, src, dst, NO_PROPS, None).unwrap(); } let actual_tri_count = triangle_count(&graph, Some(2)); @@ -149,7 +165,7 @@ mod triangle_count_tests { #[test] fn triangle_count_3() { - let graph = Graph::new(2); + let graph = Graph::new(); let edges = vec![ (1, 2, 1), @@ -178,7 +194,7 @@ mod triangle_count_tests { ]; for (src, dst, ts) in edges { - graph.add_edge(ts, src, dst, &vec![], None).unwrap(); + graph.add_edge(ts, src, dst, NO_PROPS, None).unwrap(); } let actual_tri_count = triangle_count(&graph, None); diff --git a/raphtory/src/algorithms/triplet_count.rs b/raphtory/src/algorithms/triplet_count.rs index 695af8df14..5302dd59ec 100644 --- a/raphtory/src/algorithms/triplet_count.rs +++ b/raphtory/src/algorithms/triplet_count.rs @@ -14,10 +14,9 @@ //! 
# Example //! //! ```rust -//! use raphtory::db::graph::Graph; +//! use raphtory::prelude::*; //! use raphtory::algorithms::triplet_count::triplet_count; -//! use raphtory::db::view_api::*; -//! let graph = Graph::new(2); +//! let graph = Graph::new(); //! let edges = vec![ //! (1, 2), //! (1, 3), @@ -27,18 +26,24 @@ //! (2, 7), //! ]; //! for (src, dst) in edges { -//! graph.add_edge(0, src, dst, &vec![], None); +//! graph.add_edge(0, src, dst, NO_PROPS, None); //! } //! let results = triplet_count(&graph.at(1), None); //! println!("triplet count: {}", results); //! ``` //! -use crate::core::state::accumulator_id::accumulators::sum; -use crate::core::state::compute_state::ComputeStateVec; -use crate::db::task::context::Context; -use crate::db::task::task::{ATask, Job, Step}; -use crate::db::task::task_runner::TaskRunner; -use crate::db::view_api::{GraphViewOps, VertexViewOps}; +use crate::{ + core::state::{accumulator_id::accumulators::sum, compute_state::ComputeStateVec}, + db::{ + api::view::{GraphViewOps, VertexViewOps}, + task::{ + context::Context, + task::{ATask, Job, Step}, + task_runner::TaskRunner, + vertex::eval_vertex::EvalVertexView, + }, + }, +}; /// Computes the number of both open and closed triplets within a graph /// @@ -56,10 +61,9 @@ use crate::db::view_api::{GraphViewOps, VertexViewOps}; /// # Example /// /// ```rust -/// use raphtory::db::graph::Graph; /// use raphtory::algorithms::triplet_count::triplet_count; -/// use raphtory::db::view_api::*; -/// let graph = Graph::new(2); +/// use raphtory::prelude::*; +/// let graph = Graph::new(); /// let edges = vec![ /// (1, 2), /// (1, 3), @@ -69,7 +73,7 @@ use crate::db::view_api::{GraphViewOps, VertexViewOps}; /// (2, 7), /// ]; /// for (src, dst) in edges { -/// graph.add_edge(0, src, dst, &vec![], None); +/// graph.add_edge(0, src, dst, NO_PROPS, None); /// } /// /// let results = triplet_count(&graph.at(1), None); @@ -87,19 +91,21 @@ pub fn triplet_count(g: &G, threads: Option) -> usize { let 
count = sum::(0); ctx.global_agg(count); - let step1 = ATask::new(move |evv| { - let c1 = evv.neighbours().id().filter(|n| *n != evv.id()).count(); - let c2 = count_two_combinations(c1); - evv.global_update(&count, c2); - Step::Continue - }); + let step1 = ATask::new( + move |evv: &mut EvalVertexView<'_, G, ComputeStateVec, ()>| { + let c1 = evv.neighbours().id().filter(|n| *n != evv.id()).count(); + let c2 = count_two_combinations(c1); + evv.global_update(&count, c2); + Step::Continue + }, + ); let mut runner: TaskRunner = TaskRunner::new(ctx); runner.run( vec![], vec![Job::new(step1)], - (), + None, |egs, _, _, _| egs.finalize(&count), threads, 1, @@ -111,14 +117,19 @@ pub fn triplet_count(g: &G, threads: Option) -> usize { #[cfg(test)] mod triplet_test { use super::*; - use crate::db::graph::Graph; - use crate::db::view_api::*; + use crate::{ + db::{ + api::{mutation::AdditionOps, view::*}, + graph::graph::Graph, + }, + prelude::NO_PROPS, + }; use pretty_assertions::assert_eq; /// Test the global clustering coefficient #[test] fn test_triplet_count() { - let graph = Graph::new(1); + let graph = Graph::new(); // Graph has 2 triangles and 20 triplets let edges = vec![ @@ -145,7 +156,7 @@ mod triplet_test { ]; for (src, dst) in edges { - graph.add_edge(0, src, dst, &vec![], None).unwrap(); + graph.add_edge(0, src, dst, NO_PROPS, None).unwrap(); } let exp_triplet_count = 20; let results = triplet_count(&graph.at(1), None); diff --git a/raphtory/src/core/adj.rs b/raphtory/src/core/adj.rs deleted file mode 100644 index 844e901132..0000000000 --- a/raphtory/src/core/adj.rs +++ /dev/null @@ -1,77 +0,0 @@ -use crate::core::edge_layer::VID; -use crate::core::{tadjset::TAdjSet, Direction}; -use serde::{Deserialize, Serialize}; - -#[derive(Debug, Serialize, Deserialize, PartialEq, Default)] -pub(crate) enum Adj { - #[default] - Solo, - List { - // local: - out: TAdjSet, - into: TAdjSet, - // remote: - remote_out: TAdjSet, - remote_into: TAdjSet, - }, -} - -impl Adj { - 
pub(crate) fn get_edge(&self, v: VID, dir: Direction) -> Option { - match self { - Adj::Solo => None, - Adj::List { - out, - into, - remote_out, - remote_into, - } => match dir { - Direction::OUT => match v { - VID::Remote(v) => remote_out.find(v), - VID::Local(v) => out.find(v), - }, - Direction::IN => match v { - VID::Remote(v) => remote_into.find(v), - VID::Local(v) => into.find(v), - }, - Direction::BOTH => self - .get_edge(v, Direction::OUT) - .or_else(|| self.get_edge(v, Direction::IN)), - }, - } - } - - pub(crate) fn new_out(v: VID, e: usize) -> Self { - match v { - VID::Local(v) => Adj::List { - out: TAdjSet::new(v, e), - into: TAdjSet::default(), - remote_out: TAdjSet::default(), - remote_into: TAdjSet::default(), - }, - VID::Remote(v) => Adj::List { - out: TAdjSet::default(), - into: TAdjSet::default(), - remote_out: TAdjSet::new(v, e), - remote_into: TAdjSet::default(), - }, - } - } - - pub(crate) fn new_into(v: VID, e: usize) -> Self { - match v { - VID::Local(v) => Adj::List { - into: TAdjSet::new(v, e), - out: TAdjSet::default(), - remote_out: TAdjSet::default(), - remote_into: TAdjSet::default(), - }, - VID::Remote(v) => Adj::List { - out: TAdjSet::default(), - into: TAdjSet::default(), - remote_into: TAdjSet::new(v, e), - remote_out: TAdjSet::default(), - }, - } - } -} diff --git a/raphtory/src/core/edge_layer.rs b/raphtory/src/core/edge_layer.rs deleted file mode 100644 index 5e3b2293f5..0000000000 --- a/raphtory/src/core/edge_layer.rs +++ /dev/null @@ -1,753 +0,0 @@ -use itertools::chain; -use itertools::Itertools; -use rayon::prelude::*; -use serde::{Deserialize, Serialize}; -use std::iter; -use std::ops::Range; - -use crate::core::adj::Adj; -use crate::core::edge_ref::EdgeRef; -use crate::core::props::Props; -use crate::core::timeindex::TimeIndex; -use crate::core::{Direction, Prop}; - -#[derive(Clone, Copy, PartialEq, Eq, PartialOrd, Ord)] -pub(crate) enum VID { - Local(usize), - Remote(u64), -} - -impl From for VID { - fn from(value: u64) -> 
Self { - VID::Remote(value) - } -} - -impl From for VID { - fn from(value: usize) -> Self { - VID::Local(value) - } -} - -#[derive(Debug, Serialize, Deserialize, PartialEq)] -pub(crate) struct EdgeLayer { - layer_id: usize, - shard_id: usize, - local_timestamps: Vec, - remote_out_timestamps: Vec, - remote_into_timestamps: Vec, - - // Vector of adjacency lists. It is populated lazyly, so avoid using [] accessor for reading - adj_lists: Vec, - local_props: Props, - remote_out_props: Props, - remote_into_props: Props, -} - -impl EdgeLayer { - pub(crate) fn new(layer_id: usize, shard_id: usize) -> Self { - Self { - layer_id, - shard_id, - adj_lists: Default::default(), - local_props: Default::default(), - remote_out_props: Default::default(), - local_timestamps: Default::default(), - remote_out_timestamps: Default::default(), - remote_into_timestamps: Default::default(), - remote_into_props: Default::default(), - } - } - - fn new_local_out_edge_ref( - &self, - src_pid: usize, - dst_pid: usize, - e_pid: usize, - time: Option, - ) -> EdgeRef { - EdgeRef::LocalOut { - e_pid, - shard_id: self.shard_id, - layer_id: self.layer_id, - src_pid, - dst_pid, - time, - } - } - - fn new_local_into_edge_ref( - &self, - src_pid: usize, - dst_pid: usize, - e_pid: usize, - time: Option, - ) -> EdgeRef { - EdgeRef::LocalInto { - e_pid, - shard_id: self.shard_id, - layer_id: self.layer_id, - src_pid, - dst_pid, - time, - } - } - - fn new_remote_out_edge_ref( - &self, - src_pid: usize, - dst: u64, - e_pid: usize, - time: Option, - ) -> EdgeRef { - EdgeRef::RemoteOut { - e_pid, - shard_id: self.shard_id, - layer_id: self.layer_id, - src_pid, - dst, - time, - } - } - - fn new_remote_into_edge_ref( - &self, - src: u64, - dst_pid: usize, - e_pid: usize, - time: Option, - ) -> EdgeRef { - EdgeRef::RemoteInto { - e_pid, - shard_id: self.shard_id, - layer_id: self.layer_id, - src, - dst_pid, - time, - } - } -} - -// INGESTION: -impl EdgeLayer { - pub(crate) fn add_edge_with_props( - &mut self, - 
t: i64, - src_pid: usize, - dst_pid: usize, - props: &Vec<(String, Prop)>, - ) { - let required_len = std::cmp::max(src_pid, dst_pid) + 1; - let dst = VID::Local(dst_pid); - let src = VID::Local(src_pid); - self.ensure_adj_lists_len(required_len); - let edge_meta = self.get_edge_and_update_time(src_pid, dst, t, Direction::OUT); - self.link_outbound_edge(edge_meta, src_pid, dst); - self.link_inbound_edge(edge_meta, src, dst_pid); - self.local_props.upsert_temporal_props(t, edge_meta, props); - } - - #[allow(unused_variables)] - pub(crate) fn add_edge_remote_out( - &mut self, - t: i64, - src_pid: usize, - dst: u64, - props: &Vec<(String, Prop)>, - ) { - self.ensure_adj_lists_len(src_pid + 1); - let dst = VID::Remote(dst); - let edge_meta = self.get_edge_and_update_time(src_pid, dst, t, Direction::OUT); - self.link_outbound_edge(edge_meta, src_pid, dst); - self.remote_out_props - .upsert_temporal_props(t, edge_meta, props); - } - - #[allow(unused_variables)] - pub(crate) fn add_edge_remote_into( - &mut self, - t: i64, - src: u64, - dst_pid: usize, - props: &Vec<(String, Prop)>, - ) { - let src = VID::Remote(src); - self.ensure_adj_lists_len(dst_pid + 1); - let edge_meta = self.get_edge_and_update_time(dst_pid, src, t, Direction::IN); - self.link_inbound_edge(edge_meta, src, dst_pid); - self.remote_into_props - .upsert_temporal_props(t, edge_meta, props); - } - - pub(crate) fn edge_props_mut(&mut self, edge: EdgeRef) -> &mut Props { - match edge { - EdgeRef::RemoteInto { .. } => &mut self.remote_into_props, - EdgeRef::RemoteOut { .. } => &mut self.remote_out_props, - _ => &mut self.local_props, - } - } - - pub(crate) fn edge_props(&self, edge: EdgeRef) -> &Props { - match edge { - EdgeRef::RemoteInto { .. } => &self.remote_into_props, - EdgeRef::RemoteOut { .. 
} => &self.remote_out_props, - _ => &self.local_props, - } - } -} - -// INGESTION HELPERS: -impl EdgeLayer { - #[inline] - fn ensure_adj_lists_len(&mut self, len: usize) { - if self.adj_lists.len() < len { - self.adj_lists.resize_with(len, Default::default); - } - } - - #[inline] - fn get_adj(&self, v_pid: usize) -> &Adj { - self.adj_lists.get(v_pid).unwrap_or(&Adj::Solo) - } - - fn get_edge_and_update_time( - &mut self, - local_v: usize, - other: VID, - t: i64, - dir: Direction, - ) -> usize { - let timestamps = match other { - VID::Remote(_) => match dir { - Direction::IN => &mut self.remote_into_timestamps, - Direction::OUT => &mut self.remote_out_timestamps, - Direction::BOTH => { - panic!("Internal get_edge function should not be called with `Direction::BOTH`") - } - }, - VID::Local(_) => &mut self.local_timestamps, - }; - match self.adj_lists[local_v].get_edge(other, dir) { - Some(edge) => { - timestamps[edge].insert(t); - edge - } - None => { - let edge = timestamps.len(); - timestamps.push(TimeIndex::one(t)); - edge - } - } - } - - pub(crate) fn link_inbound_edge( - &mut self, - edge: usize, - src: VID, // may or may not be physical id depending on remote_edge flag - dst_pid: usize, - ) { - match &mut self.adj_lists[dst_pid] { - entry @ Adj::Solo => { - *entry = Adj::new_into(src, edge); - } - Adj::List { - into, remote_into, .. - } => match src { - VID::Remote(v) => remote_into.push(v, edge), - VID::Local(v) => into.push(v, edge), - }, - } - } - - pub(crate) fn link_outbound_edge( - &mut self, - edge: usize, - src_pid: usize, - dst: VID, // may or may not pe physical id depending on remote_edge flag - ) { - match &mut self.adj_lists[src_pid] { - entry @ Adj::Solo => { - *entry = Adj::new_out(dst, edge); - } - Adj::List { - out, remote_out, .. 
- } => match dst { - VID::Remote(v) => remote_out.push(v, edge), - VID::Local(v) => out.push(v, edge), - }, - } - } -} - -// SINGLE EDGE ACCESS: -impl EdgeLayer { - pub(crate) fn edge(&self, src: VID, dst: VID, w: Option>) -> Option { - match src { - VID::Local(src_pid) => { - let adj = self.get_adj(src_pid); - match adj { - Adj::Solo => None, - Adj::List { - out, remote_out, .. - } => match dst { - VID::Local(dst_pid) => { - let e = out.find(dst_pid).and_then(|e| match w { - Some(w) => self.local_timestamps[e].active(w).then_some(e), - None => Some(e), - })?; - Some(EdgeRef::LocalOut { - e_pid: e, - shard_id: self.shard_id, - layer_id: self.layer_id, - src_pid, - dst_pid, - time: None, - }) - } - VID::Remote(dst) => { - let e = remote_out.find(dst).and_then(|e| match w { - Some(w) => self.remote_out_timestamps[e].active(w).then_some(e), - None => Some(e), - })?; - Some(EdgeRef::RemoteOut { - e_pid: e, - shard_id: self.shard_id, - layer_id: self.layer_id, - src_pid, - dst, - time: None, - }) - } - }, - } - } - VID::Remote(src) => match dst { - VID::Local(dst_pid) => { - let adj = self.get_adj(dst_pid); - match adj { - Adj::Solo => None, - Adj::List { remote_into, .. } => { - let e = remote_into.find(src).filter(|e| match w { - Some(w) => self.remote_into_timestamps[*e].active(w), - None => true, - })?; - Some(EdgeRef::RemoteInto { - e_pid: e, - shard_id: self.shard_id, - layer_id: self.layer_id, - src, - dst_pid, - time: None, - }) - } - } - } - VID::Remote(_) => None, - }, - } - } - - pub(crate) fn has_edge(&self, src: VID, dst: VID, w: Option>) -> bool { - self.edge(src, dst, w).is_some() - } - - #[inline] - pub(crate) fn get_edge_history(&self, edge: EdgeRef) -> impl Iterator + '_ { - let timestamps = match edge { - EdgeRef::RemoteInto { e_pid, .. } => &self.remote_into_timestamps[e_pid], - EdgeRef::RemoteOut { e_pid, .. 
} => &self.remote_out_timestamps[e_pid], - local_edge => &self.local_timestamps[local_edge.pid()], - }; - timestamps.iter().copied() - } - - #[inline] - pub(crate) fn get_edge_history_window( - &self, - edge: EdgeRef, - w: Range, - ) -> impl Iterator + '_ { - let timestamps = match edge { - EdgeRef::RemoteInto { e_pid, .. } => &self.remote_into_timestamps[e_pid], - EdgeRef::RemoteOut { e_pid, .. } => &self.remote_out_timestamps[e_pid], - local_edge => &self.local_timestamps[local_edge.pid()], - }; - timestamps.range(w).copied() - } - - pub(crate) fn explode_edge(&self, edge: EdgeRef) -> impl Iterator + '_ { - self.get_edge_history(edge).map(move |t| edge.at(t)) - } - - pub(crate) fn explode_edge_window( - &self, - edge: EdgeRef, - w: Range, - ) -> impl Iterator + '_ { - self.get_edge_history_window(edge, w) - .map(move |t| edge.at(t)) - } -} - -// AGGREGATED ACCESS: -impl EdgeLayer { - pub(crate) fn out_edges_len(&self) -> usize { - self.local_timestamps.len() + self.remote_out_timestamps.len() - } - - pub(crate) fn out_edges_len_window(&self, w: &Range) -> usize { - self.local_timestamps - .par_iter() - .filter(|ts| ts.active(w.clone())) - .count() - + self - .remote_out_timestamps - .par_iter() - .filter(|ts| ts.active(w.clone())) - .count() - } -} - -// MULTIPLE EDGE ACCES: -impl EdgeLayer { - pub fn vertex_neighbours( - &self, - v_pid: usize, - d: Direction, - ) -> Box + Send + '_> { - let adj = self.get_adj(v_pid); - match adj { - Adj::Solo => { - let iter: Box + Send + '_> = Box::new(iter::empty()); - iter - } - Adj::List { - out, - into, - remote_out, - remote_into, - } => match d { - Direction::OUT => { - let iter: Box + Send + '_> = Box::new( - out.vertices() - .map_into() - .chain(remote_out.vertices().map_into()), - ); - iter - } - Direction::IN => { - let iter: Box + Send + '_> = Box::new( - into.vertices() - .map_into() - .chain(remote_into.vertices().map_into()), - ); - iter - } - Direction::BOTH => { - let iter: Box + Send + '_> = Box::new( - 
out.vertices() - .merge(into.vertices()) - .dedup() - .map_into() - .chain( - remote_out - .vertices() - .merge(remote_into.vertices()) - .dedup() - .map_into(), - ), - ); - iter - } - }, - } - } - - pub fn vertex_neighbours_window( - &self, - v_pid: usize, - d: Direction, - window: &Range, - ) -> Box + Send + '_> { - let adj = self.get_adj(v_pid); - match adj { - Adj::Solo => { - let iter: Box + Send + '_> = Box::new(iter::empty()); - iter - } - Adj::List { - out, - into, - remote_out, - remote_into, - } => match d { - Direction::OUT => { - let iter: Box + Send + '_> = Box::new( - out.vertices_window(&self.local_timestamps, window) - .map_into() - .chain( - remote_out - .vertices_window(&self.remote_out_timestamps, window) - .map_into(), - ), - ); - iter - } - Direction::IN => { - let iter: Box + Send + '_> = Box::new( - into.vertices_window(&self.local_timestamps, window) - .map_into() - .chain( - remote_into - .vertices_window(&self.remote_into_timestamps, window) - .map_into(), - ), - ); - iter - } - Direction::BOTH => { - let iter: Box + Send + '_> = Box::new( - out.vertices_window(&self.local_timestamps, window) - .merge(into.vertices_window(&self.local_timestamps, window)) - .dedup() - .map_into() - .chain( - remote_out - .vertices_window(&self.remote_out_timestamps, window) - .merge( - remote_into - .vertices_window(&self.remote_into_timestamps, window), - ) - .dedup() - .map_into(), - ), - ); - iter - } - }, - } - } - - pub fn degree(&self, v_pid: usize, d: Direction) -> usize { - let adj = self.get_adj(v_pid); - match adj { - Adj::Solo => 0, - Adj::List { - out, - into, - remote_out, - remote_into, - } => match d { - Direction::OUT => out.len() + remote_out.len(), - Direction::IN => into.len() + remote_into.len(), - Direction::BOTH => { - out.vertices().merge(into.vertices()).dedup().count() - + remote_out - .vertices() - .merge(remote_into.vertices()) - .dedup() - .count() - } - }, - } - } - - pub fn degree_window(&self, v_pid: usize, d: Direction, 
window: &Range) -> usize { - let adj = self.get_adj(v_pid); - match adj { - Adj::Solo => 0, - Adj::List { - out, - remote_out, - into, - remote_into, - } => match d { - Direction::OUT => { - out.len_window(&self.local_timestamps, window) - + remote_out.len_window(&self.remote_out_timestamps, window) - } - Direction::IN => { - into.len_window(&self.local_timestamps, window) - + remote_into.len_window(&self.remote_into_timestamps, window) - } - Direction::BOTH => { - out.vertices_window(&self.local_timestamps, window) - .merge(into.vertices_window(&self.local_timestamps, window)) - .dedup() - .count() - + remote_out - .vertices_window(&self.remote_out_timestamps, window) - .merge( - remote_into.vertices_window(&self.remote_into_timestamps, window), - ) - .dedup() - .count() - } - }, - } - } - - pub(crate) fn vertex_edges_iter( - &self, - v_pid: usize, - d: Direction, - ) -> Box + Send + '_> { - match self.get_adj(v_pid) { - Adj::List { - out, - into, - remote_out, - remote_into, - } => match d { - Direction::OUT => Box::new( - out.iter() - .map(move |(dst_pid, e)| { - self.new_local_out_edge_ref(v_pid, dst_pid, e, None) - }) - .chain(remote_out.iter().map(move |(dst, e)| { - self.new_remote_out_edge_ref(v_pid, dst, e, None) - })), - ), - Direction::IN => Box::new( - into.iter() - .map(move |(src_pid, e)| { - self.new_local_into_edge_ref(src_pid, v_pid, e, None) - }) - .chain(remote_into.iter().map(move |(src, e)| { - self.new_remote_into_edge_ref(src, v_pid, e, None) - })), - ), - - Direction::BOTH => { - let remote = remote_out - .iter() - .map(move |(dst, e)| { - (dst, self.new_remote_out_edge_ref(v_pid, dst, e, None)) - }) - .merge_by( - remote_into.iter().map(move |(src, e)| { - (src, self.new_remote_into_edge_ref(src, v_pid, e, None)) - }), - |(left, _), (right, _)| left < right, - ) - .map(|item| item.1); - - let local = out - .iter() - .map(move |(dst_pid, e)| { - ( - dst_pid, - self.new_local_out_edge_ref(v_pid, dst_pid, e, None), - ) - }) - .merge_by( - 
into.iter().map(move |(src_pid, e)| { - ( - src_pid, - self.new_local_into_edge_ref(src_pid, v_pid, e, None), - ) - }), - |(left, _), (right, _)| left < right, - ) - .map(|item| item.1); - Box::new(chain!(local, remote)) - } - }, - _ => Box::new(std::iter::empty()), - } - } - - pub(crate) fn vertex_edges_iter_window( - &self, - v_pid: usize, - r: &Range, - d: Direction, - ) -> Box + Send + '_> { - match self.get_adj(v_pid) { - Adj::List { - out, - into, - remote_out, - remote_into, - } => match d { - Direction::OUT => Box::new(chain!( - out.iter_window(&self.local_timestamps, r) - .map(move |(dst_pid, e)| self - .new_local_out_edge_ref(v_pid, dst_pid, e, None)), - remote_out - .iter_window(&self.remote_out_timestamps, r) - .map(move |(dst, e)| self.new_remote_out_edge_ref(v_pid, dst, e, None)) - )), - Direction::IN => { - let iter = chain!( - into.iter_window(&self.local_timestamps, r) - .map(move |(src_pid, e)| self - .new_local_into_edge_ref(src_pid, v_pid, e, None)), - remote_into - .iter_window(&self.remote_into_timestamps, r) - .map(move |(src, e)| self.new_remote_into_edge_ref(src, v_pid, e, None)) - ); - Box::new(iter) - } - Direction::BOTH => Box::new(chain!( - out.iter_window(&self.local_timestamps, r) - .map(move |(dst_pid, e)| ( - dst_pid, - self.new_local_out_edge_ref(v_pid, dst_pid, e, None) - )) - .merge_by( - into.iter_window(&self.local_timestamps, r) - .map(move |(src_pid, e)| ( - src_pid, - self.new_local_into_edge_ref(src_pid, v_pid, e, None) - )), - |left, right| left.0 < right.0 - ) - .map(|item| item.1), - remote_out - .iter_window(&self.remote_out_timestamps, r) - .map(move |(dst, e)| ( - dst, - self.new_remote_out_edge_ref(v_pid, dst, e, None) - )) - .merge_by( - remote_into - .iter_window(&self.remote_into_timestamps, r) - .map(move |(src, e)| ( - src, - self.new_remote_into_edge_ref(src, v_pid, e, None) - )), - |left, right| left.0 < right.0 - ) - .map(|item| item.1) - )), - }, - _ => Box::new(std::iter::empty()), - } - } - - pub(crate) fn 
vertex_edges_iter_t( - // TODO: change back to private if appropriate - &self, - v_pid: usize, - d: Direction, - ) -> Box + Send + '_> { - Box::new( - self.vertex_edges_iter(v_pid, d) - .flat_map(|e| self.explode_edge(e)), - ) - } - - pub(crate) fn vertex_edges_iter_window_t<'a>( - // TODO: change back to private if appropriate - &'a self, - v_pid: usize, - w: &'a Range, - d: Direction, - ) -> Box + Send + '_> { - Box::new( - self.vertex_edges_iter_window(v_pid, w, d) - .flat_map(|e| self.explode_edge_window(e, w.clone())), - ) - } -} diff --git a/raphtory/src/core/edge_ref.rs b/raphtory/src/core/edge_ref.rs deleted file mode 100644 index 0a91a3f6ed..0000000000 --- a/raphtory/src/core/edge_ref.rs +++ /dev/null @@ -1,210 +0,0 @@ -use crate::core::vertex_ref::VertexRef; - -#[derive(Debug, Copy, Clone, PartialEq)] -pub enum EdgeRef { - RemoteInto { - e_pid: usize, - shard_id: usize, - layer_id: usize, - src: u64, - dst_pid: usize, - time: Option, - }, - RemoteOut { - e_pid: usize, - shard_id: usize, - layer_id: usize, - src_pid: usize, - dst: u64, - time: Option, - }, - LocalInto { - e_pid: usize, - shard_id: usize, - layer_id: usize, - src_pid: usize, - dst_pid: usize, - time: Option, - }, - LocalOut { - e_pid: usize, - shard_id: usize, - layer_id: usize, - src_pid: usize, - dst_pid: usize, - time: Option, - }, -} - -impl EdgeRef { - #[inline(always)] - pub fn shard(&self) -> usize { - match &self { - EdgeRef::RemoteInto { shard_id, .. } => *shard_id, - EdgeRef::RemoteOut { shard_id, .. } => *shard_id, - EdgeRef::LocalInto { shard_id, .. } => *shard_id, - EdgeRef::LocalOut { shard_id, .. } => *shard_id, - } - } - - #[inline(always)] - pub fn layer(&self) -> usize { - match &self { - EdgeRef::RemoteInto { layer_id, .. } => *layer_id, - EdgeRef::RemoteOut { layer_id, .. } => *layer_id, - EdgeRef::LocalInto { layer_id, .. } => *layer_id, - EdgeRef::LocalOut { layer_id, .. 
} => *layer_id, - } - } - - #[inline(always)] - pub fn time(&self) -> Option { - match self { - EdgeRef::RemoteInto { time, .. } => *time, - EdgeRef::RemoteOut { time, .. } => *time, - EdgeRef::LocalInto { time, .. } => *time, - EdgeRef::LocalOut { time, .. } => *time, - } - } - - pub fn src(&self) -> VertexRef { - match self { - EdgeRef::RemoteInto { src, .. } => VertexRef::Remote(*src), - EdgeRef::RemoteOut { - src_pid, shard_id, .. - } => VertexRef::new_local(*src_pid, *shard_id), - EdgeRef::LocalInto { - src_pid, shard_id, .. - } => VertexRef::new_local(*src_pid, *shard_id), - EdgeRef::LocalOut { - src_pid, shard_id, .. - } => VertexRef::new_local(*src_pid, *shard_id), - } - } - - pub fn dst(&self) -> VertexRef { - match self { - EdgeRef::RemoteInto { - dst_pid, shard_id, .. - } => VertexRef::new_local(*dst_pid, *shard_id), - EdgeRef::RemoteOut { dst, .. } => VertexRef::Remote(*dst), - EdgeRef::LocalInto { - dst_pid, shard_id, .. - } => VertexRef::new_local(*dst_pid, *shard_id), - EdgeRef::LocalOut { - dst_pid, shard_id, .. - } => VertexRef::new_local(*dst_pid, *shard_id), - } - } - - pub fn remote(&self) -> VertexRef { - match self { - EdgeRef::RemoteInto { .. } => self.src(), - EdgeRef::RemoteOut { .. } => self.dst(), - EdgeRef::LocalInto { .. } => self.src(), - EdgeRef::LocalOut { .. } => self.dst(), - } - } - - pub fn local(&self) -> VertexRef { - match self { - EdgeRef::RemoteInto { .. } => self.dst(), - EdgeRef::RemoteOut { .. } => self.src(), - EdgeRef::LocalInto { .. } => self.dst(), - EdgeRef::LocalOut { .. } => self.src(), - } - } - - pub fn is_remote(&self) -> bool { - match self { - EdgeRef::RemoteInto { .. } => true, - EdgeRef::RemoteOut { .. } => true, - EdgeRef::LocalInto { .. } => false, - EdgeRef::LocalOut { .. } => false, - } - } - - pub fn is_local(&self) -> bool { - !self.is_remote() - } - - #[inline(always)] - pub(in crate::core) fn pid(&self) -> usize { - match self { - EdgeRef::RemoteInto { e_pid, .. 
} => *e_pid, - EdgeRef::RemoteOut { e_pid, .. } => *e_pid, - EdgeRef::LocalInto { e_pid, .. } => *e_pid, - EdgeRef::LocalOut { e_pid, .. } => *e_pid, - } - } - - pub(in crate::core) fn merge_cmp(&self, other: &EdgeRef) -> bool { - (self.local(), self.remote(), self.time(), self.layer()) - < (other.local(), other.remote(), other.time(), other.layer()) - } - - pub fn at(&self, time: i64) -> Self { - match *self { - EdgeRef::RemoteInto { - e_pid, - shard_id, - layer_id, - src, - dst_pid, - .. - } => EdgeRef::RemoteInto { - time: Some(time), - e_pid, - shard_id, - layer_id, - src, - dst_pid, - }, - EdgeRef::RemoteOut { - e_pid, - shard_id, - layer_id, - src_pid, - dst, - .. - } => EdgeRef::RemoteOut { - time: Some(time), - e_pid, - shard_id, - layer_id, - src_pid, - dst, - }, - EdgeRef::LocalInto { - e_pid, - shard_id, - layer_id, - src_pid, - dst_pid, - .. - } => EdgeRef::LocalInto { - time: Some(time), - e_pid, - shard_id, - layer_id, - src_pid, - dst_pid, - }, - EdgeRef::LocalOut { - e_pid, - shard_id, - layer_id, - src_pid, - dst_pid, - .. 
- } => EdgeRef::LocalOut { - time: Some(time), - e_pid, - shard_id, - layer_id, - src_pid, - dst_pid, - }, - } - } -} diff --git a/raphtory/src/core/entities/edges/edge.rs b/raphtory/src/core/entities/edges/edge.rs new file mode 100644 index 0000000000..620e4c031c --- /dev/null +++ b/raphtory/src/core/entities/edges/edge.rs @@ -0,0 +1,289 @@ +use crate::core::{ + entities::{ + edges::edge_store::EdgeStore, + graph::{ + tgraph::TGraph, + tgraph_storage::{GraphEntry, LockedGraphStorage}, + }, + properties::tprop::{LockedLayeredTProp, TProp}, + vertices::vertex::Vertex, + GraphItem, LayerIds, VRef, EID, VID, + }, + storage::{ + locked_view::LockedView, + timeindex::{LayeredIndex, TimeIndex, TimeIndexOps}, + Entry, + }, + Direction, Prop, +}; +// use crate::prelude::Layer::Default; +use crate::core::storage::timeindex::{LockedLayeredIndex, TimeIndexEntry}; +use std::{ + default::Default, + ops::{Deref, Range}, + sync::Arc, +}; + +#[derive(Debug)] +pub(crate) enum ERef<'a, const N: usize> { + ERef(Entry<'a, EdgeStore, N>), + ELock { + lock: Arc>, + eid: EID, + }, +} + +// impl fn edge_id for ERef +impl<'a, const N: usize> ERef<'a, N> { + pub(crate) fn edge_id(&self) -> EID { + match self { + ERef::ELock { lock: _, eid } => *eid, + ERef::ERef(es) => es.index().into(), + } + } + + fn vertex_ref(&self, src: VID) -> Option> { + match self { + ERef::ELock { lock, .. 
} => { + Some(VRef::LockedEntry(GraphEntry::new(lock.clone(), src.into()))) + } + _ => None, + } + } +} + +impl<'a, const N: usize> Deref for ERef<'a, N> { + type Target = EdgeStore; + + fn deref(&self) -> &Self::Target { + match self { + ERef::ERef(e) => e, + ERef::ELock { lock, eid } => lock.get_edge((*eid).into()), + } + } +} + +impl<'a, const N: usize> GraphItem<'a, N> for EdgeView<'a, N> { + fn from_edge_ids( + src: VID, + dst: VID, + e_id: ERef<'a, N>, + dir: Direction, + graph: &'a TGraph, + ) -> Self { + EdgeView::from_edge_ids(src, dst, e_id, dir, graph) + } +} +#[derive(Debug)] +pub struct EdgeView<'a, const N: usize> { + src: VID, + dst: VID, + edge_id: ERef<'a, N>, + dir: Direction, + graph: &'a TGraph, +} + +impl<'a, const N: usize> PartialEq for EdgeView<'a, N> { + fn eq(&self, other: &Self) -> bool { + self.edge_id.edge_id() == other.edge_id.edge_id() + && self.src == other.src + && self.dst == other.dst + } +} + +impl<'a, const N: usize> PartialOrd for EdgeView<'a, N> { + fn partial_cmp(&self, other: &Self) -> Option { + self.origin() + .eq(&other.origin()) + .then(|| self.neighbour().cmp(&other.neighbour())) + } +} + +impl<'a, const N: usize> EdgeView<'a, N> { + pub(crate) fn additions( + self, + layer_ids: LayerIds, + ) -> Option> { + match self.edge_id { + ERef::ERef(entry) => { + let t_index = entry.map(|entry| entry.additions()); + Some(LayeredIndex::new(layer_ids, t_index)) + } + _ => None, + } + } + + pub(crate) fn deletions( + self, + layer_ids: LayerIds, + ) -> Option> { + match self.edge_id { + ERef::ERef(entry) => { + let t_index = entry.map(|entry| entry.deletions()); + Some(LayeredIndex::new(layer_ids, t_index)) + } + _ => None, + } + } + + pub(crate) fn temporal_property( + self, + layer_ids: LayerIds, + prop_id: usize, + ) -> Option> { + match self.edge_id { + ERef::ERef(entry) => { + if entry.has_temporal_prop(&layer_ids, prop_id) { + match layer_ids { + LayerIds::None => None, + LayerIds::All => { + let props: Vec<_> = entry + 
.layer_ids_iter() + .flat_map(|id| { + entry.temporal_prop_layer(id, prop_id).is_some().then(|| { + entry + .clone() + .map(|e| e.temporal_prop_layer(id, prop_id).unwrap()) + }) + }) + .collect(); + Some(LockedLayeredTProp::new(props)) + } + LayerIds::One(id) => Some(LockedLayeredTProp::new(vec![entry.map(|e| { + e.temporal_prop_layer(id, prop_id) + .expect("already checked in the beginning") + })])), + LayerIds::Multiple(ids) => { + let props: Vec<_> = ids + .iter() + .flat_map(|&id| { + entry.temporal_prop_layer(id, prop_id).is_some().then(|| { + entry + .clone() + .map(|e| e.temporal_prop_layer(id, prop_id).unwrap()) + }) + }) + .collect(); + Some(LockedLayeredTProp::new(props)) + } + } + } else { + None + } + } + _ => None, + } + } + + fn neighbour(&self) -> VID { + match self.dir { + Direction::OUT => self.dst, + Direction::IN => self.src, + _ => panic!("Invalid direction"), // FIXME: perhaps we should have 2 enums for direction one strict and one not + } + } + + fn origin(&self) -> VID { + match self.dir { + Direction::OUT => self.src, + Direction::IN => self.dst, + _ => panic!("Invalid direction"), // FIXME: perhaps we should have 2 enums for direction one strict and one not + } + } + + pub fn src_id(&self) -> VID { + self.src + } + + pub fn dst_id(&self) -> VID { + self.dst + } + + pub fn edge_id(&self) -> EID { + self.edge_id.edge_id() + } + + pub fn src(&self) -> Vertex<'a, N> { + if let Some(v_ref) = self.edge_id.vertex_ref(self.src) { + Vertex::new(v_ref, self.graph) + } else { + self.graph.vertex(self.src) + } + } + + pub fn dst(&self) -> Vertex<'a, N> { + if let Some(v_ref) = self.edge_id.vertex_ref(self.dst) { + Vertex::new(v_ref, self.graph) + } else { + self.graph.vertex(self.dst) + } + } + + pub(crate) fn from_edge_ids( + v1: VID, // the initiator of the edges call + v2: VID, // the edge on the other side + edge_id: ERef<'a, N>, + dir: Direction, + graph: &'a TGraph, + ) -> Self { + let (src, dst) = match dir { + Direction::OUT => (v1, v2), + 
Direction::IN => (v2, v1), + _ => panic!("Invalid direction"), + }; + EdgeView { + src, + dst, + edge_id, + graph, + dir, + } + } + + pub(crate) fn from_entry(entry: Entry<'a, EdgeStore, N>, graph: &'a TGraph) -> Self { + Self { + src: entry.src().into(), + dst: entry.dst().into(), + edge_id: ERef::ERef(entry), + dir: Direction::OUT, + graph, + } + } + + pub(crate) fn active(&'a self, layer_ids: LayerIds, w: Range) -> bool { + match &self.edge_id { + ERef::ELock { lock, .. } => { + let e = lock.get_edge(self.edge_id().into()); + self.check_layers(layer_ids, e, |t| t.active(w.clone())) + } + ERef::ERef(entry) => { + let e = entry.deref(); + self.check_layers(layer_ids, e, |t| t.active(w.clone())) + } + } + } + + fn check_layers, F: Fn(&TimeIndex) -> bool>( + &self, + layer_ids: LayerIds, + e: E, + f: F, + ) -> bool { + match layer_ids { + LayerIds::All => e.additions().iter().any(f), + LayerIds::One(id) => f(&e.additions()[id]), + LayerIds::Multiple(ids) => ids.iter().any(|id| f(&e.additions()[*id])), + LayerIds::None => false, + } + } + + pub(crate) fn layer_ids(&self) -> LayerIds { + match &self.edge_id { + ERef::ELock { lock, .. 
} => { + let e = lock.get_edge(self.edge_id().into()); + e.layer_ids() + } + ERef::ERef(entry) => (*entry).layer_ids(), + } + } +} diff --git a/raphtory/src/core/entities/edges/edge_ref.rs b/raphtory/src/core/entities/edges/edge_ref.rs new file mode 100644 index 0000000000..dcb42274c4 --- /dev/null +++ b/raphtory/src/core/entities/edges/edge_ref.rs @@ -0,0 +1,142 @@ +use crate::core::{ + entities::{vertices::vertex_ref::VertexRef, EID, VID}, + storage::timeindex::{AsTime, TimeIndexEntry}, +}; +use std::cmp::Ordering; + +#[derive(Debug, Copy, Clone, PartialEq)] +pub struct EdgeRef { + e_pid: EID, + src_pid: VID, + dst_pid: VID, + e_type: Dir, + time: Option, + layer_id: Option, +} + +// This is used for merging iterators of EdgeRefs and only makes sense if the local vertex for both +// sides is the same +impl PartialOrd for EdgeRef { + fn partial_cmp(&self, other: &Self) -> Option { + self.remote().partial_cmp(&other.remote()) + } +} + +#[derive(Debug, Copy, Clone, PartialEq)] +pub enum Dir { + Into, + Out, +} + +impl EdgeRef { + #[inline] + pub fn new_outgoing(e_pid: EID, src_pid: VID, dst_pid: VID) -> Self { + EdgeRef { + e_pid, + src_pid, + dst_pid, + e_type: Dir::Out, + time: None, + layer_id: None, + } + } + + #[inline] + pub fn new_incoming(e_pid: EID, src_pid: VID, dst_pid: VID) -> Self { + EdgeRef { + e_pid, + src_pid, + dst_pid, + e_type: Dir::Into, + time: None, + layer_id: None, + } + } + + #[inline] + pub fn new(e_pid: EID, local_pid: VID, remote_pid: VID, dir: Dir) -> Self { + match dir { + Dir::Out => EdgeRef { + e_pid, + src_pid: local_pid, + dst_pid: remote_pid, + e_type: dir, + time: None, + layer_id: None, + }, + Dir::Into => EdgeRef { + e_pid, + src_pid: remote_pid, + dst_pid: local_pid, + e_type: dir, + time: None, + layer_id: None, + }, + } + } + + #[inline(always)] + pub fn layer(&self) -> Option<&usize> { + self.layer_id.as_ref() + } + + #[inline(always)] + pub fn time(&self) -> Option { + self.time + } + + #[inline(always)] + pub fn 
time_t(&self) -> Option { + self.time.map(|t| *t.t()) + } + + #[inline] + pub fn dir(&self) -> Dir { + self.e_type + } + + #[inline] + pub fn src(&self) -> VID { + self.src_pid + } + + #[inline] + pub fn dst(&self) -> VID { + self.dst_pid + } + + #[inline] + pub fn remote(&self) -> VID { + match self.e_type { + Dir::Into => self.src(), + Dir::Out => self.dst(), + } + } + + #[inline] + pub fn local(&self) -> VID { + match self.e_type { + Dir::Into => self.dst(), + Dir::Out => self.src(), + } + } + + #[inline(always)] + pub(crate) fn pid(&self) -> EID { + self.e_pid + } + + #[inline] + pub fn at(&self, time: TimeIndexEntry) -> Self { + let mut e_ref = *self; + e_ref.time = Some(time); + e_ref + } + + #[inline] + pub fn at_layer(&self, layer: usize) -> Self { + let mut e_ref = *self; + e_ref.layer_id = Some(layer); + e_ref + } +} diff --git a/raphtory/src/core/entities/edges/edge_store.rs b/raphtory/src/core/entities/edges/edge_store.rs new file mode 100644 index 0000000000..3453ad31c0 --- /dev/null +++ b/raphtory/src/core/entities/edges/edge_store.rs @@ -0,0 +1,425 @@ +use crate::{ + core::{ + entities::{ + edges::edge_ref::EdgeRef, + properties::{props::Props, tprop::TProp}, + LayerIds, EID, VID, + }, + storage::{ + lazy_vec::IllegalSet, + locked_view::LockedView, + timeindex::{TimeIndex, TimeIndexEntry, TimeIndexOps}, + }, + utils::errors::{GraphError, MutateGraphError}, + Prop, + }, + prelude::TimeOps, +}; +use itertools::Itertools; +use serde::{Deserialize, Serialize}; +use std::ops::{Deref, DerefMut, Range}; +use tantivy::HasLen; + +#[derive(Serialize, Deserialize, Debug, Default, PartialEq)] +pub struct EdgeStore { + pub(crate) eid: EID, + src: VID, + dst: VID, + layers: Vec, // each layer has its own set of properties + additions: Vec>, + deletions: Vec>, +} + +#[derive(Serialize, Deserialize, Debug, Default, PartialEq)] +pub struct EdgeLayer { + props: Option, // memory optimisation: only allocate props if needed +} + +impl EdgeLayer { + pub fn props(&self) 
-> Option<&Props> { + self.props.as_ref() + } + + pub fn add_prop( + &mut self, + t: TimeIndexEntry, + prop_id: usize, + prop: Prop, + ) -> Result<(), GraphError> { + let props = self.props.get_or_insert_with(|| Props::new()); + props.add_prop(t, prop_id, prop) + } + + pub fn add_constant_prop( + &mut self, + prop_id: usize, + prop: Prop, + ) -> Result<(), IllegalSet>> { + let props = self.props.get_or_insert_with(|| Props::new()); + props.add_constant_prop(prop_id, prop) + } + + pub(crate) fn const_prop_ids(&self) -> impl Iterator + '_ { + self.props + .as_ref() + .into_iter() + .flat_map(|props| props.const_prop_ids()) + } + + pub(crate) fn const_prop(&self, prop_id: usize) -> Option<&Prop> { + self.props.as_ref().and_then(|ps| ps.const_prop(prop_id)) + } + + pub(crate) fn temporal_property(&self, prop_id: usize) -> Option<&TProp> { + self.props.as_ref().and_then(|ps| ps.temporal_prop(prop_id)) + } + + pub(crate) fn temporal_properties<'a>( + &'a self, + prop_id: usize, + window: Option>, + ) -> Box + 'a> { + if let Some(window) = window { + self.props + .as_ref() + .map(|props| props.temporal_props_window(prop_id, window.start, window.end)) + .unwrap_or_else(|| Box::new(std::iter::empty())) + } else { + self.props + .as_ref() + .map(|props| props.temporal_props(prop_id)) + .unwrap_or_else(|| Box::new(std::iter::empty())) + } + } +} + +impl> From for EdgeRef { + fn from(val: E) -> Self { + EdgeRef::new_outgoing(val.e_id(), val.src(), val.dst()) + } +} + +impl EdgeStore { + fn get_or_allocate_layer(&mut self, layer_id: usize) -> &mut EdgeLayer { + if self.layers.len() <= layer_id { + self.layers.resize_with(layer_id + 1, Default::default); + } + &mut self.layers[layer_id] + } + + pub fn has_layer(&self, layers: &LayerIds) -> bool { + match layers { + LayerIds::All => true, + LayerIds::One(layer_ids) => { + self.additions + .get(*layer_ids) + .filter(|t_index| !t_index.is_empty()) + .is_some() + || self + .deletions + .get(*layer_ids) + .filter(|t_index| 
!t_index.is_empty()) + .is_some() + } + LayerIds::Multiple(layer_ids) => layer_ids + .iter() + .any(|layer_id| self.has_layer(&LayerIds::One(*layer_id))), + LayerIds::None => false, + } + } + + // an edge is in a layer if it has either deletions or additions in that layer + pub fn layer_ids(&self) -> LayerIds { + let layer_ids = self.layer_ids_iter().collect::>(); + if layer_ids.len() == 1 { + LayerIds::One(layer_ids[0]) + } else { + LayerIds::Multiple(layer_ids.into()) + } + } + + pub fn layer_iter(&self) -> impl Iterator + '_ { + self.layers.iter() + } + pub fn layer_ids_iter(&self) -> impl Iterator + '_ { + let layer_ids = self + .additions + .iter() + .enumerate() + .zip_longest(self.deletions.iter().enumerate()) + .flat_map(|e| match e { + itertools::EitherOrBoth::Both((i, t1), (_, t2)) => { + if !t1.is_empty() || !t2.is_empty() { + Some(i) + } else { + None + } + } + itertools::EitherOrBoth::Left((i, t)) => { + if !t.is_empty() { + Some(i) + } else { + None + } + } + itertools::EitherOrBoth::Right((i, t)) => { + if !t.is_empty() { + Some(i) + } else { + None + } + } + }); + layer_ids + } + + pub fn layer_ids_window_iter(&self, w: Range) -> impl Iterator + '_ { + let layer_ids = self + .additions + .iter() + .enumerate() + .zip_longest(self.deletions.iter().enumerate()) + .flat_map(move |e| match e { + itertools::EitherOrBoth::Both((i, t1), (_, t2)) => { + if t1.contains(w.clone()) || t2.contains(w.clone()) { + Some(i) + } else { + None + } + } + itertools::EitherOrBoth::Left((i, t)) => { + if t.contains(w.clone()) { + Some(i) + } else { + None + } + } + itertools::EitherOrBoth::Right((i, t)) => { + if t.contains(w.clone()) { + Some(i) + } else { + None + } + } + }); + + layer_ids + } + + pub fn new(src: VID, dst: VID) -> Self { + Self { + eid: 0.into(), + src, + dst, + layers: Vec::with_capacity(1), + additions: Vec::with_capacity(1), + deletions: Vec::with_capacity(1), + } + } + + pub fn layer(&self, layer_id: usize) -> Option<&EdgeLayer> { + 
self.layers.get(layer_id) + } + + pub fn additions(&self) -> &Vec> { + &self.additions + } + + pub fn deletions(&self) -> &Vec> { + &self.deletions + } + + /// an edge is active in a window if it has an addition event in any of the layers + pub fn active(&self, layer_ids: &LayerIds, w: Range) -> bool { + match layer_ids { + LayerIds::None => false, + LayerIds::All => self + .additions() + .iter() + .any(|t_index| t_index.contains(w.clone())), + LayerIds::One(l_id) => self + .additions() + .get(*l_id) + .map(|t_index| t_index.contains(w)) + .unwrap_or(false), + LayerIds::Multiple(layers) => layers + .iter() + .any(|l_id| self.active(&LayerIds::One(*l_id), w.clone())), + } + } + + pub fn last_deletion(&self, layer_ids: &LayerIds) -> Option<&TimeIndexEntry> { + match layer_ids { + LayerIds::None => None, + LayerIds::All => self.deletions().iter().flat_map(|d| d.last()).max(), + LayerIds::One(id) => self.deletions.get(*id).and_then(|t| t.last()), + LayerIds::Multiple(ids) => ids + .iter() + .flat_map(|id| self.deletions.get(*id).and_then(|t| t.last())) + .max(), + } + } + + pub fn last_addition(&self, layer_ids: &LayerIds) -> Option<&TimeIndexEntry> { + match layer_ids { + LayerIds::None => None, + LayerIds::All => self.additions().iter().flat_map(|d| d.last()).max(), + LayerIds::One(id) => self.additions.get(*id).and_then(|t| t.last()), + LayerIds::Multiple(ids) => ids + .iter() + .flat_map(|id| self.additions.get(*id).and_then(|t| t.last())) + .max(), + } + } + + pub fn last_deletion_before(&self, layer_ids: &LayerIds, t: i64) -> Option { + match layer_ids { + LayerIds::None => None, + LayerIds::All => self + .deletions() + .iter() + .flat_map(|dels| dels.range(i64::MIN..t).last_t()) + .max(), + LayerIds::One(id) => { + let layer = self.deletions.get(*id)?; + layer.range(i64::MIN..t).last_t() + } + LayerIds::Multiple(ids) => ids + .iter() + .flat_map(|id| { + self.deletions + .get(*id) + .and_then(|t_index| t_index.range(i64::MIN..t).last_t()) + }) + .max(), + } + } 
+ + pub fn has_temporal_prop(&self, layer_ids: &LayerIds, prop_id: usize) -> bool { + match layer_ids { + LayerIds::None => false, + LayerIds::All => self.layer_ids_iter().any(|id| { + self.layer(id) + .and_then(|layer| layer.temporal_property(prop_id)) + .is_some() + }), + LayerIds::One(id) => self + .layer(*id) + .and_then(|layer| layer.temporal_property(prop_id)) + .is_some(), + LayerIds::Multiple(ids) => ids.iter().any(|id| { + self.layer(*id) + .and_then(|layer| layer.temporal_property(prop_id)) + .is_some() + }), + } + } + + pub fn has_temporal_prop_window( + &self, + layer_ids: LayerIds, + prop_id: usize, + w: Range, + ) -> bool { + match layer_ids { + LayerIds::None => false, + LayerIds::All => self.layer_ids_iter().any(|id| { + self.layer(id) + .and_then(|layer| { + layer + .temporal_property(prop_id) + .filter(|p| p.iter_window(w.clone()).next().is_some()) + }) + .is_some() + }), + LayerIds::One(id) => self + .layer(id) + .and_then(|layer| { + layer + .temporal_property(prop_id) + .filter(|p| p.iter_window(w.clone()).next().is_some()) + }) + .is_some(), + LayerIds::Multiple(ids) => ids.iter().any(|id| { + self.layer(*id) + .and_then(|layer| { + layer + .temporal_property(prop_id) + .filter(|p| p.iter_window(w.clone()).next().is_some()) + }) + .is_some() + }), + } + } + + pub fn temporal_prop_layer(&self, layer_id: usize, prop_id: usize) -> Option<&TProp> { + self.layers + .get(layer_id) + .and_then(|layer| layer.temporal_property(prop_id)) + } + + pub fn layer_mut(&mut self, layer_id: usize) -> impl DerefMut + '_ { + self.get_or_allocate_layer(layer_id) + } + + pub fn deletions_mut(&mut self, layer_id: usize) -> &mut TimeIndex { + if self.deletions.len() <= layer_id { + self.deletions.resize_with(layer_id + 1, Default::default); + } + &mut self.deletions[layer_id] + } + + pub fn additions_mut(&mut self, layer_id: usize) -> &mut TimeIndex { + if self.additions.len() <= layer_id { + self.additions.resize_with(layer_id + 1, Default::default); + } + &mut 
self.additions[layer_id] + } + + pub fn src(&self) -> VID { + self.src + } + + pub fn dst(&self) -> VID { + self.dst + } + + pub fn e_id(&self) -> EID { + self.eid + } + + pub(crate) fn props(&self, layer_id: Option) -> Box + '_> { + if let Some(layer_id) = layer_id { + let iter = self + .layers + .get(layer_id) + .into_iter() + .flat_map(|layer| layer.props()); + Box::new(iter) + } else { + Box::new(self.layers.iter().flat_map(|layer| layer.props())) + } + } + + pub(crate) fn temp_prop_ids( + &self, + layer_id: Option, + ) -> Box + '_> { + if let Some(layer_id) = layer_id { + Box::new(self.layers.get(layer_id).into_iter().flat_map(|layer| { + layer + .props() + .into_iter() + .flat_map(|props| props.temporal_prop_ids()) + })) + } else { + Box::new( + self.layers + .iter() + .flat_map(|layer| layer.props().map(|prop| prop.temporal_prop_ids())) + .kmerge() + .dedup(), + ) + } + } +} diff --git a/raphtory/src/core/entities/edges/mod.rs b/raphtory/src/core/entities/edges/mod.rs new file mode 100644 index 0000000000..28c344e2dd --- /dev/null +++ b/raphtory/src/core/entities/edges/mod.rs @@ -0,0 +1,3 @@ +pub(crate) mod edge; +pub mod edge_ref; +pub mod edge_store; diff --git a/raphtory/src/core/entities/graph/mod.rs b/raphtory/src/core/entities/graph/mod.rs new file mode 100644 index 0000000000..42c9d80327 --- /dev/null +++ b/raphtory/src/core/entities/graph/mod.rs @@ -0,0 +1,77 @@ +pub mod tgraph; +pub mod tgraph_storage; +pub(crate) mod timer; + +#[cfg(test)] +mod test { + use crate::{ + core::{Direction, PropType}, + db::api::mutation::internal::InternalAdditionOps, + prelude::{IntoProp, Prop, NO_PROPS}, + }; + + use super::{tgraph::InnerTemporalGraph, *}; + + #[test] + fn test_neighbours_multiple_layers() { + let g: InnerTemporalGraph<2> = InnerTemporalGraph::default(); + let l_btc = g.resolve_layer(Some("btc")); + let l_eth = g.resolve_layer(Some("eth")); + let l_tether = g.resolve_layer(Some("tether")); + let v1 = g.resolve_vertex(1, None); + let v2 = 
g.resolve_vertex(2, None); + let tx_sent_id = g + .resolve_edge_property("tx_sent", PropType::I32, false) + .unwrap(); + g.inner() + .add_edge_internal(1.into(), v1, v2, vec![(tx_sent_id, Prop::I32(10))], l_btc); + g.inner() + .add_edge_internal(1.into(), v1, v2, vec![(tx_sent_id, Prop::I32(20))], l_eth); + g.inner().add_edge_internal( + 1.into(), + v1, + v2, + vec![(tx_sent_id, Prop::I32(70))], + l_tether, + ); + + let first = g.inner().vertex(0.into()); + + let ns = first + .neighbours(vec!["btc", "eth"], Direction::OUT) + .map(|v| v.id().0) + .collect::>(); + + assert_eq!(ns, vec![1]); + + let first = g.inner().vertex_arc(0.into()); + let edges = first + .edge_tuples([0, 1, 2, 3, 4].into(), Direction::OUT) + .collect::>(); + + assert_eq!(edges.len(), 1, "should only have one edge {:?}", edges); + } + + #[test] + fn simple_triangle() { + let g: InnerTemporalGraph<2> = InnerTemporalGraph::default(); + let v1 = g.resolve_vertex(1, None); + let v2 = g.resolve_vertex(2, None); + let v3 = g.resolve_vertex(3, None); + let vs = vec![(1, v1, v2), (2, v1, v3), (3, v2, v1), (4, v3, v2)]; + + let empty: Vec<(usize, Prop)> = vec![]; + for (t, src, dst) in vs { + g.inner() + .add_edge_internal(t.into(), src, dst, empty.clone(), 0); + } + + let v = g.inner().vertex(0.into()); + + let ns = v + .neighbours(vec![], Direction::BOTH) + .map(|v| v.id().0) + .collect::>(); + assert_eq!(ns, vec![1, 2]); + } +} diff --git a/raphtory/src/core/entities/graph/tgraph.rs b/raphtory/src/core/entities/graph/tgraph.rs new file mode 100644 index 0000000000..60109f3666 --- /dev/null +++ b/raphtory/src/core/entities/graph/tgraph.rs @@ -0,0 +1,555 @@ +use crate::{ + core::{ + entities::{ + edges::{ + edge::EdgeView, + edge_ref::EdgeRef, + edge_store::{EdgeLayer, EdgeStore}, + }, + graph::{ + tgraph_storage::{GraphStorage, LockedIter}, + timer::{MaxCounter, MinCounter, TimeCounterTrait}, + }, + properties::{ + graph_props::GraphProps, + props::{ArcReadLockedVec, Meta}, + tprop::TProp, + }, + 
vertices::{ + input_vertex::InputVertex, + vertex::{ArcEdge, ArcVertex, Vertex}, + vertex_ref::VertexRef, + vertex_store::VertexStore, + }, + LayerIds, EID, VID, + }, + storage::{ + lazy_vec::IllegalSet, + locked_view::LockedView, + timeindex::{AsTime, LayeredIndex, TimeIndexEntry, TimeIndexOps}, + ArcEntry, Entry, EntryMut, + }, + utils::{ + errors::{GraphError, IllegalMutate, MutateGraphError}, + time::TryIntoTime, + }, + ArcStr, Direction, Prop, PropUnwrap, + }, + db::api::view::{internal::EdgeFilter, BoxedIter, Layer}, +}; +use dashmap::{DashMap, DashSet}; +use itertools::Itertools; +use parking_lot::RwLockReadGuard; +use rayon::prelude::*; +use rustc_hash::FxHasher; +use serde::{Deserialize, Serialize}; +use std::{ + fmt::Debug, + hash::BuildHasherDefault, + iter, + ops::{Deref, Range}, + path::Path, + sync::{atomic::AtomicUsize, Arc}, +}; + +pub(crate) type FxDashMap = DashMap>; +pub(crate) type FxDashSet = DashSet>; + +pub(crate) type TGraph = TemporalGraph; + +#[derive(Serialize, Deserialize, Debug, Clone)] +pub struct InnerTemporalGraph(Arc>); + +impl InnerTemporalGraph { + #[inline] + pub(crate) fn inner(&self) -> &TemporalGraph { + &self.0 + } +} + +#[derive(Serialize, Deserialize, Debug)] +pub struct TemporalGraph { + // mapping between logical and physical ids + logical_to_physical: FxDashMap, + string_pool: FxDashSet, + + pub(crate) storage: GraphStorage, + + pub(crate) event_counter: AtomicUsize, + + //earliest time seen in this graph + pub(in crate::core) earliest_time: MinCounter, + + //latest time seen in this graph + pub(in crate::core) latest_time: MaxCounter, + + // props meta data for vertices (mapping between strings and ids) + pub(crate) vertex_meta: Arc, + + // props meta data for edges (mapping between strings and ids) + pub(crate) edge_meta: Arc, + + // graph properties + pub(crate) graph_props: GraphProps, +} + +impl std::fmt::Display for InnerTemporalGraph { + fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result { + 
write!( + f, + "Graph(num_vertices={}, num_edges={})", + self.inner().storage.nodes.len(), + self.inner().storage.edges.len() + ) + } +} + +impl Default for InnerTemporalGraph { + fn default() -> Self { + let tg = TemporalGraph { + logical_to_physical: FxDashMap::default(), // TODO: could use DictMapper here + string_pool: Default::default(), + storage: GraphStorage::new(), + event_counter: AtomicUsize::new(0), + earliest_time: MinCounter::new(), + latest_time: MaxCounter::new(), + vertex_meta: Arc::new(Meta::new()), + edge_meta: Arc::new(Meta::new()), + graph_props: GraphProps::new(), + }; + + Self(Arc::new(tg)) + } +} + +impl TemporalGraph { + pub(crate) fn num_layers(&self) -> usize { + self.edge_meta.layer_meta().len() + } + + pub(crate) fn layer_names(&self, layer_ids: LayerIds) -> BoxedIter { + match layer_ids { + LayerIds::None => Box::new(iter::empty()), + LayerIds::All => Box::new(self.edge_meta.layer_meta().get_keys().into_iter()), + LayerIds::One(id) => { + let name = self.edge_meta.layer_meta().get_name(id).clone(); + Box::new(iter::once(name)) + } + LayerIds::Multiple(ids) => { + let keys = self.edge_meta.layer_meta().get_keys(); + Box::new((0..ids.len()).map(move |index| { + let id = ids[index]; + keys[id].clone() + })) + } + } + } + + fn as_local_vertex(&self, v: VertexRef) -> Result { + match v { + VertexRef::Internal(vid) => Ok(vid), + VertexRef::External(gid) => self + .logical_to_physical + .get(&gid) + .map(|entry| *entry) + .ok_or(GraphError::FailedToMutateGraph { + source: MutateGraphError::VertexNotFoundError { vertex_id: gid }, + }), + } + } + + pub(crate) fn get_all_vertex_property_names( + &self, + is_static: bool, + ) -> ArcReadLockedVec { + self.vertex_meta.get_all_property_names(is_static) + } + + pub(crate) fn get_all_edge_property_names(&self, is_static: bool) -> ArcReadLockedVec { + self.edge_meta.get_all_property_names(is_static) + } + + pub(crate) fn get_all_layers(&self) -> Vec { + self.edge_meta.get_all_layers() + } + + 
pub(crate) fn layer_id(&self, key: Layer) -> LayerIds { + match key { + Layer::All => LayerIds::All, + Layer::Default => LayerIds::One(0), + Layer::One(id) => match self.edge_meta.get_layer_id(&id) { + Some(id) => LayerIds::One(id), + None => LayerIds::None, + }, + Layer::Multiple(ids) => { + let mut new_layers = ids + .iter() + .filter_map(|id| self.edge_meta.get_layer_id(id)) + .collect::>(); + let num_layers = self.num_layers(); + let num_new_layers = new_layers.len(); + if num_new_layers == 0 { + LayerIds::None + } else if num_new_layers == 1 { + LayerIds::One(new_layers[0]) + } else if num_new_layers == num_layers { + LayerIds::All + } else { + new_layers.sort_unstable(); + new_layers.dedup(); + LayerIds::Multiple(new_layers.into()) + } + } + } + } + + pub(crate) fn get_layer_name(&self, layer: usize) -> ArcStr { + self.edge_meta.get_layer_name_by_id(layer) + } + + pub(crate) fn graph_earliest_time(&self) -> Option { + Some(self.earliest_time.get()).filter(|t| *t != i64::MAX) + } + + pub(crate) fn graph_latest_time(&self) -> Option { + Some(self.latest_time.get()).filter(|t| *t != i64::MIN) + } + + pub(crate) fn load_from_file>(path: P) -> Result> { + let f = std::fs::File::open(path)?; + let mut reader = std::io::BufReader::new(f); + bincode::deserialize_from(&mut reader) + } + + pub(crate) fn save_to_file>( + &self, + path: P, + ) -> Result<(), Box> { + let f = std::fs::File::create(path)?; + let mut writer = std::io::BufWriter::new(f); + bincode::serialize_into(&mut writer, self) + } + + #[inline] + pub(crate) fn global_vertex_id(&self, v: VID) -> u64 { + let node = self.storage.get_node(v); + node.global_id() + } + + pub(crate) fn vertex_name(&self, v: VID) -> String { + let node = self.storage.get_node(v); + node.name + .clone() + .unwrap_or_else(|| node.global_id().to_string()) + } + + #[inline] + pub(crate) fn node_entry(&self, v: VID) -> Entry<'_, VertexStore, N> { + self.storage.get_node(v.into()) + } + + pub(crate) fn edge_refs(&self) -> impl 
Iterator + Send { + self.storage.edge_refs() + } + + #[inline] + pub(crate) fn edge_entry(&self, e: EID) -> Entry<'_, EdgeStore, N> { + self.storage.get_edge(e.into()) + } +} + +impl TemporalGraph { + pub(crate) fn internal_num_vertices(&self) -> usize { + self.storage.nodes.len() + } + #[inline] + pub(crate) fn num_edges(&self, layers: &LayerIds, filter: Option<&EdgeFilter>) -> usize { + match filter { + None => match layers { + LayerIds::All => self.storage.edges.len(), + _ => { + let guard = self.storage.edges.read_lock(); + guard.par_iter().filter(|e| e.has_layer(layers)).count() + } + }, + Some(filter) => { + let guard = self.storage.edges.read_lock(); + guard.par_iter().filter(|e| filter(e, layers)).count() + } + } + } + + #[inline] + pub(crate) fn degree( + &self, + v: VID, + dir: Direction, + layers: &LayerIds, + filter: Option<&EdgeFilter>, + ) -> usize { + let node_store = self.storage.get_node(v); + match filter { + None => node_store.degree(layers, dir), + Some(filter) => { + let edges_locked = self.storage.edges.read_lock(); + node_store + .edge_tuples(layers, dir) + .filter(|e| filter(edges_locked.get(e.pid().into()), layers)) + .dedup_by(|e1, e2| e1.remote() == e2.remote()) + .count() + } + } + } + + #[inline] + fn update_time(&self, time: TimeIndexEntry) { + let t = *time.t(); + self.earliest_time.update(t); + self.latest_time.update(t); + } + + /// return local id for vertex, initialising storage if vertex does not exist yet + pub(crate) fn resolve_vertex(&self, id: u64, name: Option<&str>) -> VID { + *(self.logical_to_physical.entry(id).or_insert_with(|| { + let name = name.map(|s| s.to_owned()); + let node_store = VertexStore::empty(id, name); + self.storage.push_node(node_store) + })) + } + + #[inline] + pub(crate) fn add_vertex_no_props( + &self, + time: TimeIndexEntry, + v_id: VID, + ) -> EntryMut { + self.update_time(time); + // get the node and update the time index + let mut node = self.storage.get_node_mut(v_id); + node.update_time(time); 
+ node + } + + pub(crate) fn add_vertex_internal( + &self, + time: TimeIndexEntry, + v_id: VID, + props: Vec<(usize, Prop)>, + ) -> Result<(), GraphError> { + let mut node = self.add_vertex_no_props(time, v_id); + for (id, prop) in props { + node.add_prop(time, id, prop)?; + } + Ok(()) + } + + pub(crate) fn add_edge_properties_internal( + &self, + edge_id: EID, + props: Vec<(usize, Prop)>, + layer: usize, + ) -> Result<(), IllegalMutate> { + let mut edge = self.storage.get_edge_mut(edge_id.into()); + + let mut layer = edge.layer_mut(layer); + for (prop_id, prop) in props { + layer.add_constant_prop(prop_id, prop).map_err(|err| { + IllegalMutate::from_source(err, &self.edge_meta.get_prop_name(prop_id, true)) + })?; + } + Ok(()) + } + + pub(crate) fn add_constant_properties( + &self, + props: Vec<(usize, Prop)>, + ) -> Result<(), GraphError> { + for (id, prop) in props { + self.graph_props.add_constant_prop(id, prop)?; + } + Ok(()) + } + + pub(crate) fn add_properties( + &self, + t: TimeIndexEntry, + props: Vec<(usize, Prop)>, + ) -> Result<(), GraphError> { + for (prop_id, prop) in props { + self.graph_props.add_prop(t, prop_id, prop)?; + } + Ok(()) + } + + pub(crate) fn get_constant_prop(&self, id: usize) -> Option { + self.graph_props.get_constant(id) + } + + pub(crate) fn get_temporal_prop(&self, id: usize) -> Option> { + self.graph_props.get_temporal_prop(id) + } + + pub(crate) fn const_prop_names(&self) -> ArcReadLockedVec { + self.graph_props.constant_names() + } + + pub(crate) fn temporal_property_names(&self) -> ArcReadLockedVec { + self.graph_props.temporal_names() + } + + pub(crate) fn delete_edge( + &self, + t: TimeIndexEntry, + src_id: VID, + dst_id: VID, + layer: usize, + ) -> Result<(), GraphError> { + self.link_nodes(src_id, dst_id, t, layer, |new_edge| { + new_edge.deletions_mut(layer).insert(t); + Ok(()) + })?; + Ok(()) + } + + fn get_or_allocate_layer(&self, layer: Option<&str>) -> usize { + layer + .map(|layer| 
self.edge_meta.get_or_create_layer_id(layer)) + .unwrap_or(0) + } + + fn link_nodes Result<(), GraphError>>( + &self, + src_id: VID, + dst_id: VID, + t: TimeIndexEntry, + layer: usize, + edge_fn: F, + ) -> Result { + let mut node_pair = self.storage.pair_node_mut(src_id.into(), dst_id.into()); + self.update_time(t); + let src = node_pair.get_mut_i(); + + let edge_id = match src.find_edge(dst_id, &LayerIds::All) { + Some(edge_id) => { + let mut edge = self.storage.get_edge_mut(edge_id); + edge_fn(&mut edge)?; + edge_id + } + None => { + let mut edge = EdgeStore::new(src_id, dst_id); + edge_fn(&mut edge)?; + self.storage.push_edge(edge) + } + }; + + src.add_edge(dst_id, Direction::OUT, layer, edge_id); + src.update_time(t); + let dst = node_pair.get_mut_j(); + dst.add_edge(src_id, Direction::IN, layer, edge_id); + dst.update_time(t); + Ok(edge_id) + } + + pub(crate) fn add_edge_internal( + &self, + t: TimeIndexEntry, + src_id: VID, + dst_id: VID, + props: Vec<(usize, Prop)>, + layer: usize, + ) -> Result { + // get the entries for the src and dst nodes + self.link_nodes(src_id, dst_id, t, layer, move |edge| { + edge.additions_mut(layer).insert(t); + let mut edge_layer = edge.layer_mut(layer); + for (prop_id, prop_value) in props { + edge_layer.add_prop(t, prop_id, prop_value)?; + } + Ok(()) + }) + } + + #[inline] + pub(crate) fn vertex_ids(&self) -> impl Iterator { + (0..self.storage.nodes.len()).map(|i| i.into()) + } + + pub(crate) fn locked_edges(&self) -> impl Iterator> { + self.storage.locked_edges() + } + + pub(crate) fn find_edge(&self, src: VID, dst: VID, layer_id: &LayerIds) -> Option { + let node = self.storage.get_node(src.into()); + node.find_edge(dst, layer_id) + } + + pub(crate) fn resolve_vertex_ref(&self, v: VertexRef) -> Option { + match v { + VertexRef::Internal(vid) => Some(vid), + VertexRef::External(gid) => { + let v_id = self.logical_to_physical.get(&gid)?; + Some((*v_id).into()) + } + } + } + + pub(crate) fn vertex(&self, v: VID) -> Vertex { + 
let node = self.storage.get_node(v.into()); + Vertex::from_entry(node, self) + } + + pub(crate) fn vertex_arc(&self, v: VID) -> ArcVertex { + let node = self.storage.get_node_arc(v.into()); + ArcVertex::from_entry(node, self.vertex_meta.clone()) + } + + pub(crate) fn edge_arc(&self, e: EID) -> ArcEdge { + let edge = self.storage.get_edge_arc(e.into()); + ArcEdge::from_entry(edge, self.edge_meta.clone()) + } + + #[inline] + pub(crate) fn edge(&self, e: EID) -> EdgeView { + let edge = self.storage.get_edge(e.into()); + EdgeView::from_entry(edge, self) + } + + /// Checks if the same string value already exists and returns a pointer to the same existing value if it exists, + /// otherwise adds the string to the pool. + pub(crate) fn resolve_str(&self, value: ArcStr) -> ArcStr { + match self.string_pool.get(&value) { + Some(value) => value.clone(), + None => { + if self.string_pool.insert(value.clone()) { + value + } else { + self.string_pool + .get(&value) + .expect("value exists due to insert above returning false") + .clone() + } + } + } + } +} + +#[cfg(test)] +mod test_additions { + use crate::prelude::*; + use rayon::{join, prelude::*}; + #[test] + fn add_edge_and_read_props_concurrent() { + let g = Graph::new(); + for t in 0..1000 { + join( + || g.add_edge(t, 1, 2, [("test", true)], None), + || { + // if the edge exists already, it should have the property set + g.window(t, t + 1) + .edge(1, 2) + .map(|e| assert!(e.properties().get("test").is_some())) + }, + ); + } + } +} diff --git a/raphtory/src/core/entities/graph/tgraph_storage.rs b/raphtory/src/core/entities/graph/tgraph_storage.rs new file mode 100644 index 0000000000..ddbd40fb82 --- /dev/null +++ b/raphtory/src/core/entities/graph/tgraph_storage.rs @@ -0,0 +1,208 @@ +use crate::core::{ + entities::{ + edges::{edge_ref::EdgeRef, edge_store::EdgeStore}, + vertices::vertex_store::VertexStore, + LayerIds, EID, VID, + }, + storage::{self, ArcEntry, Entry, EntryMut, PairEntryMut}, + Direction, +}; +use 
rayon::prelude::{ParallelBridge, ParallelIterator}; +use serde::{Deserialize, Serialize}; +use std::{ + ops::{Deref, Range}, + sync::Arc, +}; + +#[derive(Debug, Deserialize, Serialize, PartialEq)] +pub(crate) struct GraphStorage { + // node storage with having (id, time_index, properties, adj list for each layer) + pub(crate) nodes: storage::RawStorage, + + // edge storage with having (src, dst, time_index, properties) for each layer + pub(crate) edges: storage::RawStorage, +} + +impl GraphStorage { + pub(crate) fn new() -> Self { + Self { + nodes: storage::RawStorage::new(), + edges: storage::RawStorage::new(), + } + } + + pub(crate) fn push_node(&self, node: VertexStore) -> VID { + self.nodes + .push(node, |vid, node| node.vid = vid.into()) + .into() + } + + pub(crate) fn push_edge(&self, edge: EdgeStore) -> EID { + self.edges + .push(edge, |eid, edge| edge.eid = eid.into()) + .into() + } + + #[inline] + pub(crate) fn get_node_mut(&self, id: VID) -> EntryMut<'_, VertexStore> { + self.nodes.entry_mut(id.into()) + } + + #[inline] + pub(crate) fn get_edge_mut(&self, id: EID) -> EntryMut<'_, EdgeStore> { + self.edges.entry_mut(id.into()) + } + + #[inline] + pub(crate) fn get_node(&self, id: VID) -> Entry<'_, VertexStore, N> { + self.nodes.entry(id.into()) + } + + pub(crate) fn get_node_arc(&self, id: VID) -> ArcEntry { + self.nodes.entry_arc(id.into()) + } + + pub(crate) fn get_edge_arc(&self, id: EID) -> ArcEntry { + self.edges.entry_arc(id.into()) + } + + #[inline] + pub(crate) fn get_edge(&self, id: EID) -> Entry<'_, EdgeStore, N> { + self.edges.entry(id.into()) + } + + pub(crate) fn pair_node_mut(&self, i: VID, j: VID) -> PairEntryMut<'_, VertexStore> { + self.nodes.pair_entry_mut(i.into(), j.into()) + } + + fn lock(&self) -> LockedGraphStorage { + LockedGraphStorage::new(self) + } + + pub(crate) fn locked_nodes(&self) -> LockedIter { + LockedIter { + from: 0, + to: self.nodes.len(), + locked_gs: Arc::new(self.lock()), + phantom: std::marker::PhantomData, + } + } 
+ + pub(crate) fn locked_edges(&self) -> impl Iterator> { + self.edges.read_lock().into_iter() + } + + pub(crate) fn edge_refs(&self) -> impl Iterator + Send { + self.edges + .read_lock() + .into_iter() + .map(|entry| EdgeRef::from(entry)) + } +} + +pub(crate) struct LockedIter { + from: usize, + to: usize, + locked_gs: Arc>, + phantom: std::marker::PhantomData, +} + +impl Iterator for LockedIter { + type Item = GraphEntry; + + fn next(&mut self) -> Option { + if self.from < self.to { + let node = Some(GraphEntry { + locked_gs: self.locked_gs.clone(), + i: self.from, + _marker: std::marker::PhantomData, + }); + self.from += 1; + node + } else { + None + } + } +} + +impl<'a, const N: usize> Iterator for LockedIter { + type Item = GraphEntry; + + fn next(&mut self) -> Option { + if self.from < self.to { + let node = Some(GraphEntry { + locked_gs: self.locked_gs.clone(), + i: self.from, + _marker: std::marker::PhantomData, + }); + self.from += 1; + node + } else { + None + } + } +} + +pub struct GraphEntry { + locked_gs: Arc>, + i: usize, + _marker: std::marker::PhantomData, +} + +// impl new +impl<'a, const N: usize, T> GraphEntry { + pub(crate) fn new(gs: Arc>, i: usize) -> Self { + Self { + locked_gs: gs, + i, + _marker: std::marker::PhantomData, + } + } + + pub(crate) fn index(&self) -> usize { + self.i + } + + pub(crate) fn locked_gs(&self) -> &Arc> { + &self.locked_gs + } +} + +impl<'a, const N: usize> Deref for GraphEntry { + type Target = VertexStore; + + fn deref(&self) -> &Self::Target { + self.locked_gs.get_node(self.i) + } +} + +impl<'a, const N: usize> Deref for GraphEntry { + type Target = EdgeStore; + + fn deref(&self) -> &Self::Target { + self.locked_gs.get_edge(self.i) + } +} + +#[derive(Debug)] +pub(crate) struct LockedGraphStorage { + nodes: storage::ReadLockedStorage, + edges: storage::ReadLockedStorage, +} + +impl LockedGraphStorage { + pub(crate) fn new(storage: &GraphStorage) -> Self { + Self { + nodes: storage.nodes.read_lock(), + edges: 
storage.edges.read_lock(), + } + } + + pub(crate) fn get_node(&self, id: usize) -> &VertexStore { + self.nodes.get(id) + } + + pub(crate) fn get_edge(&self, id: usize) -> &EdgeStore { + self.edges.get(id) + } +} diff --git a/raphtory/src/core/entities/graph/timer.rs b/raphtory/src/core/entities/graph/timer.rs new file mode 100644 index 0000000000..f7eda2d487 --- /dev/null +++ b/raphtory/src/core/entities/graph/timer.rs @@ -0,0 +1,108 @@ +use serde::{Deserialize, Serialize}; +use std::sync::atomic::{AtomicI64, Ordering}; + +pub(crate) trait TimeCounterTrait { + fn cmp(a: i64, b: i64) -> bool; + fn counter(&self) -> &AtomicI64; + + fn update(&self, new_value: i64) { + let mut current_value = self.get(); + while Self::cmp(new_value, current_value) { + match self.counter().compare_exchange_weak( + current_value, + new_value, + Ordering::Relaxed, + Ordering::Relaxed, + ) { + Ok(_) => break, + Err(value) => current_value = value, + } + } + } + fn get(&self) -> i64; +} + +#[derive(Serialize, Deserialize, Debug)] +pub(crate) struct MinCounter { + counter: AtomicI64, +} + +impl MinCounter { + pub fn new() -> Self { + Self { + counter: AtomicI64::new(i64::MAX), + } + } +} + +impl TimeCounterTrait for MinCounter { + fn cmp(new_value: i64, current_value: i64) -> bool { + new_value < current_value + } + + fn counter(&self) -> &AtomicI64 { + &self.counter + } + + fn get(&self) -> i64 { + self.counter.load(Ordering::Relaxed) + } +} + +#[derive(Serialize, Deserialize, Debug)] +pub(crate) struct MaxCounter { + counter: AtomicI64, +} + +impl MaxCounter { + pub fn new() -> Self { + Self { + counter: AtomicI64::new(i64::MIN), + } + } +} + +impl TimeCounterTrait for MaxCounter { + fn cmp(a: i64, b: i64) -> bool { + a > b + } + fn get(&self) -> i64 { + self.counter.load(Ordering::Relaxed) + } + + fn counter(&self) -> &AtomicI64 { + &self.counter + } +} + +#[cfg(test)] +mod test { + + use super::*; + + #[test] + fn min_counter() { + let counter = MinCounter::new(); + counter.update(0); + 
assert_eq!(counter.get(), 0); + counter.update(1); + assert_eq!(counter.get(), 0); + counter.update(0); + assert_eq!(counter.get(), 0); + counter.update(-1); + assert_eq!(counter.get(), -1); + } + + #[test] + fn max_counter() { + let counter = MaxCounter::new(); + counter.update(0); + assert_eq!(counter.get(), 0); + counter.update(-1); + assert_eq!(counter.get(), 0); + counter.update(0); + assert_eq!(counter.get(), 0); + counter.update(1); + assert_eq!(counter.get(), 1); + } +} diff --git a/raphtory/src/core/entities/mod.rs b/raphtory/src/core/entities/mod.rs new file mode 100644 index 0000000000..8b0db056e3 --- /dev/null +++ b/raphtory/src/core/entities/mod.rs @@ -0,0 +1,185 @@ +#![allow(unused)] + +use std::{ops::Deref, sync::Arc}; + +use crate::core::entities::edges::edge_ref::EdgeRef; +use edges::edge::ERef; +use graph::{tgraph::TGraph, tgraph_storage::GraphEntry}; +use serde::{Deserialize, Serialize}; +use vertices::{vertex_ref::VertexRef, vertex_store::VertexStore}; + +use super::{storage::Entry, Direction}; + +pub mod edges; +pub mod graph; +pub mod properties; +pub mod vertices; + +// the only reason this is public is because the phisical ids of the vertices don't move +#[repr(transparent)] +#[derive( + Copy, Clone, Debug, PartialEq, Eq, Hash, PartialOrd, Ord, Deserialize, Serialize, Default, +)] +pub struct VID(pub usize); + +#[derive(Copy, Clone, Debug, PartialEq, Eq, Hash)] +pub(crate) struct LocalID { + pub(crate) bucket: usize, + pub(crate) offset: usize, +} + +impl From for VID { + fn from(id: usize) -> Self { + VID(id) + } +} + +impl From for usize { + fn from(id: VID) -> Self { + id.0 + } +} + +#[repr(transparent)] +#[derive( + Copy, Clone, Debug, PartialEq, Eq, Hash, PartialOrd, Ord, Deserialize, Serialize, Default, +)] +pub struct EID(pub usize); + +impl From for usize { + fn from(id: EID) -> Self { + id.0 + } +} + +impl From for EID { + fn from(id: usize) -> Self { + EID(id) + } +} + +pub(crate) enum VRef<'a, const N: usize> { + Entry(Entry<'a, 
VertexStore, N>), // returned from graph.vertex + LockedEntry(GraphEntry), // returned from locked_vertices +} + +// return index -> usize for VRef +impl<'a, const N: usize> VRef<'a, N> { + fn index(&'a self) -> usize { + match self { + VRef::Entry(e) => e.index(), + VRef::LockedEntry(ge) => ge.index(), + } + } + + fn edge_ref(&self, edge_id: EID, graph: &'a TGraph) -> ERef<'a, N> { + match self { + VRef::Entry(_) => ERef::ERef(graph.edge_entry(edge_id)), + VRef::LockedEntry(ge) => ERef::ELock { + lock: ge.locked_gs().clone(), + eid: edge_id, + }, + } + } +} + +impl<'a, const N: usize> Deref for VRef<'a, N> { + type Target = VertexStore; + + fn deref(&self) -> &Self::Target { + match self { + VRef::Entry(e) => e, + VRef::LockedEntry(e) => e, + } + } +} + +pub(crate) trait GraphItem<'a, const N: usize> { + fn from_edge_ids( + src: VID, + dst: VID, + e_id: ERef<'a, N>, + dir: Direction, + graph: &'a TGraph, + ) -> Self; +} + +#[derive(Clone, Debug)] +pub enum LayerIds { + None, + All, + One(usize), + Multiple(Arc<[usize]>), +} + +impl LayerIds { + pub fn find(&self, layer_id: usize) -> Option { + match self { + LayerIds::All => Some(layer_id), + LayerIds::One(id) => { + if *id == layer_id { + Some(layer_id) + } else { + None + } + } + LayerIds::Multiple(ids) => ids.binary_search(&layer_id).ok().map(|_| layer_id), + LayerIds::None => None, + } + } + + pub fn constrain_from_edge(self, e: EdgeRef) -> LayerIds { + match e.layer() { + None => self, + Some(l) => self + .find(*l) + .map(|l| LayerIds::One(l)) + .unwrap_or(LayerIds::None), + } + } + + pub fn contains(&self, layer_id: &usize) -> bool { + self.find(*layer_id).is_some() + } +} + +impl From> for LayerIds { + fn from(mut v: Vec) -> Self { + match v.len() { + 0 => LayerIds::All, + 1 => LayerIds::One(v[0]), + _ => { + v.sort_unstable(); + v.dedup(); + LayerIds::Multiple(v.into()) + } + } + } +} + +impl From<[usize; N]> for LayerIds { + fn from(v: [usize; N]) -> Self { + match v.len() { + 0 => LayerIds::All, + 1 => 
LayerIds::One(v[0]), + _ => { + let mut v = v.to_vec(); + v.sort_unstable(); + v.dedup(); + LayerIds::Multiple(v.into()) + } + } + } +} + +impl From for LayerIds { + fn from(id: usize) -> Self { + LayerIds::One(id) + } +} + +impl From> for LayerIds { + fn from(id: Arc<[usize]>) -> Self { + LayerIds::Multiple(id) + } +} diff --git a/raphtory/src/core/entities/properties/graph_props.rs b/raphtory/src/core/entities/properties/graph_props.rs new file mode 100644 index 0000000000..56e335882e --- /dev/null +++ b/raphtory/src/core/entities/properties/graph_props.rs @@ -0,0 +1,141 @@ +use crate::core::{ + entities::{ + graph::tgraph::FxDashMap, + properties::{ + props::{ArcReadLockedVec, DictMapper}, + tprop::TProp, + }, + }, + storage::{lazy_vec::IllegalSet, locked_view::LockedView, timeindex::TimeIndexEntry}, + utils::errors::{GraphError, IllegalMutate, MutateGraphError}, + ArcStr, Prop, PropType, +}; +use parking_lot::RwLockReadGuard; +use serde::{Deserialize, Serialize}; +use std::{ + ops::{Deref, DerefMut}, + sync::Arc, +}; + +#[derive(Serialize, Deserialize, Debug)] +pub struct GraphProps { + constant_mapper: DictMapper, + temporal_mapper: DictMapper, + constant: FxDashMap>, + temporal: FxDashMap, +} + +impl GraphProps { + pub(crate) fn new() -> Self { + Self { + constant_mapper: DictMapper::default(), + temporal_mapper: DictMapper::default(), + constant: FxDashMap::default(), + temporal: FxDashMap::default(), + } + } + + #[inline] + pub fn const_prop_meta(&self) -> &DictMapper { + &self.constant_mapper + } + + #[inline] + pub fn temporal_prop_meta(&self) -> &DictMapper { + &self.temporal_mapper + } + + #[inline] + pub(crate) fn resolve_property(&self, name: &str, is_static: bool) -> usize { + if is_static { + self.constant_mapper.get_or_create_id(name) + } else { + self.temporal_mapper.get_or_create_id(name) + } + } + + pub(crate) fn add_constant_prop( + &self, + prop_id: usize, + prop: Prop, + ) -> Result<(), MutateGraphError> { + let mut prop_entry = 
self.constant.entry(prop_id).or_insert(None); + match prop_entry.deref_mut() { + Some(old_value) => { + if !(old_value == &prop) { + return Err(MutateGraphError::IllegalGraphPropertyChange { + name: self.constant_mapper.get_name(prop_id).to_string(), + old_value: old_value.clone(), + new_value: prop, + }); + } + } + None => { + (*prop_entry) = Some(prop); + } + } + Ok(()) + } + + pub(crate) fn add_prop( + &self, + t: TimeIndexEntry, + prop_id: usize, + prop: Prop, + ) -> Result<(), GraphError> { + let mut prop_entry = self.temporal.entry(prop_id).or_insert(TProp::default()); + (*prop_entry).set(t, prop) + } + + pub(crate) fn get_constant(&self, id: usize) -> Option { + let entry = self.constant.get(&id)?; + entry.as_ref().cloned() + } + + pub(crate) fn get_temporal_prop(&self, prop_id: usize) -> Option> { + let entry = self.temporal.get(&prop_id)?; + Some(LockedView::DashMap(entry)) + } + + pub fn get_const_prop_id(&self, name: &str) -> Option { + self.constant_mapper.get_id(name) + } + + pub fn get_temporal_id(&self, name: &str) -> Option { + self.temporal_mapper.get_id(name) + } + + pub fn get_const_prop_name(&self, prop_id: usize) -> ArcStr { + self.constant_mapper.get_name(prop_id) + } + + pub fn get_temporal_name(&self, prop_id: usize) -> ArcStr { + self.temporal_mapper.get_name(prop_id) + } + + pub fn get_constant_dtype(&self, prop_id: usize) -> Option { + self.constant + .get(&prop_id) + .and_then(|v| v.as_ref().map(|v| v.dtype())) + } + + pub fn get_temporal_dtype(&self, prop_id: usize) -> Option { + self.temporal.get(&prop_id).map(|v| v.dtype()) + } + + pub(crate) fn constant_names(&self) -> ArcReadLockedVec { + self.constant_mapper.get_keys() + } + + pub(crate) fn const_prop_ids(&self) -> impl Iterator { + 0..self.constant_mapper.len() + } + + pub(crate) fn temporal_names(&self) -> ArcReadLockedVec { + self.temporal_mapper.get_keys() + } + + pub(crate) fn temporal_ids(&self) -> impl Iterator { + 0..self.temporal_mapper.len() + } +} diff --git 
a/raphtory/src/core/entities/properties/mod.rs b/raphtory/src/core/entities/properties/mod.rs new file mode 100644 index 0000000000..c5875f71b6 --- /dev/null +++ b/raphtory/src/core/entities/properties/mod.rs @@ -0,0 +1,4 @@ +pub mod graph_props; +pub mod props; +pub mod tcell; +pub mod tprop; diff --git a/raphtory/src/core/entities/properties/props.rs b/raphtory/src/core/entities/properties/props.rs new file mode 100644 index 0000000000..695cc16948 --- /dev/null +++ b/raphtory/src/core/entities/properties/props.rs @@ -0,0 +1,462 @@ +use crate::core::{ + entities::{graph::tgraph::FxDashMap, properties::tprop::TProp}, + storage::{ + lazy_vec::{IllegalSet, LazyVec}, + locked_view::LockedView, + timeindex::TimeIndexEntry, + }, + utils::errors::{GraphError, IllegalMutate, MutateGraphError}, + ArcStr, Prop, PropType, +}; +use lock_api; +use parking_lot::{RwLock, RwLockReadGuard}; +use serde::{Deserialize, Serialize}; +use std::{ + borrow::Borrow, + fmt::Debug, + hash::Hash, + ops::Deref, + sync::{ + atomic::{AtomicUsize, Ordering}, + Arc, + }, +}; +use tantivy::HasLen; + +type ArcRwLockReadGuard = lock_api::ArcRwLockReadGuard; + +#[derive(Serialize, Deserialize, Default, Debug, PartialEq)] +pub struct Props { + // properties + constant_props: LazyVec>, + temporal_props: LazyVec, +} + +#[derive(Debug, Serialize, Deserialize, PartialEq, Eq, Hash, Clone)] +enum PropId { + Static(usize), + Temporal(usize), +} + +impl Props { + pub fn new() -> Self { + Self { + constant_props: LazyVec::Empty, + temporal_props: LazyVec::Empty, + } + } + + pub fn add_prop( + &mut self, + t: TimeIndexEntry, + prop_id: usize, + prop: Prop, + ) -> Result<(), GraphError> { + self.temporal_props.update(prop_id, |p| p.set(t, prop)) + } + + pub fn add_constant_prop( + &mut self, + prop_id: usize, + prop: Prop, + ) -> Result<(), IllegalSet>> { + self.constant_props.set(prop_id, Some(prop)) + } + + pub fn temporal_props(&self, prop_id: usize) -> Box + '_> { + let o = self.temporal_props.get(prop_id); + 
if let Some(t_prop) = o { + Box::new(t_prop.iter()) + } else { + Box::new(std::iter::empty()) + } + } + + pub fn temporal_props_window( + &self, + prop_id: usize, + t_start: i64, + t_end: i64, + ) -> Box + '_> { + let o = self.temporal_props.get(prop_id); + if let Some(t_prop) = o { + Box::new(t_prop.iter_window(t_start..t_end)) + } else { + Box::new(std::iter::empty()) + } + } + + pub fn const_prop(&self, prop_id: usize) -> Option<&Prop> { + let prop = self.constant_props.get(prop_id)?; + prop.as_ref() + } + + pub fn temporal_prop(&self, prop_id: usize) -> Option<&TProp> { + self.temporal_props.get(prop_id) + } + + pub fn const_prop_ids(&self) -> impl Iterator + '_ { + self.constant_props.filled_ids() + } + + pub fn temporal_prop_ids(&self) -> impl Iterator + '_ { + self.temporal_props.filled_ids() + } +} + +#[derive(Serialize, Deserialize, Debug)] +pub struct Meta { + meta_prop_temporal: PropMapper, + meta_prop_constant: PropMapper, + meta_layer: DictMapper, +} + +impl Meta { + pub fn const_prop_meta(&self) -> &PropMapper { + &self.meta_prop_constant + } + + pub fn temporal_prop_meta(&self) -> &PropMapper { + &self.meta_prop_temporal + } + + pub fn layer_meta(&self) -> &DictMapper { + &self.meta_layer + } + + pub fn new() -> Self { + let meta_layer = DictMapper::default(); + meta_layer.get_or_create_id("_default"); + Self { + meta_prop_temporal: PropMapper::default(), + meta_prop_constant: PropMapper::default(), + meta_layer, // layer 0 is the default layer + } + } + + #[inline] + pub fn resolve_prop_id( + &self, + prop: &str, + dtype: PropType, + is_static: bool, + ) -> Result { + if is_static { + self.meta_prop_constant + .get_or_create_and_validate(prop, dtype) + } else { + self.meta_prop_temporal + .get_or_create_and_validate(prop, dtype) + } + } + + #[inline] + pub fn get_prop_id(&self, name: &str, is_static: bool) -> Option { + if is_static { + self.meta_prop_constant.get_id(name) + } else { + self.meta_prop_temporal.get_id(name) + } + } + + #[inline] + pub 
fn get_or_create_layer_id(&self, name: &str) -> usize { + self.meta_layer.get_or_create_id(name) + } + + #[inline] + pub fn get_layer_id(&self, name: &str) -> Option { + self.meta_layer.map.get(name).as_deref().copied() + } + + pub fn get_layer_name_by_id(&self, id: usize) -> ArcStr { + self.meta_layer.get_name(id) + } + + pub fn get_all_layers(&self) -> Vec { + self.meta_layer + .map + .iter() + .map(|entry| *entry.value()) + .collect() + } + + pub fn get_all_property_names(&self, is_static: bool) -> ArcReadLockedVec { + if is_static { + self.meta_prop_constant.get_keys() + } else { + self.meta_prop_temporal.get_keys() + } + } + + pub fn get_prop_name(&self, prop_id: usize, is_static: bool) -> ArcStr { + if is_static { + self.meta_prop_constant.get_name(prop_id) + } else { + self.meta_prop_temporal.get_name(prop_id) + } + } +} + +#[derive(Serialize, Deserialize, Default, Debug)] +pub struct DictMapper { + map: FxDashMap, + reverse_map: Arc>>, //FIXME: a boxcar vector would be a great fit if it was serializable... 
+} + +#[derive(Debug)] +pub struct ArcReadLockedVec { + guard: ArcRwLockReadGuard>, +} + +impl Deref for ArcReadLockedVec { + type Target = Vec; + + #[inline] + fn deref(&self) -> &Self::Target { + self.guard.deref() + } +} + +impl IntoIterator for ArcReadLockedVec { + type Item = T; + type IntoIter = LockedIter; + + fn into_iter(self) -> Self::IntoIter { + let guard = self.guard; + let len = guard.len(); + let pos = 0; + LockedIter { guard, pos, len } + } +} + +pub struct LockedIter { + guard: ArcRwLockReadGuard>, + pos: usize, + len: usize, +} + +impl Iterator for LockedIter { + type Item = T; + + fn next(&mut self) -> Option { + if self.pos < self.len { + let next_val = Some(self.guard[self.pos].clone()); + self.pos += 1; + next_val + } else { + None + } + } +} + +impl DictMapper { + pub fn get_or_create_id(&self, name: &Q) -> usize + where + ArcStr: Borrow, + Q: Hash + Eq + ?Sized + ToOwned, + T: Into, + { + if let Some(existing_id) = self.map.get(name) { + return *existing_id; + } + + let name = name.to_owned().into(); + let new_id = self.map.entry(name.clone()).or_insert_with(|| { + let mut reverse = self.reverse_map.write(); + let id = reverse.len(); + reverse.push(name); + id + }); + *new_id + } + + pub fn get_id(&self, name: &str) -> Option { + self.map.get(name).map(|id| *id) + } + + pub fn get_name(&self, id: usize) -> ArcStr { + let guard = self.reverse_map.read(); + guard + .get(id) + .map(|v| v.clone()) + .expect("internal ids should always be mapped to a name") + } + + pub fn get_keys(&self) -> ArcReadLockedVec { + ArcReadLockedVec { + guard: self.reverse_map.read_arc(), + } + } + + pub fn len(&self) -> usize { + self.reverse_map.read().len() + } + + pub fn is_empty(&self) -> bool { + self.reverse_map.read().is_empty() + } +} + +#[derive(Default, Debug, Serialize, Deserialize)] +pub struct PropMapper { + id_mapper: DictMapper, + dtypes: Arc>>, +} + +impl Deref for PropMapper { + type Target = DictMapper; + + #[inline] + fn deref(&self) -> 
&Self::Target { + &self.id_mapper + } +} + +impl PropMapper { + fn get_or_create_and_validate(&self, prop: &str, dtype: PropType) -> Result { + let id = self.id_mapper.get_or_create_id(prop); + let dtype_read = self.dtypes.read_recursive(); + if let Some(old_type) = dtype_read.get(id) { + if !matches!(old_type, PropType::Empty) { + return if *old_type == dtype { + Ok(id) + } else { + Err(GraphError::PropertyTypeError { + name: prop.to_owned(), + expected: *old_type, + actual: dtype, + }) + }; + } + } + drop(dtype_read); // drop the read lock and wait for write lock as type did not exist yet + let mut dtype_write = self.dtypes.write(); + match dtype_write.get(id) { + Some(&old_type) => { + if matches!(old_type, PropType::Empty) { + // vector already resized but this id is not filled yet, set the dtype and return id + dtype_write[id] = dtype; + Ok(id) + } else { + // already filled because a different thread won the race for this id, check the type matches + if old_type == dtype { + Ok(id) + } else { + Err(GraphError::PropertyTypeError { + name: prop.to_owned(), + expected: old_type, + actual: dtype, + }) + } + } + } + None => { + // vector not resized yet, resize it and set the dtype and return id + dtype_write.resize(id + 1, PropType::Empty); + dtype_write[id] = dtype; + Ok(id) + } + } + } + + pub fn get_dtype(&self, prop_id: usize) -> Option { + self.dtypes.read_recursive().get(prop_id).copied() + } +} + +#[cfg(test)] +mod test { + use super::*; + use rand::seq::SliceRandom; + use rayon::prelude::*; + use std::{collections::HashMap, sync::Arc, thread}; + + #[test] + fn test_dict_mapper() { + let mapper = DictMapper::default(); + assert_eq!(mapper.get_or_create_id("test"), 0); + assert_eq!(mapper.get_or_create_id("test"), 0); + assert_eq!(mapper.get_or_create_id("test2"), 1); + assert_eq!(mapper.get_or_create_id("test2"), 1); + assert_eq!(mapper.get_or_create_id("test"), 0); + } + + #[quickcheck] + fn check_dict_mapper_concurrent_write(write: Vec) -> bool { + let n 
= 100; + let mapper: DictMapper = DictMapper::default(); + + // create n maps from strings to ids in parallel + let res: Vec> = (0..n) + .into_par_iter() + .map(|_| { + let mut ids: HashMap = Default::default(); + let mut rng = rand::thread_rng(); + let mut write_s = write.clone(); + write_s.shuffle(&mut rng); + for s in write_s { + let id = mapper.get_or_create_id(s.as_str()); + ids.insert(s, id); + } + ids + }) + .collect(); + + // check that all maps are the same and that all strings have been assigned an id + let res_0 = &res[0]; + res[1..n].iter().all(|v| res_0 == v) && write.iter().all(|v| mapper.get_id(v).is_some()) + } + + // map 5 strings to 5 ids from 4 threads concurrently 1000 times + #[test] + fn test_dict_mapper_concurrent() { + use std::{sync::Arc, thread}; + + let mapper = Arc::new(DictMapper::default()); + let mut threads = Vec::new(); + for _ in 0..4 { + let mapper = Arc::clone(&mapper); + threads.push(thread::spawn(move || { + for _ in 0..1000 { + mapper.get_or_create_id("test"); + mapper.get_or_create_id("test2"); + mapper.get_or_create_id("test3"); + mapper.get_or_create_id("test4"); + mapper.get_or_create_id("test5"); + } + })); + } + + for thread in threads { + thread.join().unwrap(); + } + + let mut actual = vec!["test", "test2", "test3", "test4", "test5"] + .into_iter() + .map(|name| mapper.get_or_create_id(name)) + .collect::>(); + actual.sort(); + + assert_eq!(actual, vec![0, 1, 2, 3, 4]); + } + + #[test] + fn test_prop_mapper_concurrent() { + let values = [Prop::I64(1), Prop::U16(0), Prop::Bool(true), Prop::F64(0.0)]; + let input_len = values.len(); + + let mapper = Arc::new(PropMapper::default()); + let threads: Vec<_> = values + .into_iter() + .map(move |v| { + let mapper = mapper.clone(); + thread::spawn(move || mapper.get_or_create_and_validate("test", v.dtype())) + }) + .flat_map(|t| t.join()) + .collect(); + + assert_eq!(threads.len(), input_len); // no errors + assert_eq!(threads.into_iter().flatten().count(), 1); // only one 
result (which ever was first) + } +} diff --git a/raphtory/src/core/tcell.rs b/raphtory/src/core/entities/properties/tcell.rs similarity index 61% rename from raphtory/src/core/tcell.rs rename to raphtory/src/core/entities/properties/tcell.rs index bfd23ea19d..de17baa33f 100644 --- a/raphtory/src/core/tcell.rs +++ b/raphtory/src/core/entities/properties/tcell.rs @@ -1,47 +1,50 @@ -use std::{collections::BTreeMap, fmt::Debug, ops::Range}; - +use crate::core::storage::{ + sorted_vec_map::SVM, + timeindex::{AsTime, TimeIndexEntry}, +}; use serde::{Deserialize, Serialize}; - -use crate::core::sorted_vec_map::SVM; +use std::{collections::BTreeMap, fmt::Debug, ops::Range}; #[derive(Debug, PartialEq, Default, Clone, Serialize, Deserialize)] - // TCells represent a value in time that can be set at multiple times and keeps a history -pub(crate) enum TCell { +pub enum TCell { #[default] Empty, - TCell1(i64, A), - TCellCap(SVM), - TCellN(BTreeMap), + TCell1(TimeIndexEntry, A), + TCellCap(SVM), + TCellN(BTreeMap), } const BTREE_CUTOFF: usize = 128; -impl TCell { - pub fn new(t: i64, value: A) -> Self { +impl TCell { + pub fn new(t: TimeIndexEntry, value: A) -> Self { TCell::TCell1(t, value) } - pub fn set(&mut self, t: i64, value: A) { + pub fn set(&mut self, t: TimeIndexEntry, value: A) { match self { TCell::Empty => { *self = TCell::TCell1(t, value); } TCell::TCell1(t0, value0) => { - if t != *t0 { - let mut svm = SVM::new(); - svm.insert(t, value); - svm.insert(*t0, value0.clone()); - *self = TCell::TCellCap(svm) + if &t != t0 { + if let TCell::TCell1(t0, value0) = std::mem::take(self) { + let mut svm = SVM::new(); + svm.insert(t, value); + svm.insert(t0, value0); + *self = TCell::TCellCap(svm) + } } } TCell::TCellCap(svm) => { if svm.len() < BTREE_CUTOFF { svm.insert(t, value.clone()); } else { - let mut btm: BTreeMap = BTreeMap::new(); - for (k, v) in svm.iter() { - btm.insert(*k, v.clone()); + let svm = std::mem::take(svm); + let mut btm: BTreeMap = BTreeMap::new(); + 
for (k, v) in svm.into_iter() { + btm.insert(k, v); } btm.insert(t, value.clone()); *self = TCell::TCellN(btm) @@ -53,6 +56,15 @@ impl TCell { } } + pub fn at(&self, ti: &TimeIndexEntry) -> Option<&A> { + match self { + TCell::Empty => None, + TCell::TCell1(t, v) => (t == ti).then_some(v), + TCell::TCellCap(svm) => svm.get(ti), + TCell::TCellN(btm) => btm.get(ti), + } + } + #[allow(dead_code)] pub fn iter(&self) -> Box + '_> { match self { @@ -66,9 +78,9 @@ impl TCell { pub fn iter_t(&self) -> Box + '_> { match self { TCell::Empty => Box::new(std::iter::empty()), - TCell::TCell1(t, value) => Box::new(std::iter::once((t, value))), - TCell::TCellCap(svm) => Box::new(svm.iter()), - TCell::TCellN(btm) => Box::new(btm.iter()), + TCell::TCell1(t, value) => Box::new(std::iter::once((t.t(), value))), + TCell::TCellCap(svm) => Box::new(svm.iter().map(|(ti, v)| (ti.t(), v))), + TCell::TCellN(btm) => Box::new(btm.iter().map(|(ti, v)| (ti.t(), v))), } } @@ -77,14 +89,18 @@ impl TCell { match self { TCell::Empty => Box::new(std::iter::empty()), TCell::TCell1(t, value) => { - if r.contains(t) { + if r.contains(t.t()) { Box::new(std::iter::once(value)) } else { Box::new(std::iter::empty()) } } - TCell::TCellCap(svm) => Box::new(svm.range(r).map(|(_, value)| value)), - TCell::TCellN(btm) => Box::new(btm.range(r).map(|(_, value)| value)), + TCell::TCellCap(svm) => { + Box::new(svm.range(TimeIndexEntry::range(r)).map(|(_, value)| value)) + } + TCell::TCellN(btm) => { + Box::new(btm.range(TimeIndexEntry::range(r)).map(|(_, value)| value)) + } } } @@ -92,14 +108,35 @@ impl TCell { match self { TCell::Empty => Box::new(std::iter::empty()), TCell::TCell1(t, value) => { - if r.contains(t) { - Box::new(std::iter::once((t, value))) + if r.contains(t.t()) { + Box::new(std::iter::once((t.t(), value))) } else { Box::new(std::iter::empty()) } } - TCell::TCellCap(svm) => Box::new(svm.range(r)), - TCell::TCellN(btm) => Box::new(btm.range(r)), + TCell::TCellCap(svm) => Box::new( + 
svm.range(TimeIndexEntry::range(r)) + .map(|(ti, v)| (ti.t(), v)), + ), + TCell::TCellN(btm) => Box::new( + btm.range(TimeIndexEntry::range(r)) + .map(|(ti, v)| (ti.t(), v)), + ), + } + } + + pub fn last_before(&self, t: i64) -> Option<(&i64, &A)> { + match self { + TCell::Empty => None, + TCell::TCell1(t2, v) => (t2.t() < &t).then_some((t2.t(), v)), + TCell::TCellCap(map) => map + .range(TimeIndexEntry::range(i64::MIN..t)) + .last() + .map(|(ti, v)| (ti.t(), v)), + TCell::TCellN(map) => map + .range(TimeIndexEntry::range(i64::MIN..t)) + .last() + .map(|(ti, v)| (ti.t(), v)), } } } @@ -107,19 +144,20 @@ impl TCell { #[cfg(test)] mod tcell_tests { use super::TCell; + use crate::{core::storage::timeindex::TimeIndexEntry, db::api::view::TimeIndex}; #[test] fn set_new_value_for_tcell_initialized_as_empty() { let mut tcell = TCell::default(); - tcell.set(16, String::from("lobster")); + tcell.set(TimeIndexEntry::start(16), String::from("lobster")); assert_eq!(tcell.iter().collect::>(), vec!["lobster"]); } #[test] fn every_new_update_to_the_same_prop_is_recorded_as_history() { - let mut tcell = TCell::new(1, "Pometry"); - tcell.set(2, "Pometry Inc."); + let mut tcell = TCell::new(TimeIndexEntry::start(1), "Pometry"); + tcell.set(TimeIndexEntry::start(2), "Pometry Inc."); assert_eq!( tcell.iter_t().collect::>(), @@ -129,8 +167,8 @@ mod tcell_tests { #[test] fn new_update_with_the_same_time_to_a_prop_is_ignored() { - let mut tcell = TCell::new(1, "Pometry"); - tcell.set(1, "Pometry Inc."); + let mut tcell = TCell::new(TimeIndexEntry::start(1), "Pometry"); + tcell.set(TimeIndexEntry::start(1), "Pometry Inc."); assert_eq!(tcell.iter_t().collect::>(), vec![(&1, &"Pometry")]); } @@ -145,14 +183,14 @@ mod tcell_tests { assert_eq!(tcell.iter_t().collect::>(), vec![]); - let tcell = TCell::new(3, "Pometry"); + let tcell = TCell::new(TimeIndexEntry::start(3), "Pometry"); assert_eq!(tcell.iter().collect::>(), vec![&"Pometry"]); assert_eq!(tcell.iter_t().collect::>(), vec![(&3, 
&"Pometry")]); - let mut tcell = TCell::new(2, "Pometry"); - tcell.set(1, "Inc. Pometry"); + let mut tcell = TCell::new(TimeIndexEntry::start(2), "Pometry"); + tcell.set(TimeIndexEntry::start(1), "Inc. Pometry"); assert_eq!( // Results are ordered by time @@ -168,7 +206,7 @@ mod tcell_tests { let mut tcell: TCell = TCell::default(); for n in 1..130 { - tcell.set(n, n) + tcell.set(TimeIndexEntry::start(n), n) } assert_eq!(tcell.iter_t().count(), 129); @@ -189,7 +227,7 @@ mod tcell_tests { vec![] ); - let tcell = TCell::new(3, "Pometry"); + let tcell = TCell::new(TimeIndexEntry::start(3), "Pometry"); assert_eq!( tcell.iter_window(3..4).collect::>(), @@ -201,9 +239,9 @@ mod tcell_tests { vec![(&3, &"Pometry")] ); - let mut tcell = TCell::new(3, "Pometry"); - tcell.set(1, "Pometry Inc."); - tcell.set(2, "Raphtory"); + let mut tcell = TCell::new(TimeIndexEntry::start(3), "Pometry"); + tcell.set(TimeIndexEntry::start(1), "Pometry Inc."); + tcell.set(TimeIndexEntry::start(2), "Raphtory"); assert_eq!( tcell.iter_window_t(2..3).collect::>(), @@ -241,7 +279,7 @@ mod tcell_tests { let mut tcell: TCell = TCell::default(); for n in 1..130 { - tcell.set(n, n) + tcell.set(TimeIndexEntry::start(n), n) } assert_eq!(tcell.iter_window_t(i64::MIN..i64::MAX).count(), 129); diff --git a/raphtory/src/core/entities/properties/tprop.rs b/raphtory/src/core/entities/properties/tprop.rs new file mode 100644 index 0000000000..4d10d7f66f --- /dev/null +++ b/raphtory/src/core/entities/properties/tprop.rs @@ -0,0 +1,564 @@ +use crate::{ + core::{ + entities::{ + properties::{props::DictMapper, tcell::TCell}, + LayerIds, + }, + storage::{locked_view::LockedView, timeindex::TimeIndexEntry}, + utils::errors::GraphError, + ArcStr, Prop, PropType, + }, + db::graph::graph::Graph, +}; +use chrono::NaiveDateTime; +use itertools::Itertools; +use serde::{Deserialize, Serialize}; +use std::{collections::HashMap, iter, ops::Range, sync::Arc}; + +// TODO TProp struct could be replaced with Option>, with the 
only issue (or advantage) that then the type can change? + +#[derive(Debug, Default, PartialEq, Clone, Serialize, Deserialize)] +pub enum TProp { + #[default] + Empty, + Str(TCell), + U8(TCell), + U16(TCell), + I32(TCell), + I64(TCell), + U32(TCell), + U64(TCell), + F32(TCell), + F64(TCell), + Bool(TCell), + DTime(TCell), + Graph(TCell), + List(TCell>>), + Map(TCell>>), +} + +impl TProp { + pub fn dtype(&self) -> PropType { + match self { + TProp::Empty => PropType::Empty, + TProp::Str(_) => PropType::Str, + TProp::U8(_) => PropType::U8, + TProp::U16(_) => PropType::U16, + TProp::I32(_) => PropType::I32, + TProp::I64(_) => PropType::I64, + TProp::U32(_) => PropType::U32, + TProp::U64(_) => PropType::U64, + TProp::F32(_) => PropType::F32, + TProp::F64(_) => PropType::F64, + TProp::Bool(_) => PropType::Bool, + TProp::DTime(_) => PropType::DTime, + TProp::Graph(_) => PropType::Graph, + TProp::List(_) => PropType::List, + TProp::Map(_) => PropType::Map, + } + } + + pub(crate) fn from(t: TimeIndexEntry, prop: Prop) -> Self { + match prop { + Prop::Str(value) => TProp::Str(TCell::new(t, value)), + Prop::I32(value) => TProp::I32(TCell::new(t, value)), + Prop::I64(value) => TProp::I64(TCell::new(t, value)), + Prop::U8(value) => TProp::U8(TCell::new(t, value)), + Prop::U16(value) => TProp::U16(TCell::new(t, value)), + Prop::U32(value) => TProp::U32(TCell::new(t, value)), + Prop::U64(value) => TProp::U64(TCell::new(t, value)), + Prop::F32(value) => TProp::F32(TCell::new(t, value)), + Prop::F64(value) => TProp::F64(TCell::new(t, value)), + Prop::Bool(value) => TProp::Bool(TCell::new(t, value)), + Prop::DTime(value) => TProp::DTime(TCell::new(t, value)), + Prop::Graph(value) => TProp::Graph(TCell::new(t, value)), + Prop::List(value) => TProp::List(TCell::new(t, value)), + Prop::Map(value) => TProp::Map(TCell::new(t, value)), + } + } + + pub(crate) fn set(&mut self, t: TimeIndexEntry, prop: Prop) -> Result<(), GraphError> { + if matches!(self, TProp::Empty) { + *self = 
TProp::from(t, prop); + } else { + match (self, prop) { + (TProp::Empty, prop) => {} + + (TProp::Str(cell), Prop::Str(a)) => { + cell.set(t, a); + } + (TProp::I32(cell), Prop::I32(a)) => { + cell.set(t, a); + } + (TProp::I64(cell), Prop::I64(a)) => { + cell.set(t, a); + } + (TProp::U32(cell), Prop::U32(a)) => { + cell.set(t, a); + } + (TProp::U8(cell), Prop::U8(a)) => { + cell.set(t, a); + } + (TProp::U16(cell), Prop::U16(a)) => { + cell.set(t, a); + } + (TProp::U64(cell), Prop::U64(a)) => { + cell.set(t, a); + } + (TProp::F32(cell), Prop::F32(a)) => { + cell.set(t, a); + } + (TProp::F64(cell), Prop::F64(a)) => { + cell.set(t, a); + } + (TProp::Bool(cell), Prop::Bool(a)) => { + cell.set(t, a); + } + (TProp::DTime(cell), Prop::DTime(a)) => { + cell.set(t, a); + } + (TProp::Graph(cell), Prop::Graph(a)) => { + cell.set(t, a); + } + (TProp::List(cell), Prop::List(a)) => { + cell.set(t, a); + } + (TProp::Map(cell), Prop::Map(a)) => { + cell.set(t, a); + } + _ => return Err(GraphError::IncorrectPropertyType), + }; + } + Ok(()) + } + + pub(crate) fn at(&self, ti: &TimeIndexEntry) -> Option { + match self { + TProp::Empty => None, + TProp::Str(cell) => cell.at(ti).map(|v| Prop::Str(v.clone())), + TProp::I32(cell) => cell.at(ti).map(|v| Prop::I32(*v)), + TProp::I64(cell) => cell.at(ti).map(|v| Prop::I64(*v)), + TProp::U32(cell) => cell.at(ti).map(|v| Prop::U32(*v)), + TProp::U8(cell) => cell.at(ti).map(|v| Prop::U8(*v)), + TProp::U16(cell) => cell.at(ti).map(|v| Prop::U16(*v)), + TProp::U64(cell) => cell.at(ti).map(|v| Prop::U64(*v)), + TProp::F32(cell) => cell.at(ti).map(|v| Prop::F32(*v)), + TProp::F64(cell) => cell.at(ti).map(|v| Prop::F64(*v)), + TProp::Bool(cell) => cell.at(ti).map(|v| Prop::Bool(*v)), + TProp::DTime(cell) => cell.at(ti).map(|v| Prop::DTime(*v)), + TProp::Graph(cell) => cell.at(ti).map(|v| Prop::Graph(v.clone())), + TProp::List(cell) => cell.at(ti).map(|v| Prop::List(v.clone())), + TProp::Map(cell) => cell.at(ti).map(|v| Prop::Map(v.clone())), + } + } 
+ + pub(crate) fn last_before(&self, t: i64) -> Option<(i64, Prop)> { + match self { + TProp::Empty => None, + TProp::Str(cell) => cell.last_before(t).map(|(t, v)| (*t, Prop::Str(v.clone()))), + TProp::I32(cell) => cell.last_before(t).map(|(t, v)| (*t, Prop::I32(*v))), + TProp::I64(cell) => cell.last_before(t).map(|(t, v)| (*t, Prop::I64(*v))), + TProp::U8(cell) => cell.last_before(t).map(|(t, v)| (*t, Prop::U8(*v))), + TProp::U16(cell) => cell.last_before(t).map(|(t, v)| (*t, Prop::U16(*v))), + TProp::U32(cell) => cell.last_before(t).map(|(t, v)| (*t, Prop::U32(*v))), + TProp::U64(cell) => cell.last_before(t).map(|(t, v)| (*t, Prop::U64(*v))), + TProp::F32(cell) => cell.last_before(t).map(|(t, v)| (*t, Prop::F32(*v))), + TProp::F64(cell) => cell.last_before(t).map(|(t, v)| (*t, Prop::F64(*v))), + TProp::Bool(cell) => cell.last_before(t).map(|(t, v)| (*t, Prop::Bool(*v))), + TProp::DTime(cell) => cell.last_before(t).map(|(t, v)| (*t, Prop::DTime(*v))), + TProp::Graph(cell) => cell + .last_before(t) + .map(|(t, v)| (*t, Prop::Graph(v.clone()))), + TProp::List(cell) => cell + .last_before(t) + .map(|(t, v)| (*t, Prop::List(v.clone()))), + TProp::Map(cell) => cell.last_before(t).map(|(t, v)| (*t, Prop::Map(v.clone()))), + } + } + + pub(crate) fn iter(&self) -> Box + '_> { + match self { + TProp::Empty => Box::new(iter::empty()), + TProp::Str(cell) => Box::new( + cell.iter_t() + .map(|(t, value)| (*t, Prop::Str(value.clone()))), + ), + TProp::I32(cell) => Box::new(cell.iter_t().map(|(t, value)| (*t, Prop::I32(*value)))), + TProp::I64(cell) => Box::new(cell.iter_t().map(|(t, value)| (*t, Prop::I64(*value)))), + TProp::U8(cell) => Box::new(cell.iter_t().map(|(t, value)| (*t, Prop::U8(*value)))), + TProp::U16(cell) => Box::new(cell.iter_t().map(|(t, value)| (*t, Prop::U16(*value)))), + TProp::U32(cell) => Box::new(cell.iter_t().map(|(t, value)| (*t, Prop::U32(*value)))), + TProp::U64(cell) => Box::new(cell.iter_t().map(|(t, value)| (*t, Prop::U64(*value)))), + 
TProp::F32(cell) => Box::new(cell.iter_t().map(|(t, value)| (*t, Prop::F32(*value)))), + TProp::F64(cell) => Box::new(cell.iter_t().map(|(t, value)| (*t, Prop::F64(*value)))), + TProp::Bool(cell) => Box::new(cell.iter_t().map(|(t, value)| (*t, Prop::Bool(*value)))), + TProp::DTime(cell) => { + Box::new(cell.iter_t().map(|(t, value)| (*t, Prop::DTime(*value)))) + } + TProp::Graph(cell) => Box::new( + cell.iter_t() + .map(|(t, value)| (*t, Prop::Graph(value.clone()))), + ), + TProp::List(cell) => Box::new( + cell.iter_t() + .map(|(t, value)| (*t, Prop::List(value.clone()))), + ), + TProp::Map(cell) => Box::new( + cell.iter_t() + .map(|(t, value)| (*t, Prop::Map(value.clone()))), + ), + } + } + + pub(crate) fn iter_window(&self, r: Range) -> Box + '_> { + match self { + TProp::Empty => Box::new(std::iter::empty()), + TProp::Str(cell) => Box::new( + cell.iter_window_t(r) + .map(|(t, value)| (*t, Prop::Str(value.clone()))), + ), + TProp::I32(cell) => Box::new( + cell.iter_window_t(r) + .map(|(t, value)| (*t, Prop::I32(*value))), + ), + TProp::I64(cell) => Box::new( + cell.iter_window_t(r) + .map(|(t, value)| (*t, Prop::I64(*value))), + ), + TProp::U8(cell) => Box::new( + cell.iter_window_t(r) + .map(|(t, value)| (*t, Prop::U8(*value))), + ), + TProp::U16(cell) => Box::new( + cell.iter_window_t(r) + .map(|(t, value)| (*t, Prop::U16(*value))), + ), + TProp::U32(cell) => Box::new( + cell.iter_window_t(r) + .map(|(t, value)| (*t, Prop::U32(*value))), + ), + TProp::U64(cell) => Box::new( + cell.iter_window_t(r) + .map(|(t, value)| (*t, Prop::U64(*value))), + ), + TProp::F32(cell) => Box::new( + cell.iter_window_t(r) + .map(|(t, value)| (*t, Prop::F32(*value))), + ), + TProp::F64(cell) => Box::new( + cell.iter_window_t(r) + .map(|(t, value)| (*t, Prop::F64(*value))), + ), + TProp::Bool(cell) => Box::new( + cell.iter_window_t(r) + .map(|(t, value)| (*t, Prop::Bool(*value))), + ), + TProp::DTime(cell) => Box::new( + cell.iter_window_t(r) + .map(|(t, value)| (*t, 
Prop::DTime(*value))), + ), + TProp::Graph(cell) => Box::new( + cell.iter_window_t(r) + .map(|(t, value)| (*t, Prop::Graph(value.clone()))), + ), + TProp::List(cell) => Box::new( + cell.iter_window_t(r) + .map(|(t, value)| (*t, Prop::List(value.clone()))), + ), + TProp::Map(cell) => Box::new( + cell.iter_window_t(r) + .map(|(t, value)| (*t, Prop::Map(value.clone()))), + ), + } + } +} + +pub struct LockedLayeredTProp<'a> { + tprop: Vec>, +} + +impl<'a> LockedLayeredTProp<'a> { + pub(crate) fn new(tprop: Vec>) -> Self { + Self { tprop } + } + + pub(crate) fn last_before(&self, t: i64) -> Option<(i64, Prop)> { + self.tprop + .iter() + .flat_map(|p| p.last_before(t)) + .max_by_key(|v| v.0) + } + + pub(crate) fn iter(&self) -> impl Iterator + '_ { + self.tprop + .iter() + .map(|p| p.iter()) + .kmerge_by(|a, b| a.0 < b.0) + } + + pub(crate) fn iter_window(&self, r: Range) -> impl Iterator + '_ { + self.tprop + .iter() + .map(|p| p.iter_window(r.clone())) + .kmerge_by(|a, b| a.0 < b.0) + } + + pub(crate) fn at(&self, ti: &TimeIndexEntry) -> Option { + self.tprop.iter().find_map(|p| p.at(ti)) + } +} + +#[cfg(test)] +mod tprop_tests { + use super::*; + + #[test] + fn set_new_value_for_tprop_initialized_as_empty() { + let mut tprop = TProp::Empty; + tprop.set(1.into(), Prop::I32(10)); + + assert_eq!(tprop.iter().collect::>(), vec![(1, Prop::I32(10))]); + } + + #[test] + fn every_new_update_to_the_same_prop_is_recorded_as_history() { + let mut tprop = TProp::from(1.into(), "Pometry".into()); + tprop.set(2.into(), "Pometry Inc.".into()); + + assert_eq!( + tprop.iter().collect::>(), + vec![(1, "Pometry".into()), (2, "Pometry Inc.".into())] + ); + } + + #[test] + fn new_update_with_the_same_time_to_a_prop_is_ignored() { + let mut tprop = TProp::from(1.into(), "Pometry".into()); + tprop.set(1.into(), "Pometry Inc.".into()); + + assert_eq!( + tprop.iter().collect::>(), + vec![(1, "Pometry".into())] + ); + } + + #[test] + fn updates_to_prop_can_be_iterated() { + let tprop = 
TProp::default(); + + assert_eq!(tprop.iter().collect::>(), vec![]); + + let mut tprop = TProp::from(1.into(), "Pometry".into()); + tprop.set(2.into(), "Pometry Inc.".into()); + + assert_eq!( + tprop.iter().collect::>(), + vec![ + (1, Prop::Str("Pometry".into())), + (2, Prop::Str("Pometry Inc.".into())) + ] + ); + + let mut tprop = TProp::from(1.into(), Prop::I32(2022)); + tprop.set(2.into(), Prop::I32(2023)); + + assert_eq!( + tprop.iter().collect::>(), + vec![(1, Prop::I32(2022)), (2, Prop::I32(2023))] + ); + + let mut tprop = TProp::from(1.into(), Prop::I64(2022)); + tprop.set(2.into(), Prop::I64(2023)); + + assert_eq!( + tprop.iter().collect::>(), + vec![(1, Prop::I64(2022)), (2, Prop::I64(2023))] + ); + + let mut tprop = TProp::from(1.into(), Prop::F32(10.0)); + tprop.set(2.into(), Prop::F32(11.0)); + + assert_eq!( + tprop.iter().collect::>(), + vec![(1, Prop::F32(10.0)), (2, Prop::F32(11.0))] + ); + + let mut tprop = TProp::from(1.into(), Prop::F64(10.0)); + tprop.set(2.into(), Prop::F64(11.0)); + + assert_eq!( + tprop.iter().collect::>(), + vec![(1, Prop::F64(10.0)), (2, Prop::F64(11.0))] + ); + + let mut tprop = TProp::from(1.into(), Prop::U32(1)); + tprop.set(2.into(), Prop::U32(2)); + + assert_eq!( + tprop.iter().collect::>(), + vec![(1, Prop::U32(1)), (2, Prop::U32(2))] + ); + + let mut tprop = TProp::from(1.into(), Prop::U64(1)); + tprop.set(2.into(), Prop::U64(2)); + + assert_eq!( + tprop.iter().collect::>(), + vec![(1, Prop::U64(1)), (2, Prop::U64(2))] + ); + + let mut tprop = TProp::from(1.into(), Prop::U8(1)); + tprop.set(2.into(), Prop::U8(2)); + + assert_eq!( + tprop.iter().collect::>(), + vec![(1, Prop::U8(1)), (2, Prop::U8(2))] + ); + + let mut tprop = TProp::from(1.into(), Prop::U16(1)); + tprop.set(2.into(), Prop::U16(2)); + + assert_eq!( + tprop.iter().collect::>(), + vec![(1, Prop::U16(1)), (2, Prop::U16(2))] + ); + + let mut tprop = TProp::from(1.into(), Prop::Bool(true)); + tprop.set(2.into(), Prop::Bool(true)); + + assert_eq!( + 
tprop.iter().collect::>(), + vec![(1, Prop::Bool(true)), (2, Prop::Bool(true))] + ); + } + + #[test] + fn updates_to_prop_can_be_window_iterated() { + let tprop = TProp::default(); + + assert_eq!( + tprop.iter_window(i64::MIN..i64::MAX).collect::>(), + vec![] + ); + + let mut tprop = TProp::from(3.into(), Prop::Str("Pometry".into())); + tprop.set(1.into(), Prop::Str("Pometry Inc.".into())); + tprop.set(2.into(), Prop::Str("Raphtory".into())); + + assert_eq!( + tprop.iter_window(2..3).collect::>(), + vec![(2, Prop::Str("Raphtory".into()))] + ); + + assert_eq!(tprop.iter_window(4..5).collect::>(), vec![]); + + assert_eq!( + // Results are ordered by time + tprop.iter_window(1..i64::MAX).collect::>(), + vec![ + (1, Prop::Str("Pometry Inc.".into())), + (2, Prop::Str("Raphtory".into())), + (3, Prop::Str("Pometry".into())) + ] + ); + + assert_eq!( + tprop.iter_window(3..i64::MAX).collect::>(), + vec![(3, Prop::Str("Pometry".into()))] + ); + + assert_eq!( + tprop.iter_window(2..i64::MAX).collect::>(), + vec![ + (2, Prop::Str("Raphtory".into())), + (3, Prop::Str("Pometry".into())) + ] + ); + + assert_eq!(tprop.iter_window(5..i64::MAX).collect::>(), vec![]); + + assert_eq!( + tprop.iter_window(i64::MIN..4).collect::>(), + // Results are ordered by time + vec![ + (1, Prop::Str("Pometry Inc.".into())), + (2, Prop::Str("Raphtory".into())), + (3, Prop::Str("Pometry".into())) + ] + ); + + assert_eq!(tprop.iter_window(i64::MIN..1).collect::>(), vec![]); + + let mut tprop = TProp::from(1.into(), Prop::I32(2022)); + tprop.set(2.into(), Prop::I32(2023)); + + assert_eq!( + tprop.iter_window(i64::MIN..i64::MAX).collect::>(), + vec![(1, Prop::I32(2022)), (2, Prop::I32(2023))] + ); + + let mut tprop = TProp::from(1.into(), Prop::I64(2022)); + tprop.set(2.into(), Prop::I64(2023)); + + assert_eq!( + tprop.iter_window(i64::MIN..i64::MAX).collect::>(), + vec![(1, Prop::I64(2022)), (2, Prop::I64(2023))] + ); + + let mut tprop = TProp::from(1.into(), Prop::F32(10.0)); + tprop.set(2.into(), 
Prop::F32(11.0)); + + assert_eq!( + tprop.iter_window(i64::MIN..i64::MAX).collect::>(), + vec![(1, Prop::F32(10.0)), (2, Prop::F32(11.0))] + ); + + let mut tprop = TProp::from(1.into(), Prop::F64(10.0)); + tprop.set(2.into(), Prop::F64(11.0)); + + assert_eq!( + tprop.iter_window(i64::MIN..i64::MAX).collect::>(), + vec![(1, Prop::F64(10.0)), (2, Prop::F64(11.0))] + ); + + let mut tprop = TProp::from(1.into(), Prop::U32(1)); + tprop.set(2.into(), Prop::U32(2)); + + assert_eq!( + tprop.iter_window(i64::MIN..i64::MAX).collect::>(), + vec![(1, Prop::U32(1)), (2, Prop::U32(2))] + ); + + let mut tprop = TProp::from(1.into(), Prop::U64(1)); + tprop.set(2.into(), Prop::U64(2)); + + assert_eq!( + tprop.iter_window(i64::MIN..i64::MAX).collect::>(), + vec![(1, Prop::U64(1)), (2, Prop::U64(2))] + ); + + let mut tprop = TProp::from(1.into(), Prop::U8(1)); + tprop.set(2.into(), Prop::U8(2)); + + assert_eq!( + tprop.iter_window(i64::MIN..i64::MAX).collect::>(), + vec![(1, Prop::U8(1)), (2, Prop::U8(2))] + ); + + let mut tprop = TProp::from(1.into(), Prop::U16(1)); + tprop.set(2.into(), Prop::U16(2)); + + assert_eq!( + tprop.iter_window(i64::MIN..i64::MAX).collect::>(), + vec![(1, Prop::U16(1)), (2, Prop::U16(2))] + ); + + let mut tprop = TProp::from(1.into(), Prop::Bool(true)); + tprop.set(2.into(), Prop::Bool(true)); + + assert_eq!( + tprop.iter_window(i64::MIN..i64::MAX).collect::>(), + vec![(1, Prop::Bool(true)), (2, Prop::Bool(true))] + ); + } +} diff --git a/raphtory/src/core/vertex.rs b/raphtory/src/core/entities/vertices/input_vertex.rs similarity index 64% rename from raphtory/src/core/vertex.rs rename to raphtory/src/core/entities/vertices/input_vertex.rs index 22d5ae364f..ceb6f0511b 100644 --- a/raphtory/src/core/vertex.rs +++ b/raphtory/src/core/entities/vertices/input_vertex.rs @@ -4,11 +4,11 @@ //! This trait allows you to use a variety of types as input vertices, including //! `u64`, `&str`, and `String`. 
-use crate::core::{utils, Prop}; +use crate::core::utils::hashing; pub trait InputVertex: Clone { fn id(&self) -> u64; - fn name_prop(&self) -> Option; + fn id_str(&self) -> Option<&str>; } impl InputVertex for u64 { @@ -16,18 +16,18 @@ impl InputVertex for u64 { *self } - fn name_prop(&self) -> Option { + fn id_str(&self) -> Option<&str> { None } } impl<'a> InputVertex for &'a str { fn id(&self) -> u64 { - self.parse().unwrap_or(utils::calculate_hash(self)) + self.parse().unwrap_or(hashing::calculate_hash(self)) } - fn name_prop(&self) -> Option { - Some(Prop::Str(self.to_string())) + fn id_str(&self) -> Option<&str> { + Some(self) } } @@ -37,7 +37,7 @@ impl InputVertex for String { s.id() } - fn name_prop(&self) -> Option { - Some(Prop::Str(self.to_string())) + fn id_str(&self) -> Option<&str> { + Some(self) } } diff --git a/raphtory/src/core/entities/vertices/mod.rs b/raphtory/src/core/entities/vertices/mod.rs new file mode 100644 index 0000000000..3ad56d82de --- /dev/null +++ b/raphtory/src/core/entities/vertices/mod.rs @@ -0,0 +1,5 @@ +pub mod input_vertex; +pub mod structure; +pub mod vertex; +pub mod vertex_ref; +pub mod vertex_store; diff --git a/raphtory/src/core/entities/vertices/structure/adj.rs b/raphtory/src/core/entities/vertices/structure/adj.rs new file mode 100644 index 0000000000..154ef88006 --- /dev/null +++ b/raphtory/src/core/entities/vertices/structure/adj.rs @@ -0,0 +1,155 @@ +use crate::core::{ + entities::{ + edges::edge_ref::{Dir, EdgeRef}, + vertices::structure::adjset::AdjSet, + EID, VID, + }, + Direction, +}; +use core::panic; +use itertools::Itertools; +use serde::{Deserialize, Serialize}; + +#[derive(Debug, Serialize, Deserialize, PartialEq, Default)] +pub enum Adj { + #[default] + Solo, + List { + // local: + out: AdjSet, + into: AdjSet, + }, +} + +impl Adj { + pub(crate) fn get_edge(&self, v: VID, dir: Direction) -> Option { + match self { + Adj::Solo => None, + Adj::List { out, into } => match dir { + Direction::OUT => out.find(v), 
+ Direction::IN => into.find(v), + Direction::BOTH => self + .get_edge(v, Direction::OUT) + .or_else(|| self.get_edge(v, Direction::IN)), + }, + } + } + + pub(crate) fn new_out(v: VID, e: EID) -> Self { + Adj::List { + out: AdjSet::new(v, e), + into: AdjSet::default(), + } + } + + pub(crate) fn new_into(v: VID, e: EID) -> Self { + Adj::List { + into: AdjSet::new(v, e), + out: AdjSet::default(), + } + } + + pub(crate) fn add_edge_into(&mut self, v: VID, e: EID) { + match self { + Adj::Solo => *self = Self::new_into(v, e), + Adj::List { into, .. } => into.push(v, e), + } + } + + pub(crate) fn add_edge_out(&mut self, v: VID, e: EID) { + match self { + Adj::Solo => *self = Self::new_out(v, e), + Adj::List { out, .. } => out.push(v, e), + } + } + + pub(crate) fn iter(&self, dir: Direction) -> Box + Send + '_> { + match self { + Adj::Solo => Box::new(std::iter::empty()), + Adj::List { out, into } => match dir { + Direction::OUT => Box::new(out.iter()), + Direction::IN => Box::new(into.iter()), + Direction::BOTH => Box::new(out.iter().merge(into.iter())), + }, + } + } + + pub(crate) fn iter_eref( + &self, + dir: Direction, + local: VID, + ) -> Box + Send + '_> { + match self { + Adj::Solo => Box::new(std::iter::empty()), + Adj::List { out, into } => match dir { + Direction::OUT => Box::new( + out.iter() + .map(move |(remote, e)| EdgeRef::new(e, local, remote, Dir::Out)), + ), + Direction::IN => Box::new( + into.iter() + .map(move |(remote, e)| EdgeRef::new(e, local, remote, Dir::Into)), + ), + Direction::BOTH => Box::new( + out.iter() + .map(move |(remote, e)| EdgeRef::new(e, local, remote, Dir::Out)) + .merge( + into.iter() + .map(move |(remote, e)| EdgeRef::new(e, local, remote, Dir::Into)), + ), + ), + }, + } + } + + pub(crate) fn vertex_iter(&self, dir: Direction) -> impl Iterator + Send + '_ { + self.iter(dir).map(|(v, _)| v) + } + + pub(crate) fn degree(&self, dir: Direction) -> usize { + match self { + Adj::Solo => 0, + Adj::List { out, into } => match dir { + 
Direction::OUT => out.len(), + Direction::IN => into.len(), + Direction::BOTH => out + .iter() + .merge(into.iter()) + .dedup_by(|v1, v2| v1.0 == v2.0) + .count(), + }, + } + } + + pub fn fill_page( + &self, + last: Option, + page: &mut [(VID, EID); P], + dir: Dir, + ) -> usize { + match self { + Adj::Solo => 0, + Adj::List { out, into } => match dir { + Dir::Out => out.fill_page(last, page), + Dir::Into => into.fill_page(last, page), + }, + } + } + pub(crate) fn get_page_vec( + &self, + last: Option, + page_size: usize, + dir: Direction, + ) -> Vec<(VID, EID)> { + match self { + Adj::Solo => Vec::new(), + Adj::List { out, into } => match dir { + Direction::OUT => out.get_page_vec(last, page_size), + Direction::IN => into.get_page_vec(last, page_size), + _ => panic!( + "Cannot get page vec for both direction, need to be handled by the caller" + ), + }, + } + } +} diff --git a/raphtory/src/core/entities/vertices/structure/adjset.rs b/raphtory/src/core/entities/vertices/structure/adjset.rs new file mode 100644 index 0000000000..7789737989 --- /dev/null +++ b/raphtory/src/core/entities/vertices/structure/adjset.rs @@ -0,0 +1,304 @@ +//! A data structure for efficiently storing and querying the temporal adjacency set of a node in a temporal graph. 
+ +use itertools::Itertools; +use serde::{Deserialize, Serialize}; +use std::{collections::BTreeMap, hash::Hash}; + +const SMALL_SET: usize = 1024; + +/** + * Temporal adjacency set can track when adding edge v -> u + * does u exist already + * and if it does what is the edge metadata + * + * */ +#[derive(Debug, Default, Serialize, Deserialize, PartialEq)] +pub enum AdjSet + Copy + Send + Sync> { + #[default] + Empty, + One(K, V), + Small { + vs: Vec, // the neighbours + edges: Vec, // edge metadata + }, + Large { + vs: BTreeMap, // this is equiv to vs and edges + }, + // TODO: if we use BTreeSet<(K, Option)> we could implement intersections and support edge label queries such as a && b +} + +impl + Copy + Send + Sync> AdjSet { + pub fn len(&self) -> usize { + match self { + AdjSet::Empty => 0, + AdjSet::One(_, _) => 1, + AdjSet::Small { vs, .. } => vs.len(), + AdjSet::Large { vs } => vs.len(), + } + } + + pub fn is_empty(&self) -> bool { + match self { + AdjSet::Empty => true, + AdjSet::One(_, _) => false, + AdjSet::Small { vs, .. 
} => vs.is_empty(), + AdjSet::Large { vs } => vs.is_empty(), + } + } + pub fn new(v: K, e: V) -> Self { + Self::One(v, e) + } + + pub fn push(&mut self, v: K, e: V) { + match self { + AdjSet::Empty => { + *self = Self::new(v, e); + } + AdjSet::One(vv, ee) => { + if *vv < v { + *self = Self::Small { + vs: vec![*vv, v], + edges: vec![*ee, e], + } + } else if *vv > v { + *self = Self::Small { + vs: vec![v, *vv], + edges: vec![e, *ee], + } + } + } + AdjSet::Small { vs, edges } => match vs.binary_search(&v) { + Ok(_) => {} + Err(i) => { + if vs.len() < SMALL_SET { + vs.insert(i, v); + edges.insert(i, e); + } else { + let mut map = + BTreeMap::from_iter(vs.iter().copied().zip(edges.iter().copied())); + map.insert(v, e); + *self = Self::Large { vs: map } + } + } + }, + AdjSet::Large { vs } => { + vs.insert(v, e); + } + } + } + + pub fn iter(&self) -> Box + Send + '_> { + match self { + AdjSet::Empty => Box::new(std::iter::empty()), + AdjSet::One(v, e) => Box::new(std::iter::once((*v, *e))), + AdjSet::Small { vs, edges } => Box::new(vs.iter().copied().zip(edges.iter().copied())), + AdjSet::Large { vs } => Box::new(vs.iter().map(|(k, v)| (*k, *v))), + } + } + + pub fn vertices(&self) -> Box + Send + '_> { + match self { + AdjSet::Empty => Box::new(std::iter::empty()), + AdjSet::One(v, ..) => Box::new(std::iter::once(*v)), + AdjSet::Small { vs, .. 
} => Box::new(vs.iter().copied()), + AdjSet::Large { vs } => Box::new(vs.keys().copied()), + } + } + + pub fn find(&self, v: K) -> Option { + match self { + AdjSet::Empty => None, + AdjSet::One(vv, e) => (*vv == v).then_some(*e), + AdjSet::Small { vs, edges } => vs.binary_search(&v).ok().map(|i| edges[i]), + AdjSet::Large { vs } => vs.get(&v).copied(), + } + } + + /// puts elements into page and returns number of returned elements + pub fn fill_page(&self, last: Option, page: &mut [(K, V); P]) -> usize { + match self { + AdjSet::Empty => 0, + AdjSet::One(v, i) => { + if let Some(l) = last { + if l < *v { + page[0] = (*v, *i); + 1 + } else { + 0 + } + } else { + page[0] = (*v, *i); + 1 + } + } + AdjSet::Small { vs, edges } => { + if let Some(l) = last { + let i = match vs.binary_search(&l) { + Ok(i) => i + 1, + Err(i) => i, + }; + + if i >= vs.len() { + return 0; + } + + let mut index = 0; + vs[i..] + .iter() + .zip(edges[i..].iter()) + .take(P) + .for_each(|(a, b)| { + page[index] = (*a, *b); + index += 1; + }); + index + } else { + let mut index = 0; + vs.iter().zip(edges.iter()).take(P).for_each(|(a, b)| { + page[index] = (*a, *b); + index += 1; + }); + index + } + } + AdjSet::Large { vs } => { + if let Some(l) = last { + let mut index = 0; + vs.range(l..).skip(1).take(P).for_each(|(a, b)| { + page[index] = (*a, *b); + index += 1; + }); + index + } else { + let mut index = 0; + vs.iter().take(P).for_each(|(a, b)| { + page[index] = (*a, *b); + index += 1 + }); + index + } + } + } + } + pub fn get_page_vec(&self, last: Option, page_size: usize) -> Vec<(K, V)> { + match self { + AdjSet::Empty => vec![], + AdjSet::One(v, i) => { + if let Some(l) = last { + if l < *v { + vec![(*v, *i)] + } else { + vec![] + } + } else { + vec![(*v, *i)] + } + } + AdjSet::Small { vs, edges } => { + if let Some(l) = last { + let i = match vs.binary_search(&l) { + Ok(i) => i + 1, + Err(i) => i, + }; + + if i >= vs.len() { + return vec![]; + } + + vs[i..] 
+ .iter() + .zip(edges[i..].iter()) + .take(page_size) + .map(|(a, b)| (*a, *b)) + .collect() + } else { + vs.iter() + .zip(edges.iter()) + .take(page_size) + .map(|(a, b)| (*a, *b)) + .collect() + } + } + AdjSet::Large { vs } => { + if let Some(l) = last { + vs.range(l..) + .skip(1) + .take(page_size) + .map(|(a, b)| (*a, *b)) + .collect() + } else { + vs.iter().take(page_size).map(|(a, b)| (*a, *b)).collect() + } + } + } + } +} + +#[cfg(test)] +mod tadjset_tests { + use super::*; + + #[quickcheck] + fn insert_fuzz(input: Vec) -> bool { + let mut ts: AdjSet = AdjSet::default(); + + for (e, i) in input.iter().enumerate() { + ts.push(*i, e); + } + + let res = input.iter().all(|i| ts.find(*i).is_some()); + if !res { + let ts_vec: Vec<(usize, usize)> = ts.iter().collect(); + println!("Input: {:?}", input); + println!("TAdjSet: {:?}", ts_vec); + } + res + } + + #[test] + fn insert() { + let mut ts: AdjSet = AdjSet::default(); + + ts.push(7, 5); + let actual = ts.iter().collect::>(); + let expected: Vec<(usize, usize)> = vec![(7, 5)]; + assert_eq!(actual, expected) + } + + #[test] + fn insert_large() { + let mut ts: AdjSet = AdjSet::default(); + + for i in 0..SMALL_SET + 2 { + ts.push(i, i); + } + + for i in 0..SMALL_SET + 2 { + assert_eq!(ts.find(i), Some(i)); + } + } + + #[test] + fn insert_twice() { + let mut ts: AdjSet = AdjSet::default(); + + ts.push(7, 9); + ts.push(7, 9); + + let actual = ts.iter().collect::>(); + let expected: Vec<(usize, usize)> = vec![(7, 9)]; + assert_eq!(actual, expected); + } + + #[test] + fn insert_two_different() { + let mut ts: AdjSet = AdjSet::default(); + + ts.push(1, 0); + ts.push(7, 1); + + let actual = ts.iter().collect::>(); + let expected: Vec<(usize, usize)> = vec![(1, 0), (7, 1)]; + assert_eq!(actual, expected); + } +} diff --git a/raphtory/src/core/entities/vertices/structure/iter.rs b/raphtory/src/core/entities/vertices/structure/iter.rs new file mode 100644 index 0000000000..a54e0afa4b --- /dev/null +++ 
b/raphtory/src/core/entities/vertices/structure/iter.rs @@ -0,0 +1,92 @@ +use crate::core::{ + entities::{edges::edge::EdgeView, graph::tgraph::TGraph, VRef, EID, VID}, + Direction, +}; +use itertools::Merge; +use std::sync::Arc; + +pub struct Paged<'a, const N: usize> { + guard: Arc>, + data: Vec<(VID, EID)>, + i: usize, + size: usize, + dir: Direction, + layer_id: usize, + src: VID, + graph: &'a TGraph, +} + +impl<'a, const N: usize> Paged<'a, N> { + pub(crate) fn new( + guard: Arc>, + dir: Direction, + layer_id: usize, + src: VID, + graph: &'a TGraph, + ) -> Self { + Paged { + guard, + data: Vec::new(), + i: 0, + size: 16, + dir, + layer_id, + src, + graph, + } + } +} + +impl<'a, const N: usize> Iterator for Paged<'a, N> { + type Item = EdgeView<'a, N>; + + fn next(&mut self) -> Option { + if let Some(t) = self.data.get(self.i) { + self.i += 1; + let e_id = self.guard.edge_ref(t.1, self.graph); + let edge = EdgeView::from_edge_ids(self.src, t.0, e_id, self.dir, self.graph); + return Some(edge); + } + + if let Some(last) = self.data.last() { + self.data = self + .guard + .edges_from_last(self.layer_id, self.dir, Some(last.0), self.size) + } else { + // fetch the first page + self.data = self + .guard + .edges_from_last(self.layer_id, self.dir, None, self.size) + } + + if self.data.is_empty() { + return None; + } else { + self.i = 1; + let e_id = self.guard.edge_ref(self.data[0].1, self.graph); + return Some(EdgeView::from_edge_ids( + self.src, + self.data[0].0, + e_id, + self.dir, + self.graph, + )); + } + } +} + +pub enum PagedIter<'a, const N: usize> { + Page(Paged<'a, N>), + Merged(Merge, Paged<'a, N>>), +} + +impl<'a, const N: usize> Iterator for PagedIter<'a, N> { + type Item = EdgeView<'a, N>; + + fn next(&mut self) -> Option { + match self { + PagedIter::Page(p) => p.next(), + PagedIter::Merged(c) => c.next(), + } + } +} diff --git a/raphtory/src/core/entities/vertices/structure/mod.rs b/raphtory/src/core/entities/vertices/structure/mod.rs new file mode 
100644 index 0000000000..9eaadd3beb --- /dev/null +++ b/raphtory/src/core/entities/vertices/structure/mod.rs @@ -0,0 +1,3 @@ +pub mod adj; +pub mod adjset; +pub mod iter; diff --git a/raphtory/src/core/entities/vertices/vertex.rs b/raphtory/src/core/entities/vertices/vertex.rs new file mode 100644 index 0000000000..346aa97066 --- /dev/null +++ b/raphtory/src/core/entities/vertices/vertex.rs @@ -0,0 +1,169 @@ +use crate::core::{ + entities::{ + edges::{edge::EdgeView, edge_ref::EdgeRef, edge_store::EdgeStore}, + graph::tgraph::TGraph, + properties::{ + props::{DictMapper, Meta}, + tprop::TProp, + }, + vertices::{ + structure::iter::{Paged, PagedIter}, + vertex_store::VertexStore, + }, + LayerIds, VRef, VID, + }, + storage::{ + locked_view::LockedView, + timeindex::{TimeIndex, TimeIndexEntry, TimeIndexOps}, + ArcEntry, Entry, + }, + Direction, Prop, +}; +use itertools::Itertools; +use std::{ops::Range, sync::Arc}; + +pub struct Vertex<'a, const N: usize> { + node: VRef<'a, N>, + pub graph: &'a TGraph, +} + +impl<'a, const N: usize> Vertex<'a, N> { + pub fn id(&self) -> VID { + self.node.index().into() + } + + pub(crate) fn new(node: VRef<'a, N>, graph: &'a TGraph) -> Self { + Vertex { node, graph } + } + + pub(crate) fn from_entry(node: Entry<'a, VertexStore, N>, graph: &'a TGraph) -> Self { + Self::new(VRef::Entry(node), graph) + } + + pub fn temporal_properties( + &'a self, + prop_id: usize, + window: Option>, + ) -> impl Iterator + 'a { + self.node.temporal_properties(prop_id, window) + } + + pub fn neighbours<'b>( + &'a self, + layers: Vec<&'b str>, + dir: Direction, + ) -> impl Iterator> + 'a { + let layer_ids = layers + .iter() + .filter_map(|str| self.graph.vertex_meta.get_layer_id(str)) + .collect_vec(); + + (*self.node) + .neighbours(layer_ids.into(), dir) + .map(move |dst| self.graph.vertex(dst)) + } + + pub(crate) fn additions(self) -> Option>> { + match self.node { + VRef::Entry(entry) => { + let t_index = entry.map(|entry| entry.timestamps()); + 
Some(t_index) + } + _ => None, + } + } + + pub(crate) fn temporal_property(self, prop_id: usize) -> Option> { + match self.node { + VRef::Entry(entry) => { + entry.temporal_property(prop_id)?; + + let t_index = entry.map(|entry| entry.temporal_property(prop_id).unwrap()); + Some(t_index) + } + _ => None, + } + } +} + +impl<'a, const N: usize> IntoIterator for Vertex<'a, N> { + type Item = Vertex<'a, N>; + type IntoIter = std::iter::Once; + + fn into_iter(self) -> Self::IntoIter { + std::iter::once(self) + } +} + +pub struct ArcVertex { + e: ArcEntry, + meta: Arc, +} + +impl ArcVertex { + pub(crate) fn from_entry(e: ArcEntry, meta: Arc) -> Self { + ArcVertex { e, meta } + } + + pub fn edge_tuples( + &self, + layers: LayerIds, + dir: Direction, + ) -> impl Iterator + '_ { + self.e.edge_tuples(&layers, dir) + } + + pub fn neighbours(&self, layers: LayerIds, dir: Direction) -> impl Iterator + '_ { + self.e.neighbours(layers, dir) + } +} + +pub(crate) struct ArcEdge { + e: ArcEntry, + meta: Arc, +} + +impl ArcEdge { + pub(crate) fn from_entry(e: ArcEntry, meta: Arc) -> Self { + ArcEdge { e, meta } + } + + pub(crate) fn timestamps_and_layers( + &self, + layer: LayerIds, + ) -> impl Iterator + Send + '_ { + let adds = self.e.additions(); + adds.iter() + .enumerate() + .filter_map(|(layer_id, t)| { + layer + .find(layer_id) + .map(|l| t.iter().map(move |tt| (l, tt))) + }) + .kmerge_by(|a, b| a.1 < b.1) + } + + pub(crate) fn layers(&self) -> impl Iterator + '_ { + self.e.layer_ids_iter() + } + + pub(crate) fn layers_window(&self, w: Range) -> impl Iterator + '_ { + self.e.layer_ids_window_iter(w) + } + + pub(crate) fn timestamps_and_layers_window( + &self, + layer: LayerIds, + w: Range, + ) -> impl Iterator + '_ { + let adds = self.e.additions(); + adds.iter() + .enumerate() + .filter_map(|(layer_id, t)| { + layer + .find(layer_id) + .map(|l| t.range_iter(w.clone()).map(move |tt| (l, tt))) + }) + .kmerge_by(|a, b| a.1 < b.1) + } +} diff --git 
a/raphtory/src/core/entities/vertices/vertex_ref.rs b/raphtory/src/core/entities/vertices/vertex_ref.rs new file mode 100644 index 0000000000..8720f9aada --- /dev/null +++ b/raphtory/src/core/entities/vertices/vertex_ref.rs @@ -0,0 +1,27 @@ +use crate::core::entities::{vertices::input_vertex::InputVertex, VID}; + +#[derive(Copy, Clone, PartialOrd, PartialEq, Debug)] +pub enum VertexRef { + Internal(VID), + External(u64), +} + +impl VertexRef { + /// Makes a new vertex reference from an internal `VID`. + /// Values are unchecked and the vertex is assumed to exist so use with caution! + pub fn new(vid: VID) -> Self { + VertexRef::Internal(vid) + } +} + +impl From for VertexRef { + fn from(value: V) -> Self { + VertexRef::External(value.id()) + } +} + +impl From for VertexRef { + fn from(value: VID) -> Self { + VertexRef::Internal(value) + } +} diff --git a/raphtory/src/core/entities/vertices/vertex_store.rs b/raphtory/src/core/entities/vertices/vertex_store.rs new file mode 100644 index 0000000000..b49565f8a9 --- /dev/null +++ b/raphtory/src/core/entities/vertices/vertex_store.rs @@ -0,0 +1,458 @@ +use crate::{ + core::{ + entities::{ + edges::edge_ref::{Dir, EdgeRef}, + properties::{props::Props, tprop::TProp}, + vertices::structure::{adj, adj::Adj}, + LayerIds, EID, VID, + }, + storage::{ + iter::Iter, + lazy_vec::IllegalSet, + timeindex::{AsTime, TimeIndex, TimeIndexEntry, TimeIndexOps}, + ArcEntry, + }, + utils::errors::{GraphError, MutateGraphError}, + Direction, Prop, + }, + prelude::Graph, +}; +use itertools::Itertools; +use serde::{Deserialize, Serialize}; +use std::{ + iter, + ops::{Deref, Range}, + sync::Arc, +}; + +#[derive(Serialize, Deserialize, Debug, Default, PartialEq)] +pub struct VertexStore { + pub(crate) global_id: u64, + pub(crate) name: Option, + pub(crate) vid: VID, + // all the timestamps that have been seen by this vertex + timestamps: TimeIndex, + // each layer represents a separate view of the graph + pub(crate) layers: Vec, + // props for 
vertex + pub(crate) props: Option, +} + +impl VertexStore { + pub fn new(global_id: u64, t: TimeIndexEntry) -> Self { + let mut layers = Vec::with_capacity(1); + layers.push(Adj::Solo); + Self { + global_id, + name: None, + vid: 0.into(), + timestamps: TimeIndex::one(*t.t()), + layers, + props: None, + } + } + + pub fn empty(global_id: u64, name: Option) -> Self { + let mut layers = Vec::with_capacity(1); + layers.push(Adj::Solo); + Self { + global_id, + name, + vid: VID(0), + timestamps: TimeIndex::Empty, + layers, + props: None, + } + } + + pub fn global_id(&self) -> u64 { + self.global_id + } + + pub fn timestamps(&self) -> &TimeIndex { + &self.timestamps + } + + pub fn update_time(&mut self, t: TimeIndexEntry) { + self.timestamps.insert(*t.t()); + } + + pub fn update_name(&mut self, name: &str) { + match &self.name { + None => { + self.name = Some(name.to_owned()); + } + Some(old) => debug_assert_eq!(old, name), // one-to-one mapping between name and id, name should never change + } + } + + pub fn add_prop( + &mut self, + t: TimeIndexEntry, + prop_id: usize, + prop: Prop, + ) -> Result<(), GraphError> { + let props = self.props.get_or_insert_with(Props::new); + props.add_prop(t, prop_id, prop) + } + + pub fn add_constant_prop( + &mut self, + prop_id: usize, + prop: Prop, + ) -> Result<(), IllegalSet>> { + let props = self.props.get_or_insert_with(Props::new); + props.add_constant_prop(prop_id, prop) + } + + #[inline(always)] + pub(crate) fn find_edge(&self, dst: VID, layer_id: &LayerIds) -> Option { + match layer_id { + LayerIds::All => match self.layers.len() { + 0 => None, + 1 => self.layers[0].get_edge(dst, Direction::OUT), + _ => self + .layers + .iter() + .find_map(|layer| layer.get_edge(dst, Direction::OUT)), + }, + LayerIds::One(layer_id) => self + .layers + .get(*layer_id) + .and_then(|layer| layer.get_edge(dst, Direction::OUT)), + LayerIds::Multiple(layers) => layers.iter().find_map(|layer_id| { + self.layers + .get(*layer_id) + .and_then(|layer| 
layer.get_edge(dst, Direction::OUT)) + }), + LayerIds::None => None, + } + } + + pub(crate) fn add_edge(&mut self, v_id: VID, dir: Direction, layer: usize, edge_id: EID) { + if layer >= self.layers.len() { + self.layers.resize_with(layer + 1, || Adj::Solo); + } + + match dir { + Direction::IN => self.layers[layer].add_edge_into(v_id, edge_id), + Direction::OUT => self.layers[layer].add_edge_out(v_id, edge_id), + _ => {} + } + } + + pub(crate) fn temporal_properties( + &self, + prop_id: usize, + window: Option>, + ) -> impl Iterator + '_ { + if let Some(window) = window { + self.props + .as_ref() + .map(|ps| ps.temporal_props_window(prop_id, window.start, window.end)) + .unwrap_or_else(|| Box::new(iter::empty())) + } else { + self.props + .as_ref() + .map(|ps| ps.temporal_props(prop_id)) + .unwrap_or_else(|| Box::new(iter::empty())) + } + } + + pub(crate) fn const_prop(&self, prop_id: usize) -> Option<&Prop> { + self.props.as_ref().and_then(|ps| ps.const_prop(prop_id)) + } + + #[inline] + pub(crate) fn edge_tuples<'a>( + &'a self, + layers: &LayerIds, + d: Direction, + ) -> Box + Send + 'a> { + let self_id = self.vid; + let iter: Box + Send> = match d { + Direction::OUT => self.merge_layers(layers, Direction::OUT, self_id), + Direction::IN => self.merge_layers(layers, Direction::IN, self_id), + Direction::BOTH => Box::new( + self.edge_tuples(layers, Direction::OUT) + .merge_by(self.edge_tuples(layers, Direction::IN), |e1, e2| { + e1.remote() < e2.remote() + }), + ), + }; + iter + } + + fn merge_layers( + &self, + layers: &LayerIds, + d: Direction, + self_id: VID, + ) -> Box + Send + '_> { + match layers { + LayerIds::All => Box::new( + self.layers + .iter() + .map(|adj| self.iter_adj(adj, d, self_id)) + .kmerge_by(|e1, e2| e1.remote() < e2.remote()) + .dedup(), + ), + LayerIds::One(id) => { + if let Some(layer) = self.layers.get(*id) { + Box::new(self.iter_adj(layer, d, self_id)) + } else { + Box::new(iter::empty()) + } + } + LayerIds::Multiple(ids) => Box::new( + 
ids.iter() + .filter_map(|id| self.layers.get(*id)) + .map(|layer| self.iter_adj(layer, d, self_id)) + .kmerge_by(|e1, e2| e1.remote() < e2.remote()) + .dedup(), + ), + LayerIds::None => Box::new(iter::empty()), + } + } + + fn iter_adj<'a>( + &'a self, + layer: &'a Adj, + d: Direction, + self_id: VID, + ) -> impl Iterator + Send + '_ { + let iter: Box + Send> = match d { + Direction::IN => Box::new( + layer + .iter(d) + .map(move |(src_pid, e_id)| EdgeRef::new_incoming(e_id, src_pid, self_id)), + ), + Direction::OUT => Box::new( + layer + .iter(d) + .map(move |(dst_pid, e_id)| EdgeRef::new_outgoing(e_id, self_id, dst_pid)), + ), + _ => Box::new(iter::empty()), + }; + iter + } + + pub(crate) fn degree(&self, layers: &LayerIds, d: Direction) -> usize { + match layers { + LayerIds::All => match self.layers.len() { + 0 => 0, + 1 => self.layers[0].degree(d), + _ => self + .layers + .iter() + .map(|l| l.vertex_iter(d)) + .kmerge() + .dedup() + .count(), + }, + LayerIds::One(l) => self + .layers + .get(*l) + .map(|layer| layer.degree(d)) + .unwrap_or(0), + LayerIds::None => 0, + LayerIds::Multiple(ids) => ids + .iter() + .flat_map(|l_id| self.layers.get(*l_id).map(|layer| layer.vertex_iter(d))) + .kmerge() + .dedup() + .count(), + } + } + + // every neighbour apears once in the iterator + // this is important because it calculates degree + pub(crate) fn neighbours<'a>( + &'a self, + layers: LayerIds, + d: Direction, + ) -> Box + Send + 'a> { + match layers { + LayerIds::All => { + let iter = self + .layers + .iter() + .enumerate() + .map(|(layer_id, _)| self.neighbours(layer_id.into(), d)) + .kmerge() + .dedup(); + Box::new(iter) + } + LayerIds::One(one) => { + let iter = self + .layers + .get(one) + .map(|layer| self.neighbours_from_adj(layer, d, layers)) + .unwrap_or(Box::new(iter::empty())); + Box::new(iter) + } + LayerIds::Multiple(layers) => { + let iter = layers + .iter() + .filter_map(|l| self.layers.get(*l)) + .map(|layer| self.neighbours_from_adj(layer, d, 
layers.clone().into())) + .kmerge() + .dedup(); + Box::new(iter) + } + LayerIds::None => Box::new(iter::empty()), + } + } + + fn neighbours_from_adj<'a>( + &'a self, + layer: &'a Adj, + d: Direction, + layers: LayerIds, + ) -> Box + Send + '_> { + let iter: Box + Send> = match d { + Direction::IN => Box::new(layer.iter(d).map(|(from_v, _)| from_v)), + Direction::OUT => Box::new(layer.iter(d).map(|(to_v, _)| to_v)), + Direction::BOTH => Box::new( + self.neighbours(layers.clone(), Direction::OUT) + .merge(self.neighbours(layers, Direction::IN)) + .dedup(), + ), + }; + iter + } + + pub(crate) fn edges_from_last( + &self, + layer_id: usize, + dir: Direction, + last: Option, + page_size: usize, + ) -> Vec<(VID, EID)> { + self.layers[layer_id].get_page_vec(last, page_size, dir) + } + + pub(crate) fn const_prop_ids(&self) -> impl Iterator + '_ { + self.props + .as_ref() + .into_iter() + .flat_map(|ps| ps.const_prop_ids()) + } + + pub(crate) fn temporal_property(&self, prop_id: usize) -> Option<&TProp> { + self.props.as_ref().and_then(|ps| ps.temporal_prop(prop_id)) + } + + pub(crate) fn temporal_prop_ids(&self) -> impl Iterator + '_ { + self.props + .as_ref() + .into_iter() + .flat_map(|ps| ps.temporal_prop_ids()) + } + + pub(crate) fn active(&self, w: Range) -> bool { + self.timestamps.active(w) + } +} + +impl ArcEntry { + pub fn into_layers(self) -> LockedLayers { + let len = self.layers.len(); + LockedLayers { + entry: self, + pos: 0, + len, + } + } + + pub fn into_layer(self, offset: usize) -> Option { + (offset < self.layers.len()).then_some(LockedLayer { + entry: self, + offset, + }) + } +} + +pub struct LockedLayers { + entry: ArcEntry, + pos: usize, + len: usize, +} + +impl Iterator for LockedLayers { + type Item = LockedLayer; + + fn next(&mut self) -> Option { + if self.pos < self.len { + let layer = LockedLayer { + entry: self.entry.clone(), + offset: self.pos, + }; + self.pos += 1; + Some(layer) + } else { + None + } + } + + fn size_hint(&self) -> (usize, 
Option) { + (self.len, Some(self.len)) + } +} + +pub struct LockedLayer { + entry: ArcEntry, + offset: usize, +} + +impl Deref for LockedLayer { + type Target = Adj; + + #[inline] + fn deref(&self) -> &Self::Target { + &self.entry.layers[self.offset] + } +} + +impl LockedLayer { + pub fn into_tuples(self, dir: Dir) -> PagedAdjIter<256> { + let mut page = [(VID(0), EID(0)); 256]; + let page_size = self.fill_page(None, &mut page, dir); + PagedAdjIter { + layer: self, + page, + page_offset: 0, + page_size, + dir, + } + } +} + +pub struct PagedAdjIter { + layer: LockedLayer, + page: [(VID, EID); P], + page_offset: usize, + page_size: usize, + dir: Dir, +} + +impl Iterator for PagedAdjIter

{ + type Item = (VID, EID); + + fn next(&mut self) -> Option { + if self.page_offset < self.page_size { + let item = self.page[self.page_offset]; + self.page_offset += 1; + Some(item) + } else if self.page_size == P { + // Was a full page, there may be more items + let last = self.page[P - 1].0; + self.page_offset = 0; + self.page_size = self.layer.fill_page(Some(last), &mut self.page, self.dir); + self.next() + } else { + // Was a partial page, no more items + None + } + } +} diff --git a/raphtory/src/core/lsm.rs b/raphtory/src/core/lsm.rs deleted file mode 100644 index d820469dc0..0000000000 --- a/raphtory/src/core/lsm.rs +++ /dev/null @@ -1,203 +0,0 @@ -//! A data structure for storing and querying temporal graph data using a Log-Structured Merge Tree (LSM). - -use std::fmt::Debug; - -use itertools::Itertools; -use serde::{Deserialize, Serialize}; - -static MERGE_SORT_SIZE: usize = 64; - -#[repr(transparent)] -#[derive(Debug, Serialize, Deserialize, Default)] -pub struct SortedVec { - vs: Vec, -} - -impl SortedVec { - pub fn insert(&mut self, k: K) { - match self.vs.binary_search(&k) { - Ok(i) | Err(i) => self.vs.insert(i, k), - } - } - - pub fn find(&self, k: K) -> Option<&K> { - self.vs.binary_search(&k).map(|i| &self.vs[i]).ok() - } - - pub fn new() -> Self { - SortedVec { vs: vec![] } - } -} - -//FIXME: naive LSM like implementation, add benches and more tests -#[derive(Debug, PartialEq, Default, Serialize, Deserialize)] -pub struct LSMSet { - vs: Vec, -} - -impl LSMSet { - pub fn new() -> Self { - LSMSet { vs: vec![] } - } - - pub fn len(&self) -> usize { - self.vs.len() // not technically correct - } - - pub fn insert(&mut self, k: K) { - // until we reach MERGE_SORT_SIZE elements we optimistically just add k to the end of the vec - self.vs.push(k); - - if self.vs.len() >= MERGE_SORT_SIZE - && (self.vs.len() - MERGE_SORT_SIZE) % MERGE_SORT_SIZE == 0 - { - // we need to sort the entire thing and dedup - self.vs.sort_unstable(); - // FIXME: why don't we have 
a sort and dedup? - self.vs.dedup(); - } - } - - fn sorted0(&self) -> &[K] { - &self.vs[0..self.vs.len() / MERGE_SORT_SIZE] - } - - fn unsorted0(&self) -> &[K] { - &self.vs[self.vs.len() / MERGE_SORT_SIZE..] - } - - /* - * - * find k otherwise find the smallest value that is greater than k - * - */ - fn find_local_unsorted<'a, 'b>(k: &'a K, unsorted: &'b [K]) -> Option<&'b K> { - let mut alt: Option<&K> = None; - - for k0 in unsorted.iter() { - if k0 == k { - // awesome - return Some(k0); - } else if k0 > k { - let next_k_alt = alt.get_or_insert(k0); - *next_k_alt = Ord::min(next_k_alt, k0); - } - } - - alt - } - - fn find_local<'a, 'b>(k: &'a K, sorted: &'b [K]) -> Option<&'b K> { - match sorted.binary_search(k) { - Ok(i) => Some(&sorted[i]), - Err(j) if j < sorted.len() => Some(&sorted[j]), - _ => None, - } - } - - pub fn find(&self, k: K) -> Option<&K> { - let a = Self::find_local_unsorted(&k, self.unsorted0()); - let b = Self::find_local(&k, self.sorted0()); - - match (a, b) { - (Some(a1), Some(b1)) => Some(Ord::min(a1, b1)), - (a1 @ Some(_), None) => a1, - (None, a1 @ Some(_)) => a1, - _ => None, - } - } - - pub fn iter(&self) -> Box + '_> { - Box::new( - [self.sorted_cur(), self.sorted()] - .into_iter() - .kmerge() - .dedup(), - ) - } - - fn sorted_cur(&self) -> Box + '_> { - Box::new(self.unsorted0().iter().sorted()) - } - - fn sorted(&self) -> Box + '_> { - Box::new(self.sorted0().iter()) - } -} - -impl> From for LSMSet { - fn from(i: I) -> Self { - let new_sorted = i.sorted().collect_vec(); - LSMSet { vs: new_sorted } - } -} - -#[cfg(test)] -mod lsmset_tests { - use std::collections::BTreeSet; - - use super::*; - - #[test] - fn insert() { - let mut s = LSMSet::default(); - - s.insert(4); - s.insert(9); - s.insert(1); - } - - #[test] - fn insert_find() { - let mut s = LSMSet::default(); - - s.insert((4, 1)); - s.insert((4, 4)); - s.insert((1, 1)); - s.insert((1, 2)); - s.insert((4, 3)); - - assert_eq!(s.find((4, 1)), Some(&(4, 1))); - assert_eq!(s.find((1, 
2)), Some(&(1, 2))); - assert_eq!(s.find((1, 3)), Some(&(4, 1))); - assert_eq!(s.find((1, 2)), Some(&(1, 2))); - - let mut ss = BTreeSet::default(); - - ss.insert((4, 1)); - ss.insert((4, 4)); - ss.insert((1, 1)); - ss.insert((1, 2)); - ss.insert((4, 3)); - - assert_eq!(ss.range((4, 2)..).next(), Some(&(4, 3))); - - assert_eq!(s.find((4, 2)), Some(&(4, 3))); - assert_eq!(s.find((1, 3)), Some(&(4, 1))); - } - - #[test] - fn iter() { - let mut s = LSMSet::default(); - - s.insert((4, 1)); - s.insert((4, 4)); - s.insert((1, 1)); - s.insert((1, 2)); - s.insert((4, 3)); - - let all = s.iter().collect_vec(); - - assert_eq!(all, vec![&(1, 1), &(1, 2), &(4, 1), &(4, 3), &(4, 4)]) - } - - #[test] - fn example() { - let mut ss = BTreeSet::default(); - - ss.insert((1, 2)); - - let expected: Option<&(i32, i32)> = None; - assert_eq!(ss.range((4, 2)..).next(), expected); - } -} diff --git a/raphtory/src/core/misc.rs b/raphtory/src/core/misc.rs deleted file mode 100644 index 8b13789179..0000000000 --- a/raphtory/src/core/misc.rs +++ /dev/null @@ -1 +0,0 @@ - diff --git a/raphtory/src/core/mod.rs b/raphtory/src/core/mod.rs index 99e6868f52..27b295d126 100644 --- a/raphtory/src/core/mod.rs +++ b/raphtory/src/core/mod.rs @@ -24,49 +24,120 @@ //! * `macOS` //! 
-use crate::db::graph::Graph; -use crate::db::view_api::GraphViewOps; +use crate::db::{api::view::GraphViewOps, graph::graph::Graph}; use chrono::NaiveDateTime; use serde::{Deserialize, Serialize}; -use std::fmt; +use std::{ + borrow::Borrow, + cmp::Ordering, + collections::HashMap, + fmt, + fmt::{Display, Formatter}, + ops::Deref, + sync::Arc, +}; #[cfg(test)] extern crate core; -mod adj; -pub mod agg; -mod edge_layer; -pub mod edge_ref; -mod lazy_vec; -pub mod lsm; -mod props; -mod sorted_vec_map; +pub mod entities; pub mod state; -pub mod tadjset; -mod tcell; -pub mod tgraph; -pub mod tgraph_shard; -pub mod time; -pub mod timeindex; -mod tprop; +pub(crate) mod storage; pub mod utils; -pub mod vertex; -pub mod vertex_ref; -type Time = i64; +/// this is here because Arc annoyingly doesn't implement all the expected comparisons +#[derive(Clone, Debug, Eq, Ord, Hash, Serialize, Deserialize)] +pub struct ArcStr(pub(crate) Arc); + +impl Display for ArcStr { + fn fmt(&self, f: &mut Formatter<'_>) -> fmt::Result { + Display::fmt(&self.0, f) + } +} + +impl>> From for ArcStr { + fn from(value: T) -> Self { + ArcStr(value.into()) + } +} + +impl From for String { + fn from(value: ArcStr) -> Self { + value.to_string() + } +} +impl Deref for ArcStr { + type Target = Arc; + + #[inline] + fn deref(&self) -> &Self::Target { + &self.0 + } +} + +impl Borrow for ArcStr { + #[inline] + fn borrow(&self) -> &str { + self.0.borrow() + } +} + +impl AsRef for ArcStr +where + T: ?Sized, + ::Target: AsRef, +{ + fn as_ref(&self) -> &T { + self.deref().as_ref() + } +} + +impl + ?Sized> PartialEq for ArcStr { + fn eq(&self, other: &T) -> bool { + >::borrow(self).eq(other.borrow()) + } +} + +impl> PartialOrd for ArcStr { + fn partial_cmp(&self, other: &T) -> Option { + >::borrow(self).partial_cmp(other.borrow()) + } +} /// Denotes the direction of an edge. Can be incoming, outgoing or both. 
-#[derive(Clone, Copy, PartialEq, Debug)] +#[derive(Clone, Copy, PartialEq, PartialOrd, Debug)] pub enum Direction { OUT, IN, BOTH, } +#[derive(Copy, Clone, PartialEq, Eq, Debug, Default, Serialize, Deserialize)] +pub enum PropType { + #[default] + Empty, + Str, + U8, + U16, + I32, + I64, + U32, + U64, + F32, + F64, + Bool, + List, + Map, + DTime, + Graph, +} + /// Denotes the types of properties allowed to be stored in the graph. #[derive(Debug, Serialize, Deserialize, PartialEq, Clone)] pub enum Prop { - Str(String), + Str(ArcStr), + U8(u8), + U16(u16), I32(i32), I64(i64), U32(u32), @@ -74,13 +145,98 @@ pub enum Prop { F32(f32), F64(f64), Bool(bool), + List(Arc>), + Map(Arc>), DTime(NaiveDateTime), Graph(Graph), } +impl PartialOrd for Prop { + fn partial_cmp(&self, other: &Self) -> Option { + match (self, other) { + (Prop::Str(a), Prop::Str(b)) => a.partial_cmp(b), + (Prop::U8(a), Prop::U8(b)) => a.partial_cmp(b), + (Prop::U16(a), Prop::U16(b)) => a.partial_cmp(b), + (Prop::I32(a), Prop::I32(b)) => a.partial_cmp(b), + (Prop::I64(a), Prop::I64(b)) => a.partial_cmp(b), + (Prop::U32(a), Prop::U32(b)) => a.partial_cmp(b), + (Prop::U64(a), Prop::U64(b)) => a.partial_cmp(b), + (Prop::F32(a), Prop::F32(b)) => a.partial_cmp(b), + (Prop::F64(a), Prop::F64(b)) => a.partial_cmp(b), + (Prop::Bool(a), Prop::Bool(b)) => a.partial_cmp(b), + (Prop::DTime(a), Prop::DTime(b)) => a.partial_cmp(b), + _ => None, + } + } +} + +impl Prop { + pub fn dtype(&self) -> PropType { + match self { + Prop::Str(_) => PropType::Str, + Prop::U8(_) => PropType::U8, + Prop::U16(_) => PropType::U16, + Prop::I32(_) => PropType::I32, + Prop::I64(_) => PropType::I64, + Prop::U32(_) => PropType::U32, + Prop::U64(_) => PropType::U64, + Prop::F32(_) => PropType::F32, + Prop::F64(_) => PropType::F64, + Prop::Bool(_) => PropType::Bool, + Prop::List(_) => PropType::List, + Prop::Map(_) => PropType::Map, + Prop::DTime(_) => PropType::DTime, + Prop::Graph(_) => PropType::Graph, + } + } + + pub fn str>(s: S) -> 
Prop { + Prop::Str(s.into()) + } + + pub fn add(self, other: Prop) -> Option { + match (self, other) { + (Prop::U8(a), Prop::U8(b)) => Some(Prop::U8(a + b)), + (Prop::U16(a), Prop::U16(b)) => Some(Prop::U16(a + b)), + (Prop::I32(a), Prop::I32(b)) => Some(Prop::I32(a + b)), + (Prop::I64(a), Prop::I64(b)) => Some(Prop::I64(a + b)), + (Prop::U32(a), Prop::U32(b)) => Some(Prop::U32(a + b)), + (Prop::U64(a), Prop::U64(b)) => Some(Prop::U64(a + b)), + (Prop::F32(a), Prop::F32(b)) => Some(Prop::F32(a + b)), + (Prop::F64(a), Prop::F64(b)) => Some(Prop::F64(a + b)), + (Prop::Str(a), Prop::Str(b)) => Some(Prop::Str((a.to_string() + &b).into())), + _ => None, + } + } + + pub fn divide(self, other: Prop) -> Option { + match (self, other) { + (Prop::U8(a), Prop::U8(b)) if b != 0 => Some(Prop::U8(a / b)), + (Prop::U16(a), Prop::U16(b)) if b != 0 => Some(Prop::U16(a / b)), + (Prop::I32(a), Prop::I32(b)) if b != 0 => Some(Prop::I32(a / b)), + (Prop::I64(a), Prop::I64(b)) if b != 0 => Some(Prop::I64(a / b)), + (Prop::U32(a), Prop::U32(b)) if b != 0 => Some(Prop::U32(a / b)), + (Prop::U64(a), Prop::U64(b)) if b != 0 => Some(Prop::U64(a / b)), + (Prop::F32(a), Prop::F32(b)) if b != 0.0 => Some(Prop::F32(a / b)), + (Prop::F64(a), Prop::F64(b)) if b != 0.0 => Some(Prop::F64(a / b)), + _ => None, + } + } +} + pub trait PropUnwrap: Sized { - fn into_str(self) -> Option; - fn unwrap_str(self) -> String { + fn into_u8(self) -> Option; + fn unwrap_u8(self) -> u8 { + self.into_u8().unwrap() + } + + fn into_u16(self) -> Option; + fn unwrap_u16(self) -> u16 { + self.into_u16().unwrap() + } + + fn into_str(self) -> Option; + fn unwrap_str(self) -> ArcStr { self.into_str().unwrap() } @@ -119,6 +275,16 @@ pub trait PropUnwrap: Sized { self.into_bool().unwrap() } + fn into_list(self) -> Option>>; + fn unwrap_list(self) -> Arc> { + self.into_list().unwrap() + } + + fn into_map(self) -> Option>>; + fn unwrap_map(self) -> Arc> { + self.into_map().unwrap() + } + fn into_dtime(self) -> Option; fn 
unwrap_dtime(self) -> NaiveDateTime { self.into_dtime().unwrap() @@ -131,7 +297,15 @@ pub trait PropUnwrap: Sized { } impl PropUnwrap for Option

{ - fn into_str(self) -> Option { + fn into_u8(self) -> Option { + self.and_then(|p| p.into_u8()) + } + + fn into_u16(self) -> Option { + self.and_then(|p| p.into_u16()) + } + + fn into_str(self) -> Option { self.and_then(|p| p.into_str()) } @@ -163,6 +337,14 @@ impl PropUnwrap for Option

{ self.and_then(|p| p.into_bool()) } + fn into_list(self) -> Option>> { + self.and_then(|p| p.into_list()) + } + + fn into_map(self) -> Option>> { + self.and_then(|p| p.into_map()) + } + fn into_dtime(self) -> Option { self.and_then(|p| p.into_dtime()) } @@ -173,7 +355,23 @@ impl PropUnwrap for Option

{ } impl PropUnwrap for Prop { - fn into_str(self) -> Option { + fn into_u8(self) -> Option { + if let Prop::U8(s) = self { + Some(s) + } else { + None + } + } + + fn into_u16(self) -> Option { + if let Prop::U16(s) = self { + Some(s) + } else { + None + } + } + + fn into_str(self) -> Option { if let Prop::Str(s) = self { Some(s) } else { @@ -237,6 +435,22 @@ impl PropUnwrap for Prop { } } + fn into_list(self) -> Option>> { + if let Prop::List(v) = self { + Some(v) + } else { + None + } + } + + fn into_map(self) -> Option>> { + if let Prop::Map(v) = self { + Some(v) + } else { + None + } + } + fn into_dtime(self) -> Option { if let Prop::DTime(v) = self { Some(v) @@ -258,6 +472,8 @@ impl fmt::Display for Prop { fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result { match self { Prop::Str(value) => write!(f, "{}", value), + Prop::U8(value) => write!(f, "{}", value), + Prop::U16(value) => write!(f, "{}", value), Prop::I32(value) => write!(f, "{}", value), Prop::I64(value) => write!(f, "{}", value), Prop::U32(value) => write!(f, "{}", value), @@ -269,9 +485,179 @@ impl fmt::Display for Prop { Prop::Graph(value) => write!( f, "Graph(num_vertices={}, num_edges={})", - value.num_vertices(), - value.num_edges() + value.count_vertices(), + value.count_edges() ), + Prop::List(value) => { + write!(f, "{:?}", value) + } + Prop::Map(value) => { + write!(f, "{:?}", value) + } } } } + +// From impl for Prop + +impl From for Prop { + fn from(value: ArcStr) -> Self { + Prop::Str(value) + } +} + +impl From<&ArcStr> for Prop { + fn from(value: &ArcStr) -> Self { + Prop::Str(value.clone()) + } +} + +impl From for Prop { + fn from(value: String) -> Self { + Prop::Str(value.into()) + } +} +impl From<&String> for Prop { + fn from(s: &String) -> Self { + Prop::Str(s.as_str().into()) + } +} + +impl From> for Prop { + fn from(s: Arc) -> Self { + Prop::Str(s.into()) + } +} + +impl From<&Arc> for Prop { + fn from(value: &Arc) -> Self { + Prop::Str(value.clone().into()) + } +} + +impl 
From<&str> for Prop { + fn from(s: &str) -> Self { + Prop::Str(s.to_owned().into()) + } +} + +impl From for Prop { + fn from(i: i32) -> Self { + Prop::I32(i) + } +} + +impl From for Prop { + fn from(i: u8) -> Self { + Prop::U8(i) + } +} + +impl From for Prop { + fn from(i: u16) -> Self { + Prop::U16(i) + } +} + +impl From for Prop { + fn from(i: i64) -> Self { + Prop::I64(i) + } +} + +impl From for Prop { + fn from(u: u32) -> Self { + Prop::U32(u) + } +} + +impl From for Prop { + fn from(u: u64) -> Self { + Prop::U64(u) + } +} + +impl From for Prop { + fn from(f: f32) -> Self { + Prop::F32(f) + } +} + +impl From for Prop { + fn from(f: f64) -> Self { + Prop::F64(f) + } +} + +impl From for Prop { + fn from(b: bool) -> Self { + Prop::Bool(b) + } +} + +impl From> for Prop { + fn from(value: HashMap) -> Self { + Prop::Map(Arc::new(value)) + } +} + +impl From> for Prop { + fn from(value: Vec) -> Self { + Prop::List(Arc::new(value)) + } +} + +impl From<&Prop> for Prop { + fn from(value: &Prop) -> Self { + value.clone() + } +} + +pub trait IntoPropMap { + fn into_prop_map(self) -> Prop; +} + +impl, K: Into, V: Into> IntoPropMap for I { + fn into_prop_map(self) -> Prop { + Prop::Map(Arc::new( + self.into_iter() + .map(|(k, v)| (k.into(), v.into())) + .collect(), + )) + } +} + +pub trait IntoPropList { + fn into_prop_list(self) -> Prop; +} + +impl, K: Into> IntoPropList for I { + fn into_prop_list(self) -> Prop { + Prop::List(Arc::new(self.into_iter().map(|v| v.into()).collect())) + } +} + +pub trait IntoProp { + fn into_prop(self) -> Prop; +} + +impl> IntoProp for T { + fn into_prop(self) -> Prop { + self.into() + } +} + +#[cfg(test)] +mod test_arc_str { + use crate::core::ArcStr; + use std::sync::Arc; + + #[test] + fn can_compare_with_str() { + let test: ArcStr = "test".into(); + assert_eq!(test, "test"); + assert_eq!(test, "test".to_string()); + assert_eq!(test, Arc::from("test")); + assert_eq!(&test, &"test".to_string()) + } +} diff --git a/raphtory/src/core/props.rs 
b/raphtory/src/core/props.rs deleted file mode 100644 index 3737f8f986..0000000000 --- a/raphtory/src/core/props.rs +++ /dev/null @@ -1,298 +0,0 @@ -use crate::core::lazy_vec::{IllegalSet, LazyVec}; -use crate::core::tprop::TProp; -use crate::core::Prop; -use itertools::Itertools; -use serde::{Deserialize, Serialize}; -use std::collections::HashMap; -use std::fmt::Debug; - -#[derive(thiserror::Error, Debug, PartialEq)] -#[error("cannot mutate static property '{name}'")] -pub struct IllegalMutate { - pub name: String, - pub source: IllegalSet>, -} - -impl IllegalMutate { - fn from(source: IllegalSet>, props: &Props) -> IllegalMutate { - let id = PropId::Static(source.index); - IllegalMutate { - name: props.reverse_id(&id).to_string(), - source, - } - } -} - -#[derive(Debug, Serialize, Deserialize, PartialEq, Eq, Hash, Clone)] -enum PropId { - Static(usize), - Temporal(usize), -} - -impl PropId { - #[allow(dead_code)] - pub(crate) fn new(id: usize, static_: bool) -> PropId { - if static_ { - PropId::Static(id) - } else { - PropId::Temporal(id) - } - } - pub(crate) fn get_id(&self) -> usize { - match self { - PropId::Static(id) => *id, - PropId::Temporal(id) => *id, - } - } - pub(crate) fn is_static(&self) -> bool { - match self { - PropId::Static(_) => true, - PropId::Temporal(_) => false, - } - } -} - -#[derive(Default, Debug, Serialize, Deserialize, PartialEq)] -pub(crate) struct Props { - // Mapping between property name and property id - prop_ids: HashMap, // TODO: change name back to prop_ids - - // Vector of vertices properties. 
Each index represents vertex local (physical) id - static_props: Vec>>, - temporal_props: Vec>, -} - -impl Props { - // GETTERS: - - fn get_prop_id(&self, name: &str, should_be_static: bool) -> Option { - match self.prop_ids.get(name) { - Some(prop_id) if prop_id.is_static() == should_be_static => Some(prop_id.get_id()), - _ => None, - } - } - - #[allow(unused_variables)] - fn reverse_id(&self, id: &PropId) -> &str { - self.prop_ids.iter().find(|&(k, v)| v == id).unwrap().0 - } - - fn get_or_default(&self, vector: &Vec>, id: usize, name: &str) -> A - where - A: PartialEq + Default + Clone + Debug, - { - match self.get_prop_id(name, true) { - Some(prop_id) => { - let props = vector.get(id).unwrap_or(&LazyVec::Empty); - props.get(prop_id).cloned().unwrap_or(Default::default()) - } - None => Default::default(), - } - } - - pub(crate) fn static_prop(&self, id: usize, name: &str) -> Option { - self.get_or_default(&self.static_props, id, name) - } - - pub(crate) fn temporal_prop(&self, id: usize, name: &str) -> Option<&TProp> { - // TODO: we should be able to use self.get_or_default() here - let prop_id = self.get_prop_id(name, false)?; - let props = self.temporal_props.get(id).unwrap_or(&LazyVec::Empty); - props.get(prop_id) - } - - fn get_names( - &self, - vector: &Vec>, - id: usize, - should_be_static: bool, - ) -> Vec - where - A: Clone + Default + PartialEq + Debug, - { - match vector.get(id) { - Some(props) => { - let ids = props.filled_ids().into_iter(); - if should_be_static { - ids.map(|id| self.reverse_id(&PropId::Static(id)).to_string()) - .collect_vec() - } else { - ids.map(|id| self.reverse_id(&PropId::Temporal(id)).to_string()) - .collect_vec() - } - } - None => vec![], - } - } - - pub fn static_names(&self, id: usize) -> Vec { - self.get_names(&self.static_props, id, true) - } - - pub fn temporal_names(&self, id: usize) -> Vec { - self.get_names(&self.temporal_props, id, false) - } - - // SETTERS: - - fn grow_and_get_slot(vector: &mut Vec, id: usize) -> 
&mut A - where - A: Default, - { - if vector.len() <= id { - vector.resize_with(id + 1, || Default::default()); - } - // now props_storage.len() >= id + 1: - vector.get_mut(id).unwrap() - } - - fn get_or_allocate_id(&mut self, name: &str, should_be_static: bool) -> Result { - match self.prop_ids.get(name) { - None => { - let new_prop_id = if should_be_static { - let static_prop_ids = self.prop_ids.iter().filter(|&(_, v)| v.is_static()); - let new_id = static_prop_ids.count(); - PropId::Static(new_id) - } else { - let static_prop_ids = self.prop_ids.iter().filter(|&(_, v)| !v.is_static()); - let new_id = static_prop_ids.count(); - PropId::Temporal(new_id) - }; - self.prop_ids.insert(name.to_string(), new_prop_id.clone()); - Ok(new_prop_id.get_id()) - } - Some(id) if id.is_static() == should_be_static => Ok(id.get_id()), - _ => Err(()), - } - } - - fn translate_props( - &mut self, - props: &Vec<(String, Prop)>, - should_be_static: bool, - ) -> Vec<(usize, Prop)> { - // TODO: return Result - props - .iter() - .map(|(name, prop)| { - ( - self.get_or_allocate_id(name, should_be_static).unwrap(), - prop.clone(), - ) - }) - .collect_vec() - } - - pub fn upsert_temporal_props(&mut self, t: i64, id: usize, props: &Vec<(String, Prop)>) { - if !props.is_empty() { - let translated_props = self.translate_props(props, false); - let vertex_slot: &mut LazyVec = - Self::grow_and_get_slot(&mut self.temporal_props, id); - for (prop_id, prop) in translated_props { - vertex_slot.update_or_set(prop_id, |p| p.set(t, &prop), TProp::from(t, &prop)); - } - } - } - - pub fn set_static_props( - &mut self, - id: usize, - props: &Vec<(String, Prop)>, - ) -> Result<(), IllegalMutate> { - if !props.is_empty() { - let translated_props = self.translate_props(props, true); - let vertex_slot: &mut LazyVec> = - Self::grow_and_get_slot(&mut self.static_props, id); - for (prop_id, prop) in translated_props { - if let Err(e) = vertex_slot.set(prop_id, Some(prop)) { - return Err(IllegalMutate::from(e, 
&self)); - } - } - } - Ok(()) - } -} - -#[cfg(test)] -mod props_tests { - use super::*; - - #[test] - fn return_prop_id_if_prop_name_found() { - let mut props = Props::default(); - props - .prop_ids - .insert(String::from("key1"), PropId::Temporal(0)); - props - .prop_ids - .insert(String::from("key2"), PropId::Temporal(1)); - - assert_eq!(props.get_or_allocate_id("key2", false), Ok(1)); - } - - #[test] - fn return_new_prop_id_if_prop_name_not_found() { - let mut props = Props::default(); - assert_eq!(props.get_or_allocate_id("key1", false), Ok(0)); - assert_eq!(props.get_or_allocate_id("key2", false), Ok(1)); - } - - #[test] - fn insert_new_vertex_prop() { - let mut props = Props::default(); - props.upsert_temporal_props(1, 0, &vec![("bla".to_string(), Prop::I32(10))]); - - let prop_id = props.get_or_allocate_id("bla", false).unwrap(); - assert_eq!( - props - .temporal_props - .get(0) - .unwrap() - .get(prop_id) - .unwrap() - .iter() - .collect::>(), - vec![(&1, Prop::I32(10))] - ) - } - - #[test] - fn update_existing_vertex_prop() { - let mut props = Props::default(); - props.upsert_temporal_props(1, 0, &vec![("bla".to_string(), Prop::I32(10))]); - props.upsert_temporal_props(2, 0, &vec![("bla".to_string(), Prop::I32(10))]); - - let prop_id = props.get_or_allocate_id("bla", false).unwrap(); - assert_eq!( - props - .temporal_props - .get(0) - .unwrap() - .get(prop_id) - .unwrap() - .iter() - .collect::>(), - vec![(&1, Prop::I32(10)), (&2, Prop::I32(10))] - ) - } - - #[test] - fn new_update_with_the_same_time_to_a_vertex_prop_is_ignored() { - let mut props = Props::default(); - props.upsert_temporal_props(1, 0, &vec![("bla".to_string(), Prop::I32(10))]); - props.upsert_temporal_props(1, 0, &vec![("bla".to_string(), Prop::I32(20))]); - - let prop_id = props.get_or_allocate_id("bla", false).unwrap(); - assert_eq!( - props - .temporal_props - .get(0) - .unwrap() - .get(prop_id) - .unwrap() - .iter() - .collect::>(), - vec![(&1, Prop::I32(10))] - ) - } -} diff --git 
a/raphtory/src/core/state/accumulator_id.rs b/raphtory/src/core/state/accumulator_id.rs index 74779d2894..96ad01e743 100644 --- a/raphtory/src/core/state/accumulator_id.rs +++ b/raphtory/src/core/state/accumulator_id.rs @@ -1,4 +1,4 @@ -use crate::core::agg::{Accumulator, Init, InitAcc}; +use crate::core::state::agg::{Accumulator, Init, InitAcc}; #[derive(Debug)] pub struct AccId> { @@ -39,13 +39,13 @@ unsafe impl> Sync for AccId: Send + Sync + 'static { fn zero() -> A; @@ -404,8 +403,9 @@ mod agg_test { #[test] fn avg_def() { - use crate::core::agg::{ - topk::TopK, topk::TopKHeap, Accumulator, AvgDef, MaxDef, MinDef, SumDef, + use super::{ + topk::{TopK, TopKHeap}, + Accumulator, AvgDef, MaxDef, MinDef, SumDef, }; let mut avg = AvgDef::::zero(); diff --git a/raphtory/src/core/state/compute_state.rs b/raphtory/src/core/state/compute_state.rs index d440c86572..771a805287 100644 --- a/raphtory/src/core/state/compute_state.rs +++ b/raphtory/src/core/state/compute_state.rs @@ -1,13 +1,9 @@ -use rustc_hash::FxHashMap; -use std::collections::HashMap; - -use crate::core::vertex_ref::LocalVertexRef; -use crate::{core::agg::Accumulator, db::view_api::internal::GraphViewInternalOps}; - use super::{ - container::{merge_2_vecs, DynArray, MapArray, VecArray}, + container::{merge_2_vecs, DynArray, VecArray}, StateType, }; +use crate::{core::state::agg::Accumulator, db::api::view::GraphViewOps}; +use std::collections::HashMap; pub trait ComputeState: std::fmt::Debug + Clone + Send + Sync { fn clone_current_into_other(&mut self, ss: usize); @@ -30,10 +26,7 @@ pub trait ComputeState: std::fmt::Debug + Clone + Send + Sync { i: usize, ) -> Option<&A>; - fn iter(&self, ss: usize) -> Box + '_>; - - fn iter_keys(&self) -> Box + '_>; - fn iter_keys_changed(&self, ss: usize) -> Box + '_>; + fn iter(&self, ss: usize, extend_to: usize) -> Box + '_>; fn agg>(&mut self, ss: usize, a: IN, ki: usize) where @@ -47,10 +40,9 @@ pub trait ComputeState: std::fmt::Debug + Clone + Send + Sync { where 
A: StateType; - fn finalize, G: GraphViewInternalOps>( + fn finalize, G: GraphViewOps>( &self, ss: usize, - shard_id: usize, g: &G, ) -> HashMap where @@ -65,186 +57,6 @@ pub trait ComputeState: std::fmt::Debug + Clone + Send + Sync { OUT: StateType; } -#[derive(Debug)] -pub struct ComputeStateMap(Box); - -impl ComputeStateMap { - fn current_mut(&mut self) -> &mut dyn DynArray { - self.0.as_mut() - } - - fn current(&self) -> &dyn DynArray { - self.0.as_ref() - } -} - -impl Clone for ComputeStateMap { - fn clone(&self) -> Self { - ComputeStateMap(self.0.clone_array()) - } -} - -impl ComputeState for ComputeStateMap { - fn clone_current_into_other(&mut self, ss: usize) { - self.0.copy_over(ss); - } - - fn reset_resetable_states(&mut self, ss: usize) { - self.0.reset(ss); - } - - fn new_mutable_primitive(zero: T) -> Self { - ComputeStateMap(Box::new(MapArray:: { - map: FxHashMap::default(), - zero, - })) - } - - fn read>( - &self, - ss: usize, - i: usize, - ) -> Option - where - OUT: std::fmt::Debug, - { - let current = self - .current() - .as_any() - .downcast_ref::>() - .unwrap(); - - current - .map - .get(&(i as u64)) - .map(|v| ACC::finish(&v[ss % 2])) - } - - fn read_ref>( - &self, - ss: usize, - i: usize, - ) -> Option<&A> { - let current = self - .current() - .as_any() - .downcast_ref::>() - .unwrap(); - current.map.get(&(i as u64)).map(|v| &v[ss % 2]) - } - - fn iter(&self, ss: usize) -> Box + '_> { - let current = self - .current() - .as_any() - .downcast_ref::>() - .unwrap(); - Box::new( - current - .map - .iter() - .map(move |(k, v)| (*k as usize, &v[ss % 2])), - ) - } - - fn iter_keys(&self) -> Box + '_> { - self.current().iter_keys() - } - - fn iter_keys_changed(&self, ss: usize) -> Box + '_> { - self.current().iter_keys_changed(ss) - } - - fn agg>(&mut self, ss: usize, a: IN, i: usize) - where - A: StateType, - { - let current = self - .current_mut() - .as_mut_any() - .downcast_mut::>() - .unwrap(); - let entry = current - .map - .entry(i as u64) - 
.or_insert_with(|| [current.zero.clone(), current.zero.clone()]); - ACC::add0(&mut entry[ss % 2], a); - } - - fn combine>(&mut self, ss: usize, a: &A, i: usize) - where - A: StateType, - { - let current = self - .current_mut() - .as_mut_any() - .downcast_mut::>() - .unwrap(); - let zero = current.zero.clone(); - let entry = current - .map - .entry(i as u64) - .or_insert_with(|| [zero.clone(), zero.clone()]); - ACC::combine(&mut entry[ss % 2], a); - } - - fn merge>(&mut self, other: &Self, ss: usize) - where - A: StateType, - { - other.iter::(ss).for_each(|(i, a)| { - self.combine::(ss, a, i); - }); - } - - fn finalize, G: GraphViewInternalOps>( - &self, - ss: usize, - _shard_id: usize, - _g: &G, - ) -> HashMap - where - OUT: StateType, - A: 'static, - { - let current = self - .current() - .as_any() - .downcast_ref::>() - .unwrap(); - current - .map - .iter() - .map(|(c, v)| { - // println!("c? = {}", c); - ( - _g.vertex_name(_g.localise_vertex_unchecked((*c).into())), - ACC::finish(&v[ss % 2]), - ) - }) - .collect() - } - - fn fold, F, B>(&self, ss: usize, b: B, f: F) -> B - where - F: FnOnce(B, &u64, OUT) -> B + Copy, - A: 'static, - B: std::fmt::Debug, - OUT: StateType, - { - let current = self - .current() - .as_any() - .downcast_ref::>() - .unwrap(); - current - .map - .iter() - .map(|(k, v)| (k, ACC::finish(&v[ss % 2]))) - .fold(b, |b, (k, out)| f(b, k, out)) - } -} - #[derive(Debug)] pub struct ComputeStateVec(Box); @@ -306,24 +118,20 @@ impl ComputeState for ComputeStateVec { vec.current(ss).get(i) } - fn iter(&self, ss: usize) -> Box + '_> { + fn iter(&self, ss: usize, extend_to: usize) -> Box + '_> { let vec = self .current() .as_any() .downcast_ref::>() .unwrap(); - let iter = vec.current(ss).iter().enumerate(); + let zero = vec.zero(); + let inner_vec = vec.current(ss); + let vec_len = inner_vec.len(); + let extend_iter = std::iter::repeat(zero).take(extend_to - vec_len); + let iter = inner_vec.iter().chain(extend_iter); Box::new(iter) } - fn 
iter_keys(&self) -> Box + '_> { - todo!() - } - - fn iter_keys_changed(&self, _ss: usize) -> Box + '_> { - todo!() - } - fn agg>(&mut self, ss: usize, a: IN, ki: usize) where A: StateType, @@ -381,10 +189,9 @@ impl ComputeState for ComputeStateVec { merge_2_vecs(v, v_other, |a, b| ACC::combine(a, b)); } - fn finalize, G: GraphViewInternalOps>( + fn finalize, G: GraphViewOps>( &self, ss: usize, - shard_id: usize, g: &G, ) -> HashMap where @@ -402,10 +209,8 @@ impl ComputeState for ComputeStateVec { .iter() .enumerate() .map(|(p_id, a)| { - let v_ref = LocalVertexRef::new(p_id, shard_id); - let out = ACC::finish(a); - (g.vertex_name(v_ref), out) + (g.vertex_name(p_id.into()), out) }) .collect() } diff --git a/raphtory/src/core/state/container.rs b/raphtory/src/core/state/container.rs index 8fdb52e769..956bea9f27 100644 --- a/raphtory/src/core/state/container.rs +++ b/raphtory/src/core/state/container.rs @@ -1,8 +1,5 @@ -use std::any::Any; - -use rustc_hash::FxHashMap; - use super::StateType; +use std::any::Any; pub trait DynArray: std::fmt::Debug + Send + Sync { fn as_any(&self) -> &dyn Any; @@ -12,14 +9,6 @@ pub trait DynArray: std::fmt::Debug + Send + Sync { // used for map array fn copy_over(&mut self, ss: usize); fn reset(&mut self, ss: usize); - fn iter_keys(&self) -> Box + '_>; - fn iter_keys_changed(&self, ss: usize) -> Box + '_>; -} - -#[derive(Debug, Clone, PartialEq)] -pub(crate) struct MapArray { - pub(crate) map: FxHashMap, - pub(crate) zero: T, } #[derive(Debug, Clone, PartialEq)] @@ -62,12 +51,8 @@ impl VecArray { } } - fn previous(&self, ss: usize) -> &Vec { - if ss % 2 == 0 { - &self.odd - } else { - &self.even - } + pub(crate) fn zero(&self) -> &T { + &self.zero } } @@ -129,65 +114,4 @@ impl DynArray for VecArray { *v = zero.clone(); } } - - fn iter_keys(&self) -> Box + '_> { - todo!() - } - - fn iter_keys_changed(&self, _ss: usize) -> Box + '_> { - todo!() - } -} - -impl DynArray for MapArray -where - T: StateType, -{ - fn as_any(&self) -> &dyn Any 
{ - self - } - - fn as_mut_any(&mut self) -> &mut dyn Any { - self - } - - fn clone_array(&self) -> Box { - Box::new(self.clone()) - } - - fn copy_from(&mut self, other: &dyn DynArray) { - let other = other.as_any().downcast_ref::>().unwrap(); - self.map = other.map.clone(); - } - - fn copy_over(&mut self, ss: usize) { - for val in self.map.values_mut() { - let i = ss % 2; - let j = (ss + 1) % 2; - val[j] = val[i].clone(); - } - } - - fn iter_keys(&self) -> Box + '_> { - Box::new(self.map.keys().copied()) - } - - fn iter_keys_changed(&self, ss: usize) -> Box + '_> { - Box::new(self.map.iter().filter_map(move |(k, v)| { - let i = ss % 2; - let j = (ss + 1) % 2; - if v[i] != v[j] { - Some(*k) - } else { - None - } - })) - } - - fn reset(&mut self, ss: usize) { - for val in self.map.values_mut() { - let i = (ss + 1) % 2; - val[i] = self.zero.clone(); - } - } } diff --git a/raphtory/src/core/state/mod.rs b/raphtory/src/core/state/mod.rs index 2059d4728f..c6d2cf227a 100644 --- a/raphtory/src/core/state/mod.rs +++ b/raphtory/src/core/state/mod.rs @@ -1,7 +1,8 @@ pub mod accumulator_id; +pub mod agg; pub mod compute_state; pub mod container; -pub mod shard_state; +pub mod morcel_state; pub mod shuffle_state; pub trait StateType: PartialEq + Clone + std::fmt::Debug + Send + Sync + 'static {} @@ -15,13 +16,11 @@ mod state_test { use crate::{ core::state::{ - accumulator_id::accumulators, - compute_state::{ComputeStateMap, ComputeStateVec}, - container::merge_2_vecs, - shard_state::ShardComputeState, - shuffle_state::ShuffleComputeState, + accumulator_id::accumulators, compute_state::ComputeStateVec, container::merge_2_vecs, + morcel_state::MorcelComputeState, shuffle_state::ShuffleComputeState, }, - db::graph::Graph, + db::{api::mutation::AdditionOps, graph::graph::Graph}, + prelude::NO_PROPS, }; #[quickcheck] @@ -43,22 +42,22 @@ mod state_test { } } - fn tiny_graph(n_shards: usize) -> Graph { - let g = Graph::new(n_shards); + fn tiny_graph() -> Graph { + let g = 
Graph::new(); - g.add_vertex(1, 1, &vec![]).unwrap(); - g.add_vertex(1, 2, &vec![]).unwrap(); - g.add_vertex(1, 3, &vec![]).unwrap(); + g.add_vertex(1, 1, NO_PROPS).unwrap(); + g.add_vertex(1, 2, NO_PROPS).unwrap(); + g.add_vertex(1, 3, NO_PROPS).unwrap(); g } #[test] fn min_aggregates_for_3_keys() { - let g = tiny_graph(1); + let g = tiny_graph(); let min = accumulators::min(0); - let mut state_map: ShardComputeState = ShardComputeState::new(); + let mut state_map: MorcelComputeState = MorcelComputeState::new(3); // create random vec of numbers let mut rng = rand::thread_rng(); @@ -76,25 +75,25 @@ mod state_test { state_map.accumulate_into(0, 2, a, &min); } - let mut actual = state_map.finalize(0, &min, 0, &g).into_iter().collect_vec(); + let mut actual = state_map.finalize(0, &min, &g).into_iter().collect_vec(); actual.sort(); assert_eq!( actual, vec![ ("1".to_string(), actual_min), ("2".to_string(), actual_min), - ("3".to_string(), actual_min) + ("3".to_string(), actual_min), ] ); } #[test] fn avg_aggregates_for_3_keys() { - let g = tiny_graph(1); + let g = tiny_graph(); let avg = accumulators::avg(0); - let mut state_map: ShardComputeState = ShardComputeState::new(); + let mut state_map: MorcelComputeState = MorcelComputeState::new(3); // create random vec of numbers let mut rng = rand::thread_rng(); @@ -107,31 +106,31 @@ mod state_test { } for a in vec { + state_map.accumulate_into(0, 0, a, &avg); state_map.accumulate_into(0, 1, a, &avg); state_map.accumulate_into(0, 2, a, &avg); - state_map.accumulate_into(0, 3, a, &avg); } let actual_avg = sum / 100; - let mut actual = state_map.finalize(0, &avg, 0, &g).into_iter().collect_vec(); + let mut actual = state_map.finalize(0, &avg, &g).into_iter().collect_vec(); actual.sort(); assert_eq!( actual, vec![ ("1".to_string(), actual_avg), ("2".to_string(), actual_avg), - ("3".to_string(), actual_avg) + ("3".to_string(), actual_avg), ] ); } #[test] fn top3_aggregates_for_3_keys() { - let g = tiny_graph(1); + let g = 
tiny_graph(); let top3 = accumulators::topk::(0); - let mut state_map: ShardComputeState = ShardComputeState::new(); + let mut state_map: MorcelComputeState = MorcelComputeState::new(3); for a in 0..100 { state_map.accumulate_into(0, 0, a, &top3); @@ -140,10 +139,7 @@ mod state_test { } let expected = vec![99, 98, 97]; - let mut actual = state_map - .finalize(0, &top3, 0, &g) - .into_iter() - .collect_vec(); + let mut actual = state_map.finalize(0, &top3, &g).into_iter().collect_vec(); actual.sort(); @@ -152,18 +148,18 @@ mod state_test { vec![ ("1".to_string(), expected.clone()), ("2".to_string(), expected.clone()), - ("3".to_string(), expected.clone()) + ("3".to_string(), expected.clone()), ] ); } #[test] fn sum_aggregates_for_3_keys() { - let g = tiny_graph(2); + let g = tiny_graph(); let sum = accumulators::sum(0); - let mut state: ShardComputeState = ShardComputeState::new(); + let mut state: MorcelComputeState = MorcelComputeState::new(3); // create random vec of numbers let mut rng = rand::thread_rng(); @@ -176,31 +172,31 @@ mod state_test { } for a in vec { + state.accumulate_into(0, 0, a, &sum); state.accumulate_into(0, 1, a, &sum); state.accumulate_into(0, 2, a, &sum); - state.accumulate_into(0, 3, a, &sum); } - let mut actual = state.finalize(0, &sum, 0, &g).into_iter().collect_vec(); + let mut actual = state.finalize(0, &sum, &g).into_iter().collect_vec(); actual.sort(); assert_eq!( actual, vec![ ("1".to_string(), actual_sum), ("2".to_string(), actual_sum), - ("3".to_string(), actual_sum) + ("3".to_string(), actual_sum), ] ); } #[test] fn sum_aggregates_for_3_keys_2_parts() { - let g = tiny_graph(2); - let sum = accumulators::sum(0); - let mut part1_state: ShuffleComputeState = ShuffleComputeState::new(2); - let mut part2_state: ShuffleComputeState = ShuffleComputeState::new(2); + let mut part1_state: ShuffleComputeState = + ShuffleComputeState::new(3, 2, 2); + let mut part2_state: ShuffleComputeState = + ShuffleComputeState::new(3, 2, 2); // create 
random vec of numbers let mut rng = rand::thread_rng(); @@ -208,7 +204,7 @@ mod state_test { let mut vec2 = vec![]; let mut actual_sum_1 = 0; let mut actual_sum_2 = 0; - for _ in 0..100 { + for _ in 0..3 { // data for first partition let i = rng.gen_range(0..100); actual_sum_1 += i; @@ -224,75 +220,48 @@ mod state_test { // 2 gets the numbers from part1 // 3 gets the numbers from part2 for a in vec1 { + part1_state.accumulate_into(0, 0, a, &sum); part1_state.accumulate_into(0, 1, a, &sum); - part1_state.accumulate_into(0, 2, a, &sum); } for a in vec2 { - part2_state.accumulate_into(0, 1, a, &sum); - part2_state.accumulate_into(0, 3, a, &sum); + part2_state.accumulate_into(0, 0, a, &sum); + part2_state.accumulate_into(0, 2, a, &sum); } - println!("part1_state: {:?}", part1_state); - println!("part2_state: {:?}", part2_state); - - let mut actual: Vec<(String, i32)> = part1_state - .finalize(&sum, 0, &g, |c| c) - .into_iter() - .collect_vec(); - - actual.sort(); - - assert_eq!( - actual, - vec![ - ("1".to_string(), actual_sum_1), - ("2".to_string(), actual_sum_1), - ] - ); + let actual = part1_state.iter_out(0, sum).collect_vec(); - let mut actual = part2_state - .finalize(&sum, 0, &g, |c| c) - .into_iter() - .collect_vec(); + assert_eq!(actual, vec![(0, actual_sum_1), (1, actual_sum_1), (2, 0)]); - actual.sort(); + let actual = part2_state.iter_out(0, sum).collect_vec(); - assert_eq!( - actual, - vec![ - ("1".to_string(), actual_sum_2), - ("3".to_string(), actual_sum_2) - ] - ); + assert_eq!(actual, vec![(0, actual_sum_2), (1, 0), (2, actual_sum_2)]); - ShuffleComputeState::merge_mut(&mut part1_state, &part2_state, &sum, 0); - let mut actual = part1_state - .finalize(&sum, 0, &g, |c| c) - .into_iter() - .collect_vec(); + ShuffleComputeState::merge_mut(&mut part1_state, &part2_state, sum, 0); - actual.sort(); + let actual = part1_state.iter_out(0, sum).collect_vec(); assert_eq!( actual, vec![ - ("1".to_string(), (actual_sum_1 + actual_sum_2)), - ("2".to_string(), 
actual_sum_1), - ("3".to_string(), actual_sum_2) + (0, (actual_sum_1 + actual_sum_2)), + (1, actual_sum_1), + (2, actual_sum_2), ] ); } #[test] fn min_sum_aggregates_for_3_keys_2_parts() { - let g = tiny_graph(2); + let g = tiny_graph(); let sum = accumulators::sum(0); let min = accumulators::min(1); - let mut part1_state: ShuffleComputeState = ShuffleComputeState::new(2); - let mut part2_state: ShuffleComputeState = ShuffleComputeState::new(2); + let mut part1_state: ShuffleComputeState = + ShuffleComputeState::new(3, 2, 2); + let mut part2_state: ShuffleComputeState = + ShuffleComputeState::new(3, 2, 2); // create random vec of numbers let mut rng = rand::thread_rng(); @@ -320,20 +289,21 @@ mod state_test { // 2 gets the numbers from part1 // 3 gets the numbers from part2 for a in vec1 { + part1_state.accumulate_into(0, 0, a, &sum); part1_state.accumulate_into(0, 1, a, &sum); - part1_state.accumulate_into(0, 2, a, &sum); + part1_state.accumulate_into(0, 0, a, &min); part1_state.accumulate_into(0, 1, a, &min); - part1_state.accumulate_into(0, 2, a, &min); } for a in vec2 { - part2_state.accumulate_into(0, 1, a, &sum); - part2_state.accumulate_into(0, 3, a, &sum); - part2_state.accumulate_into(0, 1, a, &min); - part2_state.accumulate_into(0, 3, a, &min); + part2_state.accumulate_into(0, 0, a, &sum); + part2_state.accumulate_into(0, 2, a, &sum); + part2_state.accumulate_into(0, 0, a, &min); + part2_state.accumulate_into(0, 2, a, &min); } let mut actual = part1_state + .clone() .finalize(&sum, 0, &g, |c| c) .into_iter() .collect_vec(); @@ -345,10 +315,12 @@ mod state_test { vec![ ("1".to_string(), actual_sum_1), ("2".to_string(), actual_sum_1), + ("3".to_string(), 0), ] ); let mut actual = part1_state + .clone() .finalize(&min, 0, &g, |c| c) .into_iter() .collect_vec(); @@ -360,10 +332,12 @@ mod state_test { vec![ ("1".to_string(), actual_min_1), ("2".to_string(), actual_min_1), + ("3".to_string(), i32::MAX), ] ); let mut actual = part2_state + .clone() 
.finalize(&sum, 0, &g, |c| c) .into_iter() .collect_vec(); @@ -374,11 +348,13 @@ mod state_test { actual, vec![ ("1".to_string(), actual_sum_2), - ("3".to_string(), actual_sum_2) + ("2".to_string(), 0), + ("3".to_string(), actual_sum_2), ] ); let mut actual = part2_state + .clone() .finalize(&min, 0, &g, |c| c) .into_iter() .collect_vec(); @@ -389,12 +365,14 @@ mod state_test { actual, vec![ ("1".to_string(), actual_min_2), - ("3".to_string(), actual_min_2) + ("2".to_string(), i32::MAX), + ("3".to_string(), actual_min_2), ] ); - ShuffleComputeState::merge_mut(&mut part1_state, &part2_state, &sum, 0); + ShuffleComputeState::merge_mut(&mut part1_state, &part2_state, sum, 0); let mut actual = part1_state + .clone() .finalize(&sum, 0, &g, |c| c) .into_iter() .collect_vec(); @@ -406,12 +384,13 @@ mod state_test { vec![ ("1".to_string(), (actual_sum_1 + actual_sum_2)), ("2".to_string(), actual_sum_1), - ("3".to_string(), actual_sum_2) + ("3".to_string(), actual_sum_2), ] ); - ShuffleComputeState::merge_mut(&mut part1_state, &part2_state, &min, 0); + ShuffleComputeState::merge_mut(&mut part1_state, &part2_state, min, 0); let mut actual = part1_state + .clone() .finalize(&min, 0, &g, |c| c) .into_iter() .collect_vec(); @@ -423,7 +402,7 @@ mod state_test { vec![ ("1".to_string(), actual_min_1.min(actual_min_2)), ("2".to_string(), actual_min_1), - ("3".to_string(), actual_min_2) + ("3".to_string(), actual_min_2), ] ); } diff --git a/raphtory/src/core/state/shard_state.rs b/raphtory/src/core/state/morcel_state.rs similarity index 81% rename from raphtory/src/core/state/shard_state.rs rename to raphtory/src/core/state/morcel_state.rs index 4e15ab2ff3..bbb919b3ff 100644 --- a/raphtory/src/core/state/shard_state.rs +++ b/raphtory/src/core/state/morcel_state.rs @@ -1,16 +1,17 @@ use super::{accumulator_id::AccId, compute_state::ComputeState, StateType}; -use crate::{core::agg::Accumulator, db::view_api::internal::GraphViewInternalOps}; +use crate::{core::state::agg::Accumulator, 
db::api::view::GraphViewOps}; use rustc_hash::FxHashMap; use std::collections::HashMap; pub const GLOBAL_STATE_KEY: usize = 0; #[derive(Debug, Clone)] -pub struct ShardComputeState { +pub struct MorcelComputeState { + morcel_size: usize, pub(crate) states: FxHashMap, } -impl ShardComputeState { +impl MorcelComputeState { pub(crate) fn copy_over_next_ss(&mut self, ss: usize) { for (_, state) in self.states.iter_mut() { state.clone_current_into_other(ss); @@ -25,31 +26,10 @@ impl ShardComputeState { } } - pub(crate) fn fold, F, B>( + pub fn read_vec, G: GraphViewOps>( &self, ss: usize, - b: B, agg_ref: &AccId, - f: F, - ) -> B - where - F: FnOnce(B, &u64, OUT) -> B + Copy, - A: 'static, - B: std::fmt::Debug, - OUT: StateType, - { - if let Some(state) = self.states.get(&agg_ref.id()) { - state.fold::(ss, b, f) - } else { - b - } - } - - pub fn read_vec, G: GraphViewInternalOps>( - &self, - ss: usize, - agg_ref: &AccId, - shard_id: usize, g: &G, ) -> Option> where @@ -57,7 +37,7 @@ impl ShardComputeState { A: 'static, { let cs = self.states.get(&agg_ref.id())?; - Some(cs.finalize::(ss, shard_id, g)) + Some(cs.finalize::(ss, g)) } pub(crate) fn set_from_other>( @@ -131,8 +111,9 @@ impl ShardComputeState { state.read_ref::(ss, i) } - pub(crate) fn new() -> Self { - ShardComputeState { + pub(crate) fn new(morcel_size: usize) -> Self { + MorcelComputeState { + morcel_size, states: FxHashMap::default(), } } @@ -152,14 +133,28 @@ impl ShardComputeState { .or_insert_with(|| CS::new_mutable_primitive(ACC::zero())); state.agg::(ss, a, key); } + + pub(crate) fn iter>( + &self, + ss: usize, + agg_ref: &AccId, + ) -> Box> + '_> + where + A: StateType, + { + if let Some(state) = self.states.get(&agg_ref.id()) { + Box::new(state.iter(ss, self.morcel_size).map(|v| Some(v))) + } else { + Box::new(std::iter::repeat(None).take(self.morcel_size)) + } + } } -impl ShardComputeState { - pub fn finalize, G: GraphViewInternalOps>( +impl MorcelComputeState { + pub fn finalize, G: 
GraphViewOps>( &self, ss: usize, agg_ref: &AccId, - shard_id: usize, g: &G, ) -> HashMap where @@ -168,7 +163,7 @@ impl ShardComputeState { { self.states .get(&agg_ref.id()) - .map(|s| s.finalize::(ss, shard_id, g)) + .map(|s| s.finalize::(ss, g)) .unwrap_or(HashMap::::default()) } } diff --git a/raphtory/src/core/state/shuffle_state.rs b/raphtory/src/core/state/shuffle_state.rs index 4a8e4f68ff..f4e87238a9 100644 --- a/raphtory/src/core/state/shuffle_state.rs +++ b/raphtory/src/core/state/shuffle_state.rs @@ -1,87 +1,34 @@ -use crate::db::task::task_state::{Global, Shard}; -use crate::db::view_api::GraphViewOps; -use crate::{ - core::{agg::Accumulator, utils::get_shard_id_from_global_vid}, - db::view_api::internal::GraphViewInternalOps, -}; -use std::borrow::Borrow; -use std::collections::HashMap; -use std::sync::Arc; - use super::{ accumulator_id::AccId, compute_state::ComputeState, - shard_state::{ShardComputeState, GLOBAL_STATE_KEY}, + morcel_state::{MorcelComputeState, GLOBAL_STATE_KEY}, StateType, }; +use crate::{ + core::state::agg::Accumulator, + db::{ + api::view::GraphViewOps, + task::task_state::{Global, Shard}, + }, +}; +use std::{borrow::Borrow, collections::HashMap, sync::Arc}; #[derive(Debug, Clone)] pub struct ShuffleComputeState { - pub global: ShardComputeState, - pub parts: Vec>, + morcel_size: usize, + pub global: MorcelComputeState, + pub parts: Vec>, } // every partition has a struct as such impl ShuffleComputeState { - pub fn fold_state, B, F>( - &self, - ss: usize, - b: B, - agg_ref: &AccId, - f: F, - ) -> B - where - A: StateType, - B: std::fmt::Debug, - OUT: StateType, - F: Fn(B, &u64, OUT) -> B + Copy, - { - let out_b = self - .parts - .iter() - .fold(b, |b, part| part.fold(ss, b, agg_ref, f)); - out_b - } - - pub fn fold_state_internal, B, F>( - &self, - ss: usize, - b: B, - agg_ref: &AccId, - f: F, - ) -> B - where - A: StateType, - B: std::fmt::Debug, - OUT: StateType, - F: Fn(B, usize, usize, OUT) -> B + Copy, - { - let out_b = 
self.parts.iter().enumerate().fold(b, |b, (part_id, part)| { - part.fold(ss, b, agg_ref, |b, id, out| { - f(b, part_id, *id as usize, out) - }) - }); - out_b + fn resolve_pid(&self, p_id: usize) -> (usize, usize) { + let morcel_id = p_id / self.morcel_size; + let offset = p_id % self.morcel_size; + (morcel_id, offset) } pub fn merge_mut>( - &mut self, - other: &Self, - agg_ref: &AccId, - ss: usize, - ) where - A: StateType, - { - // zip the two partitions - // merge each shard - assert_eq!(self.parts.len(), other.parts.len()); - self.parts - .iter_mut() - .zip(other.parts.iter()) - .for_each(|(s, o)| s.merge(o, agg_ref, ss)); - } - - pub fn merge_mut_2>( &mut self, other: &Self, agg_ref: AccId, @@ -147,61 +94,50 @@ impl ShuffleComputeState { self.global.reset_states(ss, states); } - pub fn new(n_parts: usize) -> Self { - Self { - parts: (0..n_parts) - .into_iter() - .map(|_| ShardComputeState::new()) - .collect(), - global: ShardComputeState::new(), + pub fn new(total_len: usize, n_parts: usize, morcel_size: usize) -> Self { + let last_one_size = total_len % morcel_size; + let mut parts: Vec> = (0..n_parts - 1) + .into_iter() + .map(|_| MorcelComputeState::new(morcel_size)) + .collect(); + + if last_one_size != 0 { + parts.push(MorcelComputeState::new(last_one_size)); + } else { + parts.push(MorcelComputeState::new(morcel_size)); } - } - pub fn keys(&self, part_num: usize) -> impl Iterator + '_ { - self.parts[part_num] - .states - .iter() - .flat_map(|(_, cs)| cs.iter_keys()) + Self { + morcel_size, + parts, + global: MorcelComputeState::new(1), + } } - pub fn changed_keys(&self, part_num: usize, ss: usize) -> impl Iterator + '_ { - self.parts[part_num] - .states - .iter() - .flat_map(move |(_, cs)| cs.iter_keys_changed(ss)) + pub fn global() -> Self { + Self { + morcel_size: 1, + parts: vec![], + global: MorcelComputeState::new(1), + } } pub fn accumulate_into>( &mut self, ss: usize, - into: usize, - a: IN, - agg_ref: &AccId, - ) where - A: StateType, - { - let 
part = get_shard_id_from_global_vid(into as u64, self.parts.len()); - self.parts[part].accumulate_into(ss, into, a, agg_ref) - } - - pub fn accumulate_into_pid>( - &mut self, - ss: usize, - g_id: u64, p_id: usize, a: IN, agg_ref: &AccId, ) where A: StateType, { - let part = get_shard_id_from_global_vid(g_id, self.parts.len()); - self.parts[part].accumulate_into(ss, p_id, a, agg_ref) + let (morcel_id, offset) = self.resolve_pid(p_id); + self.parts[morcel_id].accumulate_into(ss, offset, a, agg_ref) } pub fn read_with_pid>( &self, ss: usize, - g_id: u64, p_id: usize, agg_ref: &AccId, ) -> Option @@ -209,8 +145,8 @@ impl ShuffleComputeState { A: StateType, OUT: std::fmt::Debug, { - let part = get_shard_id_from_global_vid(g_id, self.parts.len()); - self.parts[part].read::(p_id, agg_ref.id(), ss) + let (morcel_id, offset) = self.resolve_pid(p_id); + self.parts[morcel_id].read::(offset, agg_ref.id(), ss) } pub fn accumulate_global>( @@ -224,46 +160,32 @@ impl ShuffleComputeState { self.global .accumulate_into(ss, GLOBAL_STATE_KEY, a, agg_ref) } - // reads the value from K if it's set we return Ok(a) else we return Err(zero) from the monoid + pub fn read>( &self, ss: usize, - into: usize, + p_id: usize, agg_ref: &AccId, ) -> Option where A: StateType, OUT: std::fmt::Debug, { - let part = get_shard_id_from_global_vid(into as u64, self.parts.len()); - self.parts[part].read::(into, agg_ref.id(), ss) + let (morcel_id, offset) = self.resolve_pid(p_id); + self.parts[morcel_id].read::(offset, agg_ref.id(), ss) } pub fn read_ref>( &self, ss: usize, - into: usize, - agg_ref: &AccId, - ) -> Option<&A> - where - A: StateType, - { - let part = get_shard_id_from_global_vid(into as u64, self.parts.len()); - self.parts[part].read_ref::(into, agg_ref.id(), ss) - } - - pub fn read_ref_with_pid>( - &self, - ss: usize, - g_id: u64, p_id: usize, agg_ref: &AccId, ) -> Option<&A> where A: StateType, { - let part = get_shard_id_from_global_vid(g_id, self.parts.len()); - 
self.parts[part].read_ref::(p_id, agg_ref.id(), ss) + let (morcel_id, offset) = self.resolve_pid(p_id); + self.parts[morcel_id].read_ref::(offset, agg_ref.id(), ss) } pub fn read_global>( @@ -279,25 +201,6 @@ impl ShuffleComputeState { .read::(GLOBAL_STATE_KEY, agg_ref.id(), ss) } - pub fn read_vec_partition, G: GraphViewInternalOps>( - &self, - ss: usize, - agg_def: &AccId, - g: &G, - ) -> Vec> - where - OUT: StateType, - A: 'static, - { - self.parts - .iter() - .enumerate() - .flat_map(|(shard_id, part)| part.read_vec(ss, agg_def, shard_id, g)) - .collect() - } -} - -impl ShuffleComputeState { pub fn finalize, G: GraphViewOps>( &self, agg_def: &AccId, @@ -307,34 +210,52 @@ impl ShuffleComputeState { ) -> HashMap where OUT: StateType, - A: 'static, + A: StateType, F: Fn(OUT) -> B + Copy, { - let r = self - .parts + self.iter(ss, *agg_def) + .map(|(v_id, a)| { + let out = a + .map(|a| ACC::finish(a)) + .unwrap_or_else(|| ACC::finish(&ACC::zero())); + (g.vertex_name(v_id.into()).to_string(), f(out)) + }) + .collect() + } + + pub fn iter<'a, A: StateType, IN: 'a, OUT: 'a, ACC: Accumulator>( + &'a self, + ss: usize, + acc_id: AccId, + ) -> impl Iterator)> + 'a { + self.parts .iter() + .flat_map(move |part| part.iter(ss, &acc_id)) .enumerate() - .map(|(shard_id, part)| part.finalize(ss, &agg_def, shard_id, g)); + } - r.into_iter() - .flat_map(|c| c.into_iter().map(|(k, v)| (k, f(v)))) - .collect() + pub fn iter_out<'a, A: StateType, IN: 'a, OUT: 'a, ACC: Accumulator>( + &'a self, + ss: usize, + acc_id: AccId, + ) -> impl Iterator + 'a { + self.iter(ss, acc_id).map(|(id, a)| { + let out = a + .map(|a| ACC::finish(a)) + .unwrap_or_else(|| ACC::finish(&ACC::zero())); + (id, out) + }) } } -pub struct EvalGlobalState { +pub struct EvalGlobalState { ss: usize, - g: G, pub(crate) global_state: Global, } -impl EvalGlobalState { - pub fn new(ss: usize, g: G, global_state: Global) -> EvalGlobalState { - Self { - ss, - g, - global_state, - } +impl EvalGlobalState { + pub fn 
new(ss: usize, global_state: Global) -> EvalGlobalState { + Self { ss, global_state } } pub fn finalize>( @@ -354,6 +275,7 @@ impl EvalGlobalState { } } +#[derive(Debug)] pub struct EvalShardState { ss: usize, g: G, @@ -370,22 +292,25 @@ impl EvalShardState { } pub fn finalize>( - &self, + self, agg_def: &AccId, f: F, ) -> HashMap where OUT: StateType, - A: 'static, + A: StateType, F: Fn(OUT) -> B + Copy, { - self.shard_states - .inner() - .finalize(agg_def, self.ss, &self.g, f) + let inner = self.shard_states.consume(); + if let Ok(inner) = inner { + inner.finalize(agg_def, self.ss, &self.g, f) + } else { + HashMap::new() + } } - pub fn values(self) -> Shard { - self.shard_states + pub fn values(&self) -> &Shard { + &self.shard_states } } @@ -409,19 +334,19 @@ impl EvalLocalState { } pub fn finalize>( - &self, + self, agg_def: &AccId, f: F, ) -> HashMap where OUT: StateType, - A: 'static, + A: StateType, F: Fn(OUT) -> B + Copy, { self.local_states - .iter() + .into_iter() .flat_map(|state| { - if let Some(state) = state.as_ref() { + if let Some(state) = Arc::try_unwrap(state).ok().flatten() { state.finalize(agg_def, self.ss, &self.g, f) } else { HashMap::::new() diff --git a/raphtory/src/core/storage/iter.rs b/raphtory/src/core/storage/iter.rs new file mode 100644 index 0000000000..46c748a5f8 --- /dev/null +++ b/raphtory/src/core/storage/iter.rs @@ -0,0 +1,108 @@ +use super::RawStorage; +use std::{ops::Deref, sync::Arc}; + +pub struct Iter<'a, T: Default, const N: usize> { + raw: &'a RawStorage, + segment: usize, + offset: usize, + current: Option>, +} + +// impl new for Iter +impl<'a, T: Default, const N: usize> Iter<'a, T, N> { + pub fn new(raw: &'a RawStorage) -> Self { + Iter { + raw, + segment: 0, + offset: 0, + current: None, + } + } +} + +type GuardIter<'a, T> = ( + Arc>>, + std::slice::Iter<'a, T>, +); + +pub struct RefT<'a, T, const N: usize> { + _guard: Arc>>, + t: &'a T, + i: usize, +} + +impl<'a, T, const N: usize> Clone for RefT<'_, T, N> { + fn 
clone(&self) -> Self { + RefT { + _guard: self._guard.clone(), + t: self.t, + i: self.i, + } + } +} + +impl<'a, T, const N: usize> Deref for RefT<'a, T, N> { + type Target = T; + + fn deref(&self) -> &Self::Target { + self.t + } +} + +// simple impl for RefT that returns &T in the value function +impl<'a, T, const N: usize> RefT<'a, T, N> { + pub fn value(&self) -> &T { + self.t + } + + pub fn index(&self) -> usize { + self.i + } +} + +/// # Safety +/// +/// Requires that you ensure the reference does not become invalid. +/// The object has to outlive the reference. +pub unsafe fn change_lifetime_const<'a, 'b, T>(x: &'a T) -> &'b T { + &*(x as *const T) +} + +impl<'a, T: std::fmt::Debug + Default, const N: usize> Iterator for Iter<'a, T, N> { + type Item = RefT<'a, T, N>; + + fn next(&mut self) -> Option { + loop { + if let Some((guard, iter)) = self.current.as_mut() { + if let Some(t) = iter.next() { + let guard = guard.clone(); + let next = Some(RefT { + _guard: guard, + i: (self.offset * N + (self.segment - 1)), + t, + }); + self.offset += 1; + return next; + } + } + + if self.segment >= N { + return None; + } + + // get the next segment + let guard = self.raw.data[self.segment].data.read(); + + // convince the rust compiler that the reference is valid + let raw = unsafe { change_lifetime_const(&*guard) }; + + // grab the iterator + let iter = raw.iter(); + + // set the current segment with the new iterator + self.current = Some((Arc::new(guard), iter)); + self.offset = 0; + self.segment += 1; + } + } +} diff --git a/raphtory/src/core/lazy_vec.rs b/raphtory/src/core/storage/lazy_vec.rs similarity index 70% rename from raphtory/src/core/lazy_vec.rs rename to raphtory/src/core/storage/lazy_vec.rs index 53c548ae80..c1d34765a6 100644 --- a/raphtory/src/core/lazy_vec.rs +++ b/raphtory/src/core/storage/lazy_vec.rs @@ -1,5 +1,6 @@ +use crate::core::utils::errors::GraphError; use serde::{Deserialize, Serialize}; -use std::fmt::Debug; +use std::{fmt::Debug, iter}; 
#[derive(thiserror::Error, Debug, PartialEq)] #[error("cannot set previous value '{previous_value:?}' to '{new_value:?}' in position '{index}'")] @@ -36,16 +37,17 @@ where LazyVec::LazyVec1(id, value) } - pub(crate) fn filled_ids(&self) -> Vec { + pub(crate) fn filled_ids(&self) -> Box + '_> { match self { - LazyVec::Empty => Default::default(), - LazyVec::LazyVec1(id, _) => vec![*id], - LazyVec::LazyVecN(vector) => vector - .iter() - .enumerate() - .filter(|&(_, value)| *value != Default::default()) - .map(|(id, _)| id) - .collect(), + LazyVec::Empty => Box::new(iter::empty()), + LazyVec::LazyVec1(id, _) => Box::new(iter::once(*id)), + LazyVec::LazyVecN(vector) => Box::new( + vector + .iter() + .enumerate() + .filter(|&(_, value)| *value != Default::default()) + .map(|(id, _)| id), + ), } } @@ -70,7 +72,9 @@ where return Err(IllegalSet::new(id, only_value.clone(), value)); } } else { - let mut vector = vec![Default::default(); usize::max(id, *only_id) + 1]; + let len = usize::max(id, *only_id) + 1; + let mut vector = Vec::with_capacity(len + 1); + vector.resize(len, Default::default()); vector[id] = value; vector[*only_id] = only_value.clone(); *self = LazyVec::LazyVecN(vector) @@ -99,22 +103,27 @@ where } } - pub(crate) fn update_or_set(&mut self, id: usize, updater: F, default: A) + pub(crate) fn update(&mut self, id: usize, updater: F) -> Result<(), GraphError> where - F: FnOnce(&mut A), + F: FnOnce(&mut A) -> Result<(), GraphError>, { match self.get_mut(id) { - Some(value) => updater(value), - None => self - .set(id, default) - .expect("Set failed over a non existing value"), - } + Some(value) => updater(value)?, + None => { + let mut value = A::default(); + updater(&mut value)?; + self.set(id, value) + .expect("Set failed over a non existing value") + } + }; + Ok(()) } } #[cfg(test)] mod lazy_vec_tests { use super::*; + use itertools::Itertools; #[test] fn normal_operation() { @@ -126,17 +135,14 @@ mod lazy_vec_tests { assert_eq!(vec.get(5), Some(&55)); 
assert_eq!(vec.get(1), Some(&11)); assert_eq!(vec.get(0), Some(&0)); - assert_eq!(vec.get(10), None); // FIXME: this should return the default, 0, as well, there is no need to return Option from get() + assert_eq!(vec.get(10), None); - // FIXME: replace update_or_set() with update() - // the behavior should be the same for both cases, because we should be able to assume that - // any cell is prefilled with default values and can therefore be safely updated - vec.update_or_set(6, |n| *n += 1, 66); + vec.update(6, |n| Ok(*n += 1)); assert_eq!(vec.get(6), Some(&1)); - vec.update_or_set(9, |n| *n += 1, 99); - assert_eq!(vec.get(9), Some(&99)); + vec.update(9, |n| Ok(*n += 1)); + assert_eq!(vec.get(9), Some(&1)); - assert_eq!(vec.filled_ids(), vec![1, 5, 6, 8, 9]); + assert_eq!(vec.filled_ids().collect_vec(), vec![1, 5, 6, 8, 9]); } #[test] diff --git a/raphtory/src/core/storage/locked_view.rs b/raphtory/src/core/storage/locked_view.rs new file mode 100644 index 0000000000..85ce71796a --- /dev/null +++ b/raphtory/src/core/storage/locked_view.rs @@ -0,0 +1,105 @@ +use dashmap::mapref::one::Ref; +use parking_lot::{MappedRwLockReadGuard, RwLockReadGuard}; +use rustc_hash::FxHasher; +use std::{ + borrow::Borrow, + cmp::Ordering, + fmt::{Debug, Formatter}, + hash::{BuildHasherDefault, Hash, Hasher}, + ops::Deref, +}; +use tantivy::directory::Lock; + +pub enum LockedView<'a, T> { + LockMapped(parking_lot::MappedRwLockReadGuard<'a, T>), + Locked(parking_lot::RwLockReadGuard<'a, T>), + DashMap(Ref<'a, usize, T, BuildHasherDefault>), +} + +impl<'a, T, O> AsRef for LockedView<'a, O> +where + T: ?Sized, + as Deref>::Target: AsRef, +{ + fn as_ref(&self) -> &T { + self.deref().as_ref() + } +} + +impl<'a, T> Borrow for LockedView<'a, T> { + fn borrow(&self) -> &T { + self.deref() + } +} + +impl<'a> From> for String { + fn from(value: LockedView<'a, String>) -> Self { + value.deref().clone() + } +} + +impl<'a, T: PartialEq, Rhs, LRhs: Deref> PartialEq for LockedView<'a, T> { + fn 
eq(&self, other: &LRhs) -> bool { + self.deref() == other.deref() + } +} + +impl<'a, T: Eq> Eq for LockedView<'a, T> {} + +impl<'a, T: PartialOrd, Rhs, LRhs: Deref> PartialOrd + for LockedView<'a, T> +{ + fn partial_cmp(&self, other: &LRhs) -> Option { + self.deref().partial_cmp(other.deref()) + } +} + +impl<'a, T: Ord> Ord for LockedView<'a, T> { + fn cmp(&self, other: &Self) -> Ordering { + self.deref().cmp(other.deref()) + } +} + +impl<'a, T: Hash> Hash for LockedView<'a, T> { + fn hash(&self, state: &mut H) { + self.deref().hash(state) + } +} + +impl<'a, T> From> for LockedView<'a, T> { + fn from(value: MappedRwLockReadGuard<'a, T>) -> Self { + Self::LockMapped(value) + } +} + +impl<'a, T> From> for LockedView<'a, T> { + fn from(value: RwLockReadGuard<'a, T>) -> Self { + Self::Locked(value) + } +} + +impl<'a, T> From>> + for LockedView<'a, T> +{ + fn from(value: Ref<'a, usize, T, BuildHasherDefault>) -> Self { + Self::DashMap(value) + } +} + +impl<'a, T> Deref for LockedView<'a, T> { + type Target = T; + + fn deref(&self) -> &Self::Target { + match self { + LockedView::LockMapped(guard) => guard.deref(), + LockedView::DashMap(r) => (*r).deref(), + LockedView::Locked(guard) => guard.deref(), + } + } +} + +impl<'a, T: Debug> Debug for LockedView<'a, T> { + fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result { + write!(f, "LockedView({:?})", self.deref()) + } +} diff --git a/raphtory/src/core/storage/mod.rs b/raphtory/src/core/storage/mod.rs new file mode 100644 index 0000000000..fc3c5a6d81 --- /dev/null +++ b/raphtory/src/core/storage/mod.rs @@ -0,0 +1,448 @@ +#![allow(unused)] + +pub(crate) mod iter; +pub mod lazy_vec; +pub mod locked_view; +pub mod sorted_vec_map; +pub mod timeindex; + +use self::iter::Iter; +use lock_api; +use locked_view::LockedView; +use parking_lot::{RwLock, RwLockReadGuard}; +use rayon::prelude::*; +use serde::{Deserialize, Serialize}; +use std::{ + array, + fmt::Debug, + iter::FusedIterator, + ops::{Deref, DerefMut}, + sync::{ + 
atomic::{AtomicUsize, Ordering}, + Arc, + }, +}; + +type ArcRwLockReadGuard = lock_api::ArcRwLockReadGuard; + +#[inline] +fn resolve(index: usize) -> (usize, usize) { + let bucket = index % N; + let offset = index / N; + (bucket, offset) +} + +#[derive(Debug, Serialize, Deserialize, Clone)] +pub struct LockVec { + data: Arc>>, +} + +impl PartialEq for LockVec { + fn eq(&self, other: &Self) -> bool { + let a = self.data.read(); + let b = other.data.read(); + a.deref() == b.deref() + } +} + +impl LockVec { + pub fn new() -> Self { + Self { + data: Arc::new(RwLock::new(Vec::new())), + } + } + + #[inline] + pub fn read_arc_lock(&self) -> ArcRwLockReadGuard> { + RwLock::read_arc(&self.data) + } +} + +#[derive(Serialize, Deserialize, Debug)] +pub struct RawStorage { + pub(crate) data: Box<[LockVec]>, + len: AtomicUsize, +} + +impl PartialEq for RawStorage { + fn eq(&self, other: &Self) -> bool { + self.data.eq(&other.data) + } +} + +#[derive(Debug)] +pub struct ReadLockedStorage { + locks: [ArcRwLockReadGuard>; N], + len: usize, +} + +impl ReadLockedStorage { + pub(crate) fn get(&self, index: usize) -> &T { + let (bucket, offset) = resolve::(index); + let bucket = &self.locks[bucket]; + &bucket[offset] + } + + pub(crate) fn iter(&self) -> impl Iterator + '_ { + self.locks.iter().flat_map(|v| v.iter()) + } + + pub(crate) fn par_iter(&self) -> impl ParallelIterator + '_ + where + T: Send + Sync, + { + self.locks.par_iter().flat_map(|v| v.par_iter()) + } + + pub(crate) fn into_iter(self) -> impl Iterator> + Send + where + T: Send + Sync + 'static, + { + self.locks + .into_iter() + .enumerate() + .flat_map(|(bucket, data)| { + let arc_data = Arc::new(data); + (0..arc_data.len()).map(move |offset| ArcEntry { + guard: arc_data.clone(), + i: offset, + }) + }) + } + + pub(crate) fn into_par_iter(self) -> impl ParallelIterator> + where + T: Send + Sync + 'static, + { + self.locks + .into_par_iter() + .enumerate() + .flat_map(|(bucket, data)| { + let arc_data = Arc::new(data); + 
(0..arc_data.len()) + .into_par_iter() + .map(move |offset| ArcEntry { + guard: arc_data.clone(), + i: offset, + }) + }) + } +} + +impl RawStorage { + pub fn count_with_filter bool + Send + Sync>(&self, f: F) -> usize { + self.read_lock().par_iter().filter(|x| f(x)).count() + } +} + +impl RawStorage { + #[inline] + pub fn read_lock(&self) -> ReadLockedStorage { + let guards: [ArcRwLockReadGuard>; N] = + array::from_fn(|i| self.data[i].read_arc_lock()); + ReadLockedStorage { + locks: guards, + len: self.len(), + } + } + + pub fn indices(&self) -> impl Iterator + Send + '_ { + 0..self.len() + } + + pub fn new() -> Self { + let data: [LockVec; N] = array::from_fn(|_| LockVec::new()); + let data = Box::new(data); + Self { + data, + len: AtomicUsize::new(0), + } + } + + pub fn push(&self, mut value: T, f: F) -> usize { + let index = self.len.fetch_add(1, Ordering::SeqCst); + let (bucket, offset) = resolve::(index); + let mut vec = self.data[bucket].data.write(); + if offset >= vec.len() { + vec.resize_with(offset + 1, || Default::default()); + } + f(index, &mut value); + vec[offset] = value; + index + } + + #[inline] + pub fn entry(&self, index: usize) -> Entry<'_, T, N> { + let (bucket, _) = resolve::(index); + let guard = self.data[bucket].data.read_recursive(); + Entry { + offset: index, + guard, + } + } + + #[inline] + pub fn get(&self, index: usize) -> impl Deref + '_ { + let (bucket, offset) = resolve::(index); + let guard = self.data[bucket].data.read_recursive(); + RwLockReadGuard::map(guard, |guard| &guard[offset]) + } + + pub fn entry_arc(&self, index: usize) -> ArcEntry { + let (bucket, offset) = resolve::(index); + let guard = &self.data[bucket].data; + let arc_guard = RwLock::read_arc_recursive(guard); + ArcEntry { + i: offset, + guard: Arc::new(arc_guard), + } + } + + pub fn entry_mut(&self, index: usize) -> EntryMut<'_, T> { + let (bucket, offset) = resolve::(index); + let guard = self.data[bucket].data.write(); + EntryMut { i: offset, guard } + } + + // 
This helps get the right locks when adding an edge + pub fn pair_entry_mut(&self, i: usize, j: usize) -> PairEntryMut<'_, T> { + let (bucket_i, offset_i) = resolve::(i); + let (bucket_j, offset_j) = resolve::(j); + // always acquire lock for smaller bucket first to avoid deadlock between two updates for the same pair of buckets + if bucket_i < bucket_j { + let guard_i = self.data[bucket_i].data.write(); + let guard_j = self.data[bucket_j].data.write(); + PairEntryMut::Different { + i: offset_i, + j: offset_j, + guard1: guard_i, + guard2: guard_j, + } + } else if bucket_i > bucket_j { + let guard_j = self.data[bucket_j].data.write(); + let guard_i = self.data[bucket_i].data.write(); + PairEntryMut::Different { + i: offset_i, + j: offset_j, + guard1: guard_i, + guard2: guard_j, + } + } else { + PairEntryMut::Same { + i: offset_i, + j: offset_j, + guard: self.data[bucket_i].data.write(), + } + } + } + + #[inline] + pub fn len(&self) -> usize { + self.len.load(Ordering::SeqCst) + } + + pub fn iter(&self) -> Iter { + Iter::new(self) + } +} + +#[derive(Debug)] +pub struct Entry<'a, T: 'static, const N: usize> { + offset: usize, + guard: RwLockReadGuard<'a, Vec>, +} + +impl<'a, T: 'static, const N: usize> Clone for Entry<'a, T, N> { + fn clone(&self) -> Self { + let guard = RwLockReadGuard::rwlock(&self.guard).read_recursive(); + let i = self.offset; + Self { offset: i, guard } + } +} + +#[derive(Debug)] +pub struct ArcEntry { + guard: Arc>>, + i: usize, +} + +impl Clone for ArcEntry { + fn clone(&self) -> Self { + Self { + guard: self.guard.clone(), + i: self.i, + } + } +} + +impl Deref for ArcEntry { + type Target = T; + + fn deref(&self) -> &Self::Target { + &self.guard[self.i] + } +} + +impl<'a, T, const N: usize> Entry<'a, T, N> { + pub fn value(&self) -> &T { + let (_, offset) = resolve::(self.offset); + &self.guard[offset] + } + + pub fn index(&self) -> usize { + self.offset + } + + pub fn map &U>(self, f: F) -> LockedView<'a, U> { + let (_, offset) = 
resolve::(self.offset); + let mapped_guard = RwLockReadGuard::map(self.guard, |guard| { + let what = &guard[offset]; + f(what) + }); + + LockedView::LockMapped(mapped_guard) + } +} + +impl<'a, T, const N: usize> Deref for Entry<'a, T, N> { + type Target = T; + + fn deref(&self) -> &Self::Target { + let (_, offset) = resolve::(self.offset); + &self.guard[offset] + } +} + +pub enum PairEntryMut<'a, T: 'static> { + Same { + i: usize, + j: usize, + guard: parking_lot::RwLockWriteGuard<'a, Vec>, + }, + Different { + i: usize, + j: usize, + guard1: parking_lot::RwLockWriteGuard<'a, Vec>, + guard2: parking_lot::RwLockWriteGuard<'a, Vec>, + }, +} + +impl<'a, T: 'static> PairEntryMut<'a, T> { + pub(crate) fn get_mut_i(&mut self) -> &mut T { + match self { + PairEntryMut::Same { i, guard, .. } => &mut guard[*i], + PairEntryMut::Different { i, guard1, .. } => &mut guard1[*i], + } + } + + pub(crate) fn get_mut_j(&mut self) -> &mut T { + match self { + PairEntryMut::Same { j, guard, .. } => &mut guard[*j], + PairEntryMut::Different { j, guard2, .. 
} => &mut guard2[*j], + } + } +} + +pub struct EntryMut<'a, T: 'static> { + i: usize, + guard: parking_lot::RwLockWriteGuard<'a, Vec>, +} + +impl<'a, T> Deref for EntryMut<'a, T> { + type Target = T; + + fn deref(&self) -> &Self::Target { + &self.guard[self.i] + } +} + +impl<'a, T> DerefMut for EntryMut<'a, T> { + fn deref_mut(&mut self) -> &mut Self::Target { + &mut self.guard[self.i] + } +} + +#[cfg(test)] +mod test { + use rayon::prelude::{IntoParallelIterator, ParallelIterator}; + + use super::RawStorage; + + #[test] + fn add_5_values_to_storage() { + let storage = RawStorage::::new(); + + for i in 0..5 { + storage.push(i.to_string(), |_, _| {}); + } + + assert_eq!(storage.len(), 5); + + for i in 0..5 { + let entry = storage.entry(i); + assert_eq!(*entry, i.to_string()); + } + + let items_iter = storage.iter(); + + let actual = items_iter.map(|s| (*s).to_owned()).collect::>(); + + assert_eq!(actual, vec!["0", "2", "4", "1", "3"]); + } + + #[test] + fn test_index_correctness() { + let storage = RawStorage::::new(); + + for i in 0..5 { + storage.push(i.to_string(), |_, _| {}); + } + + let items_iter = storage.iter(); + let actual = items_iter + .map(|s| (s.index(), (*s).to_owned())) + .collect::>(); + assert_eq!( + actual, + vec![(0, "0"), (2, "2"), (4, "4"), (1, "1"), (3, "3"),] + .into_iter() + .map(|(i, s)| (i, s.to_string())) + .collect::>() + ); + } + + #[test] + fn test_entry() { + let storage = RawStorage::::new(); + + for i in 0..5 { + storage.push(i.to_string(), |_, _| {}); + } + + for i in 0..5 { + let entry = storage.entry(i); + assert_eq!(*entry, i.to_string()); + } + } + + use pretty_assertions::assert_eq; + + #[quickcheck] + fn concurrent_push(v: Vec) -> bool { + let storage = RawStorage::::new(); + let mut expected = v + .into_par_iter() + .map(|v| { + storage.push(v, |_, _| {}); + v + }) + .collect::>(); + + let mut actual = storage.iter().map(|s| *s).collect::>(); + + actual.sort(); + expected.sort(); + + actual == expected + } +} diff --git 
a/raphtory/src/core/sorted_vec_map.rs b/raphtory/src/core/storage/sorted_vec_map.rs similarity index 83% rename from raphtory/src/core/sorted_vec_map.rs rename to raphtory/src/core/storage/sorted_vec_map.rs index 2f695bf5c4..c12e04c743 100644 --- a/raphtory/src/core/sorted_vec_map.rs +++ b/raphtory/src/core/storage/sorted_vec_map.rs @@ -1,17 +1,30 @@ -use std::ops::Range; - use serde::{ser::SerializeSeq, Deserialize, Serialize}; -use sorted_vector_map::{map::Entry, SortedVectorMap}; +use sorted_vector_map::SortedVectorMap; +use std::{borrow::Borrow, ops::Range}; // wrapper for SortedVectorMap -#[derive(Debug, PartialEq, Default, Clone)] +#[derive(Debug, PartialEq, Clone)] pub struct SVM(SortedVectorMap); +impl Default for SVM { + fn default() -> Self { + Self::new() + } +} + impl SVM { pub(crate) fn new() -> Self { Self(SortedVectorMap::new()) } + pub(crate) fn get(&self, k: &Q) -> Option<&V> + where + K: Borrow, + Q: Ord + ?Sized, + { + self.0.get(k) + } + pub(crate) fn insert(&mut self, k: K, v: V) -> Option { self.0.insert(k, v) } @@ -31,10 +44,6 @@ impl SVM { pub(crate) fn from_iter>(iter: I) -> Self { Self(SortedVectorMap::from_iter(iter)) } - - pub(crate) fn entry(&mut self, k: K) -> Entry { - self.0.entry(k) - } } impl IntoIterator for SVM diff --git a/raphtory/src/core/storage/timeindex.rs b/raphtory/src/core/storage/timeindex.rs new file mode 100644 index 0000000000..801f937747 --- /dev/null +++ b/raphtory/src/core/storage/timeindex.rs @@ -0,0 +1,480 @@ +use crate::{ + core::{entities::LayerIds, utils::time::error::ParseTimeError}, + db::api::mutation::{internal::InternalAdditionOps, InputTime, TryIntoInputTime}, +}; +use itertools::{Itertools, KMerge}; +use num_traits::Saturating; +use serde::{Deserialize, Serialize}; +use std::{ + cmp::{max, min}, + collections::BTreeSet, + fmt::Debug, + marker::PhantomData, + ops::{Deref, Range}, + sync::Arc, +}; +use tantivy::time::Time; + +use super::locked_view::LockedView; + +#[derive(Debug, Copy, Clone, Serialize, 
Deserialize, PartialEq, Ord, PartialOrd, Eq)] +pub struct TimeIndexEntry(i64, usize); + +pub trait AsTime: Debug + Copy + Ord + Eq + Send + Sync { + fn t(&self) -> &i64; + fn range(w: Range) -> Range; +} + +impl From for TimeIndexEntry { + fn from(value: i64) -> Self { + Self::start(value) + } +} + +impl TimeIndexEntry { + pub fn new(t: i64, s: usize) -> Self { + Self(t, s) + } + + pub fn from_input( + g: &G, + t: T, + ) -> Result { + let t = t.try_into_input_time()?; + Ok(match t { + InputTime::Simple(t) => Self::new(t, g.next_event_id()), + InputTime::Indexed(t, s) => Self::new(t, s), + }) + } + + pub fn start(t: i64) -> Self { + Self(t, 0) + } + + pub fn end(t: i64) -> Self { + Self(t.saturating_add(1), 0) + } +} + +impl AsTime for i64 { + fn t(&self) -> &i64 { + self + } + + fn range(w: Range) -> Range { + w + } +} + +impl AsTime for TimeIndexEntry { + fn t(&self) -> &i64 { + &self.0 + } + fn range(w: Range) -> Range { + Self::start(w.start)..Self::start(w.end) + } +} + +#[derive(Default, Debug, Clone, Serialize, Deserialize, PartialEq)] +pub enum TimeIndex { + #[default] + Empty, + One(T), + Set(BTreeSet), +} + +impl TimeIndex { + pub fn is_empty(&self) -> bool { + matches!(self, TimeIndex::Empty) + } + + pub fn one(ti: T) -> Self { + Self::One(ti) + } + pub fn insert(&mut self, ti: T) -> bool { + match self { + TimeIndex::Empty => { + *self = TimeIndex::One(ti); + true + } + TimeIndex::One(t0) => { + if t0 == &ti { + false + } else { + *self = TimeIndex::Set([*t0, ti].into_iter().collect()); + true + } + } + TimeIndex::Set(ts) => ts.insert(ti), + } + } + + pub(crate) fn contains(&self, w: Range) -> bool { + match self { + TimeIndex::Empty => false, + TimeIndex::One(t) => w.contains(t.t()), + TimeIndex::Set(ts) => ts.range(T::range(w)).next().is_some(), + } + } + + pub(crate) fn iter(&self) -> Box + Send + '_> { + match self { + TimeIndex::Empty => Box::new(std::iter::empty()), + TimeIndex::One(t) => Box::new(std::iter::once(t)), + TimeIndex::Set(ts) => 
Box::new(ts.iter()), + } + } + + pub(crate) fn range_iter( + &self, + w: Range, + ) -> Box + Send + '_> { + match self { + TimeIndex::Empty => Box::new(std::iter::empty()), + TimeIndex::One(t) => { + if w.contains(t.t()) { + Box::new(std::iter::once(t)) + } else { + Box::new(std::iter::empty()) + } + } + TimeIndex::Set(ts) => Box::new(ts.range(T::range(w))), + } + } + + // = note: see issue #65991 for more information + // = note: required when coercing `Box + Send>` into `Box + Send>` + pub(crate) fn range_iter_forward( + &self, + w: Range, + ) -> Box + Send + '_> { + Box::new(self.range_iter(w)) + } +} + +pub enum TimeIndexWindow<'a, T: AsTime> { + Empty, + TimeIndexRange { + timeindex: &'a TimeIndex, + range: Range, + }, + All(&'a TimeIndex), +} + +pub struct LayeredTimeIndexWindow<'a, T: AsTime> { + timeindex: Vec>, +} + +pub enum WindowIter<'a> { + Empty, + TimeIndexRange(Box + Send + 'a>), + All(Box + Send + 'a>), +} + +impl<'a> Iterator for WindowIter<'a> { + type Item = &'a i64; + + fn next(&mut self) -> Option { + match self { + WindowIter::Empty => None, + WindowIter::TimeIndexRange(iter) => iter.next(), + WindowIter::All(iter) => iter.next(), + } + } +} + +pub type LockedLayeredIndex<'a, T> = LayeredIndex<'a, T, LockedView<'a, Vec>>>; + +pub struct LayeredIndex<'a, T: AsTime, V: Deref>> + 'a> { + layers: LayerIds, + view: V, + marker: PhantomData<&'a Vec>>, +} + +impl<'a, T: AsTime, V: Deref>> + 'a> LayeredIndex<'a, T, V> { + pub fn new(layers: LayerIds, view: V) -> Self { + Self { + layers, + view, + marker: PhantomData, + } + } + + pub fn range_iter(&'a self, w: Range) -> Box + Send + '_> { + let iter = self + .view + .iter() + .enumerate() + .filter(|(i, _)| self.layers.contains(i)) + .map(|(_, t)| t.range_iter(w.clone()).map(|t| t.t())) + .kmerge() + .dedup(); + Box::new(iter) + } + + /// Earliest timestamp over the selected layers, or `None` if none of them has an entry. + pub fn first(&self) -> Option { + self.view + .iter() + .enumerate() + .filter(|(i, _)| self.layers.contains(i)) + // `None` orders before `Some(_)`, so empty layers must be dropped before `min()`; + // otherwise a single empty layer would hide the entries of every other layer. + .filter_map(|(_, t)| t.first_t()) + .min() + }
+ + pub fn active(&self, w: Range) -> bool { + self.view + .iter() + .enumerate() + .filter(|(i, _)| self.layers.contains(i)) + .any(|(_, t)| t.active(w.clone())) + } + + fn last_window(&self, w: Range) -> Option { + self.view + .iter() + .enumerate() + .filter(|(i, _)| self.layers.contains(i)) + .map(|(_, t)| t.range_iter(w.clone()).next_back().map(|t| *t.t())) + .max() + .flatten() + } +} + +impl<'a, T: AsTime, V: Deref>> + 'a> TimeIndexOps + for LayeredIndex<'a, T, V> +{ + type IterType<'b> = Box + Send + 'b> where Self: 'b; + type WindowType<'b> = LayeredTimeIndexWindow<'b, T> where Self: 'b; + type IndexType = T; + + // Every method in this impl only looks at the layers selected by `self.layers`, + // so that `active`, `first`, `last` and `iter_t` agree with `range`. + fn active(&self, w: Range) -> bool { + self.view + .iter() + .enumerate() + .any(|(l, t)| self.layers.contains(&l) && t.active(w.clone())) + } + + fn range(&self, w: Range) -> LayeredTimeIndexWindow { + let timeindex = self + .view + .iter() + .enumerate() + .filter_map(|(l, t)| self.layers.contains(&l).then(|| t.range(w.clone()))) + .collect_vec(); + LayeredTimeIndexWindow { timeindex } + } + + fn first(&self) -> Option<&T> { + self.view + .iter() + .enumerate() + .filter(|(l, _)| self.layers.contains(l)) + .flat_map(|(_, t)| t.first()) + .min() + } + + fn last(&self) -> Option<&T> { + self.view + .iter() + .enumerate() + .filter(|(l, _)| self.layers.contains(l)) + .flat_map(|(_, t)| t.last()) + .max() + } + + fn iter_t(&self) -> Self::IterType<'_> { + let iter = self + .view + .iter() + .enumerate() + .filter(|(l, _)| self.layers.contains(l)) + .map(|(_, t)| t.iter_t()) + .kmerge() + .dedup(); + Box::new(iter) + } +} + +pub trait TimeIndexOps { + type IterType<'a>: Iterator + Send + 'a + where + Self: 'a; + + type WindowType<'a>: TimeIndexOps + 'a + where + Self: 'a; + type IndexType: AsTime; + + fn active(&self, w: Range) -> bool; + + fn range<'a>(&'a self, w: Range) -> Self::WindowType<'a>; + + fn first_t(&self) -> Option { + self.first().map(|ti| *ti.t()) + } + + fn first(&self) -> Option<&Self::IndexType>; + + fn last_t(&self) -> Option { + self.last().map(|ti| *ti.t()) + } + + fn last(&self) -> Option<&Self::IndexType>; + + fn iter_t(&self) -> Self::IterType<'_>; +} + +impl TimeIndexOps for TimeIndex { + type IterType<'a> = Box + Send + 'a> where T: 'a; + type WindowType<'a> = TimeIndexWindow<'a, T> where Self:
'a; + type IndexType = T; + + #[inline(always)] + fn active(&self, w: Range) -> bool { + match &self { + TimeIndex::Empty => false, + TimeIndex::One(t) => w.contains(t.t()), + TimeIndex::Set(ts) => ts.range(T::range(w)).next().is_some(), + } + } + + fn range(&self, w: Range) -> TimeIndexWindow<'_, T> { + match &self { + TimeIndex::Empty => TimeIndexWindow::Empty, + TimeIndex::One(t) => { + if w.contains(t.t()) { + TimeIndexWindow::All(self) + } else { + TimeIndexWindow::Empty + } + } + TimeIndex::Set(ts) => { + if let Some(min_val) = ts.first() { + if let Some(max_val) = ts.last() { + if min_val.t() >= &w.start && max_val.t() < &w.end { + TimeIndexWindow::All(self) + } else { + TimeIndexWindow::TimeIndexRange { + timeindex: self, + range: w, + } + } + } else { + TimeIndexWindow::Empty + } + } else { + TimeIndexWindow::Empty + } + } + } + } + + fn first(&self) -> Option<&T> { + match self { + TimeIndex::Empty => None, + TimeIndex::One(t) => Some(t), + TimeIndex::Set(ts) => ts.first(), + } + } + + fn last(&self) -> Option<&T> { + match self { + TimeIndex::Empty => None, + TimeIndex::One(t) => Some(t), + TimeIndex::Set(ts) => ts.last(), + } + } + + fn iter_t(&self) -> Box + Send + '_> { + match self { + TimeIndex::Empty => Box::new(std::iter::empty()), + TimeIndex::One(t) => Box::new(std::iter::once(t.t())), + TimeIndex::Set(ts) => Box::new(ts.iter().map(|ti| ti.t())), + } + } +} + +impl<'b, T: AsTime> TimeIndexOps for TimeIndexWindow<'b, T> +where + Self: 'b, +{ + type IterType<'a> = WindowIter<'a> where Self: 'a; + type WindowType<'a> = TimeIndexWindow<'a, T> where Self: 'a; + type IndexType = T; + + fn active(&self, w: Range) -> bool { + match self { + TimeIndexWindow::Empty => false, + TimeIndexWindow::TimeIndexRange { timeindex, range } => { + w.start < range.end + && w.end > range.start + && (timeindex.active(max(w.start, range.start)..min(w.end, range.end))) + } + TimeIndexWindow::All(timeindex) => timeindex.active(w), + } + } + + fn range(&self, w: Range) -> 
TimeIndexWindow { + match self { + TimeIndexWindow::Empty => TimeIndexWindow::Empty, + TimeIndexWindow::TimeIndexRange { timeindex, range } => { + let start = max(range.start, w.start); + let end = min(range.start, w.start); + if end <= start { + TimeIndexWindow::Empty + } else { + TimeIndexWindow::TimeIndexRange { + timeindex, + range: start..end, + } + } + } + TimeIndexWindow::All(timeindex) => timeindex.range(w), + } + } + + fn first(&self) -> Option<&T> { + match self { + TimeIndexWindow::Empty => None, + TimeIndexWindow::TimeIndexRange { timeindex, range } => { + timeindex.range_iter(range.clone()).next() + } + TimeIndexWindow::All(timeindex) => timeindex.first(), + } + } + + fn last(&self) -> Option<&T> { + match self { + TimeIndexWindow::Empty => None, + TimeIndexWindow::TimeIndexRange { timeindex, range } => { + timeindex.range_iter(range.clone()).next_back() + } + TimeIndexWindow::All(timeindex) => timeindex.last(), + } + } + + fn iter_t(&self) -> Self::IterType<'_> { + match self { + TimeIndexWindow::Empty => WindowIter::Empty, + TimeIndexWindow::TimeIndexRange { timeindex, range } => WindowIter::TimeIndexRange( + Box::new(timeindex.range_iter_forward(range.clone()).map(|t| t.t())), + ), + TimeIndexWindow::All(timeindex) => WindowIter::All(timeindex.iter_t()), + } + } +} + +impl<'b, T: AsTime> TimeIndexOps for LayeredTimeIndexWindow<'b, T> +where + Self: 'b, +{ + type IterType<'a> = KMerge> where Self: 'a; + type WindowType<'a> = LayeredTimeIndexWindow<'a, T> where Self: 'a; + type IndexType = T; + + fn active(&self, w: Range) -> bool { + self.timeindex.iter().any(|t| t.active(w.clone())) + } + + fn range<'a>(&'a self, w: Range) -> Self::WindowType<'a> { + let timeindex = self + .timeindex + .iter() + .map(|t| t.range(w.clone())) + .collect_vec(); + Self::WindowType { timeindex } + } + + fn first(&self) -> Option<&T> { + self.timeindex.iter().flat_map(|t| t.first()).min() + } + + fn last(&self) -> Option<&T> { + self.timeindex.iter().flat_map(|t| 
t.last()).max() + } + + fn iter_t(&self) -> Self::IterType<'_> { + self.timeindex.iter().map(|t| t.iter_t()).kmerge() + } +} diff --git a/raphtory/src/core/tadjset.rs b/raphtory/src/core/tadjset.rs deleted file mode 100644 index 52a4088d12..0000000000 --- a/raphtory/src/core/tadjset.rs +++ /dev/null @@ -1,224 +0,0 @@ -//! A data structure for efficiently storing and querying the temporal adjacency set of a node in a temporal graph. - -use crate::core::timeindex::TimeIndex; -use serde::{Deserialize, Serialize}; -use std::{collections::BTreeMap, hash::Hash, ops::Range}; - -const SMALL_SET: usize = 1024; - -/** - * Temporal adjacency set can track when adding edge v -> u - * does u exist already - * and if it does what is the edge metadata - * and if the edge is remote or local - * - * */ -#[derive(Debug, Default, Serialize, Deserialize, PartialEq)] -pub enum TAdjSet { - #[default] - Empty, - One(V, usize), - Small { - vs: Vec, // the neighbours - edges: Vec, // edge metadata - }, - Large { - vs: BTreeMap, // this is equiv to vs and edges - }, -} - -impl TAdjSet { - pub fn new(v: V, e: usize) -> Self { - Self::One(v, e) - } - - pub fn len(&self) -> usize { - match self { - TAdjSet::Empty => 0, - TAdjSet::One(_, _) => 1, - TAdjSet::Small { vs, .. } => vs.len(), - TAdjSet::Large { vs } => vs.len(), - } - } - - pub fn len_window(&self, timestamps: &[TimeIndex], window: &Range) -> usize { - match self { - TAdjSet::Empty => 0, - TAdjSet::One(_, e) => { - if timestamps[*e].active(window.clone()) { - 1 - } else { - 0 - } - } - - TAdjSet::Small { edges, .. 
} => edges - .iter() - .filter(|&&e| timestamps[e].active(window.clone())) - .count(), - TAdjSet::Large { vs } => vs - .values() - .filter(|&&e| timestamps[e].active(window.clone())) - .count(), - } - } - - pub fn push(&mut self, v: V, e: usize) { - match self { - TAdjSet::Empty => { - *self = Self::new(v, e); - } - TAdjSet::One(vv, ee) => { - if *vv < v { - *self = Self::Small { - vs: vec![*vv, v], - edges: vec![*ee, e], - } - } else if *vv > v { - *self = Self::Small { - vs: vec![v, *vv], - edges: vec![e, *ee], - } - } - } - TAdjSet::Small { vs, edges } => match vs.binary_search(&v) { - Ok(_) => {} - Err(i) => { - if vs.len() < SMALL_SET { - vs.insert(i, v); - edges.insert(i, e); - } else { - let mut map = - BTreeMap::from_iter(vs.iter().copied().zip(edges.iter().copied())); - map.insert(v, e); - *self = Self::Large { vs: map } - } - } - }, - TAdjSet::Large { vs } => { - vs.insert(v, e); - } - } - } - - pub fn iter(&self) -> Box + Send + '_> { - match self { - TAdjSet::Empty => Box::new(std::iter::empty()), - TAdjSet::One(v, e) => Box::new(std::iter::once((*v, *e))), - TAdjSet::Small { vs, edges } => Box::new(vs.iter().copied().zip(edges.iter().copied())), - TAdjSet::Large { vs } => Box::new(vs.iter().map(|(k, v)| (*k, *v))), - } - } - - pub fn vertices(&self) -> Box + Send + '_> { - match self { - TAdjSet::Empty => Box::new(std::iter::empty()), - TAdjSet::One(v, ..) => Box::new(std::iter::once(*v)), - TAdjSet::Small { vs, .. 
} => Box::new(vs.iter().copied()), - TAdjSet::Large { vs } => Box::new(vs.keys().copied()), - } - } - - pub fn iter_window<'a>( - &'a self, - timestamps: &'a [TimeIndex], - window: &Range, - ) -> Box + Send + 'a> { - let w = window.clone(); - Box::new( - self.iter() - .filter(move |(_, e)| timestamps[*e].active(w.clone())), - ) - } - - pub fn vertices_window<'a>( - &'a self, - timestamps: &'a [TimeIndex], - window: &Range, - ) -> Box + Send + 'a> { - let w = window.clone(); - Box::new( - self.iter() - .filter(move |(_, e)| timestamps[*e].active(w.clone())) - .map(|(v, _)| v), - ) - } - - pub fn find(&self, v: V) -> Option { - match self { - TAdjSet::Empty => None, - TAdjSet::One(vv, e) => (*vv == v).then_some(*e), - TAdjSet::Small { vs, edges } => vs.binary_search(&v).ok().map(|i| edges[i]), - TAdjSet::Large { vs } => vs.get(&v).copied(), - } - } -} - -#[cfg(test)] -mod tadjset_tests { - use super::*; - - #[quickcheck] - fn insert_fuzz(input: Vec) -> bool { - let mut ts: TAdjSet = TAdjSet::default(); - - for (e, i) in input.iter().enumerate() { - ts.push(*i, e); - } - - let res = input.iter().all(|i| ts.find(*i).is_some()); - if !res { - let ts_vec: Vec<(usize, usize)> = ts.iter().collect(); - println!("Input: {:?}", input); - println!("TAdjSet: {:?}", ts_vec); - } - res - } - - #[test] - fn insert() { - let mut ts: TAdjSet = TAdjSet::default(); - - ts.push(7, 5); - let actual = ts.iter().collect::>(); - let expected: Vec<(usize, usize)> = vec![(7, 5)]; - assert_eq!(actual, expected) - } - - #[test] - fn insert_large() { - let mut ts: TAdjSet = TAdjSet::default(); - - for i in 0..SMALL_SET + 2 { - ts.push(i, i); - } - - for i in 0..SMALL_SET + 2 { - assert_eq!(ts.find(i), Some(i)); - } - } - - #[test] - fn insert_twice() { - let mut ts: TAdjSet = TAdjSet::default(); - - ts.push(7, 9); - ts.push(7, 9); - - let actual = ts.iter().collect::>(); - let expected: Vec<(usize, usize)> = vec![(7, 9)]; - assert_eq!(actual, expected); - } - - #[test] - fn 
insert_two_different() { - let mut ts: TAdjSet = TAdjSet::default(); - - ts.push(1, 0); - ts.push(7, 1); - - let actual = ts.iter().collect::>(); - let expected: Vec<(usize, usize)> = vec![(1, 0), (7, 1)]; - assert_eq!(actual, expected); - } -} diff --git a/raphtory/src/core/tgraph.rs b/raphtory/src/core/tgraph.rs deleted file mode 100644 index c54d01bf3d..0000000000 --- a/raphtory/src/core/tgraph.rs +++ /dev/null @@ -1,2105 +0,0 @@ -//! A data structure for representing temporal graphs. - -use self::errors::MutateGraphError; -use crate::core::edge_layer::{EdgeLayer, VID}; -use crate::core::edge_ref::EdgeRef; -use crate::core::props::Props; -use crate::core::timeindex::TimeIndex; -use crate::core::tprop::TProp; -use crate::core::vertex::InputVertex; -use crate::core::vertex_ref::{LocalVertexRef, VertexRef}; -use crate::core::Direction; -use crate::core::{Prop, Time}; -use itertools::Itertools; -use rustc_hash::FxHashMap; -use serde::{Deserialize, Serialize}; -use std::{collections::HashMap, ops::Range}; - -pub(crate) mod errors { - use crate::core::props::IllegalMutate; - - #[derive(thiserror::Error, Debug, PartialEq)] - pub enum MutateGraphError { - #[error("Create vertex '{vertex_id}' first before adding static properties to it")] - VertexNotFoundError { vertex_id: u64 }, - #[error("cannot change property for vertex '{vertex_id}'")] - IllegalVertexPropertyChange { - vertex_id: u64, - source: IllegalMutate, - }, - #[error("Create edge '{0}' -> '{1}' first before adding static properties to it")] - MissingEdge(u64, u64), // src, dst - #[error("cannot change property for edge '{src_id}' -> '{dst_id}'")] - IllegalEdgePropertyChange { - src_id: u64, - dst_id: u64, - source: IllegalMutate, - }, - #[error("cannot update property as is '{first_type}' and '{second_type}' given'")] - PropertyChangedType { - first_type: &'static str, - second_type: &'static str, - }, - } -} - -pub type MutateGraphResult = Result<(), MutateGraphError>; - -#[derive(Debug, Serialize, 
Deserialize, PartialEq)] -pub struct TemporalGraph { - id: usize, - // Maps global (logical) id to the local (physical) id which is an index to the adjacency list vector - pub(crate) logical_to_physical: FxHashMap, - - // global ids in insertion order for fast iterations, maps physical ids to logical ids - pub(crate) logical_ids: Vec, - - // Set of timestamps per vertex for fast window filtering - timestamps: Vec, - - // Properties abstraction for both vertices and edges - pub(crate) vertex_props: Props, - - // Edge layers - pub(crate) layers: Vec, - - //earliest time seen in this graph - pub(crate) earliest_time: i64, - - //latest time seen in this graph - pub(crate) latest_time: i64, -} - -impl TemporalGraph { - pub(crate) fn new(id: usize) -> Self { - Self { - id, - logical_to_physical: Default::default(), - logical_ids: Default::default(), - timestamps: Default::default(), - vertex_props: Default::default(), - layers: vec![EdgeLayer::new(0, id)], - earliest_time: i64::MAX, - latest_time: i64::MIN, - } - } -} - -// Internal helpers -impl TemporalGraph { - /// Checks if vertex ref is actually local and returns appropriate ID (either local pid or global id) - #[inline(always)] - fn local_id(&self, v: VertexRef) -> VID { - match v { - VertexRef::Local(LocalVertexRef { pid, .. 
}) => VID::Local(pid), - VertexRef::Remote(gid) => match self.logical_to_physical.get(&gid) { - Some(v_pid) => VID::Local(*v_pid), - None => VID::Remote(gid), - }, - } - } - - fn new_local_vertex(&self, pid: usize) -> LocalVertexRef { - LocalVertexRef { - shard_id: self.id, - pid, - } - } - - pub fn local_vertex(&self, v: VertexRef) -> Option { - match v { - VertexRef::Local(v) => { - (v.shard_id == self.id && v.pid < self.logical_ids.len()).then_some(v) - } - VertexRef::Remote(gid) => self.vertex(gid), - } - } - - pub fn local_vertex_window(&self, v: VertexRef, w: Range) -> Option { - self.local_vertex(v) - .filter(|v| self.timestamps[v.pid].active(w)) - } -} - -// Layer management: -impl TemporalGraph { - // TODO: we can completely replace this function with `layer_iter` if we are sure that doesn't - // affect performance - fn layer_iter(&self, id: Option) -> LayerIterator { - if self.layers.len() == 1 { - LayerIterator::Single(&self.layers[0]) - } else { - match id { - Some(id) => LayerIterator::Single(&self.layers[id]), - None => LayerIterator::Vector(&self.layers), - } - } - } -} - -enum LayerIterator<'a> { - Single(&'a EdgeLayer), - Vector(&'a Vec), -} - -impl TemporalGraph { - /// Global id of vertex - pub fn vertex_id(&self, v: LocalVertexRef) -> u64 { - self.logical_ids[v.pid] - } - - pub(crate) fn allocate_layer(&mut self, id: usize) { - self.layers.push(EdgeLayer::new(id, self.id)); - assert_eq!(self.layers.len(), id + 1) - } - - pub(crate) fn len(&self) -> usize { - self.logical_ids.len() - } - - pub(crate) fn len_window(&self, w: &Range) -> usize { - self.timestamps - .iter() - .filter(|&ts| ts.active(w.clone())) - .count() - } - - pub(crate) fn out_edges_len(&self, layer: Option) -> usize { - match self.layer_iter(layer) { - LayerIterator::Single(layer) => layer.out_edges_len(), - LayerIterator::Vector(_) => self - .vertices() - .map(|v| self.degree(v, Direction::OUT, None)) - .sum(), - } - } - - pub fn out_edges_len_window(&self, w: &Range

{ + pub(crate) fn new(props: P) -> Self { + Self { props } + } + pub fn keys(&self) -> Vec { + self.props.const_prop_keys().map(|v| v.clone()).collect() + } + + pub fn values(&self) -> Vec { + self.props.const_prop_values() + } + + pub fn iter(&self) -> Box + '_> { + Box::new(self.into_iter()) + } + + pub fn get(&self, key: &str) -> Option { + let id = self.props.get_const_prop_id(key)?; + self.props.get_const_prop(id) + } + + pub fn contains(&self, key: &str) -> bool { + self.get(key).is_some() + } + + pub fn as_map(&self) -> HashMap { + self.iter().collect() + } +} + +impl IntoIterator for ConstProperties

{ + type Item = (ArcStr, Prop); + type IntoIter = Zip, std::vec::IntoIter>; + + fn into_iter(self) -> Self::IntoIter { + let keys = self.keys(); + let vals = self.values(); + keys.into_iter().zip(vals) + } +} + +impl IntoIterator for &ConstProperties

{ + type Item = (ArcStr, Prop); + type IntoIter = Zip, std::vec::IntoIter>; + + fn into_iter(self) -> Self::IntoIter { + let keys = self.keys(); + let vals = self.values(); + keys.into_iter().zip(vals) + } +} + +impl PartialEq for ConstProperties

{ + fn eq(&self, other: &Self) -> bool { + self.as_map() == other.as_map() + } +} diff --git a/raphtory/src/db/api/properties/internal.rs b/raphtory/src/db/api/properties/internal.rs new file mode 100644 index 0000000000..b71e91982c --- /dev/null +++ b/raphtory/src/db/api/properties/internal.rs @@ -0,0 +1,157 @@ +use crate::{ + core::{ArcStr, Prop}, + db::api::view::internal::Base, +}; +use enum_dispatch::enum_dispatch; + +#[enum_dispatch] +pub trait TemporalPropertyViewOps { + fn temporal_value(&self, id: usize) -> Option { + self.temporal_values(id).last().cloned() + } + fn temporal_history(&self, id: usize) -> Vec; + fn temporal_values(&self, id: usize) -> Vec; + fn temporal_value_at(&self, id: usize, t: i64) -> Option { + let history = self.temporal_history(id); + match history.binary_search(&t) { + Ok(index) => Some(self.temporal_values(id)[index].clone()), + Err(index) => (index > 0).then(|| self.temporal_values(id)[index - 1].clone()), + } + } +} + +#[enum_dispatch] +pub trait ConstPropertiesOps { + /// Find id for property name (note this only checks the meta-data, not if the property actually exists for the entity) + fn get_const_prop_id(&self, name: &str) -> Option; + fn get_const_prop_name(&self, id: usize) -> ArcStr; + fn const_prop_ids(&self) -> Box + '_>; + fn const_prop_keys(&self) -> Box + '_> { + Box::new(self.const_prop_ids().map(|id| self.get_const_prop_name(id))) + } + fn const_prop_values(&self) -> Vec { + self.const_prop_ids() + .map(|k| { + self.get_const_prop(k) + .expect("ids that come from the internal iterator should exist") + }) + .collect() + } + fn get_const_prop(&self, id: usize) -> Option; +} + +#[enum_dispatch] +pub trait TemporalPropertiesOps { + fn get_temporal_prop_id(&self, name: &str) -> Option; + fn get_temporal_prop_name(&self, id: usize) -> ArcStr; + + fn temporal_prop_ids(&self) -> Box + '_>; + fn temporal_prop_keys(&self) -> Box + '_> { + Box::new( + self.temporal_prop_ids() + .map(|id| self.get_temporal_prop_name(id)), + 
) + } +} + +pub trait PropertiesOps: + TemporalPropertiesOps + TemporalPropertyViewOps + ConstPropertiesOps +{ +} + +impl PropertiesOps for P {} + +pub trait InheritTemporalPropertyViewOps: Base {} +pub trait InheritTemporalPropertiesOps: Base {} +pub trait InheritStaticPropertiesOps: Base {} +pub trait InheritPropertiesOps: Base {} + +impl InheritStaticPropertiesOps for P {} +impl InheritTemporalPropertiesOps for P {} + +impl TemporalPropertyViewOps for P +where + P::Base: TemporalPropertyViewOps, +{ + #[inline] + fn temporal_value(&self, id: usize) -> Option { + self.base().temporal_value(id) + } + + #[inline] + fn temporal_history(&self, id: usize) -> Vec { + self.base().temporal_history(id) + } + + #[inline] + fn temporal_values(&self, id: usize) -> Vec { + self.base().temporal_values(id) + } + + #[inline] + fn temporal_value_at(&self, id: usize, t: i64) -> Option { + self.base().temporal_value_at(id, t) + } +} + +impl InheritTemporalPropertyViewOps for P {} + +impl TemporalPropertiesOps for P +where + P::Base: TemporalPropertiesOps, +{ + #[inline] + fn get_temporal_prop_id(&self, name: &str) -> Option { + self.base().get_temporal_prop_id(name) + } + + #[inline] + fn get_temporal_prop_name(&self, id: usize) -> ArcStr { + self.base().get_temporal_prop_name(id) + } + + #[inline] + fn temporal_prop_ids(&self) -> Box + '_> { + self.base().temporal_prop_ids() + } + + #[inline] + fn temporal_prop_keys(&self) -> Box + '_> { + self.base().temporal_prop_keys() + } +} + +impl ConstPropertiesOps for P +where + P::Base: ConstPropertiesOps, +{ + #[inline] + fn get_const_prop_id(&self, name: &str) -> Option { + self.base().get_const_prop_id(name) + } + + #[inline] + fn get_const_prop_name(&self, id: usize) -> ArcStr { + self.base().get_const_prop_name(id) + } + + #[inline] + fn const_prop_ids(&self) -> Box + '_> { + self.base().const_prop_ids() + } + + #[inline] + fn const_prop_keys(&self) -> Box + '_> { + self.base().const_prop_keys() + } + + #[inline] + fn 
const_prop_values(&self) -> Vec { + self.base().const_prop_values() + } + + #[inline] + fn get_const_prop(&self, id: usize) -> Option { + self.base().get_const_prop(id) + } +} diff --git a/raphtory/src/db/api/properties/mod.rs b/raphtory/src/db/api/properties/mod.rs new file mode 100644 index 0000000000..2ab4d0830f --- /dev/null +++ b/raphtory/src/db/api/properties/mod.rs @@ -0,0 +1,8 @@ +mod constant_props; +pub mod internal; +mod props; +mod temporal_props; + +pub use constant_props::*; +pub use props::*; +pub use temporal_props::*; diff --git a/raphtory/src/db/api/properties/props.rs b/raphtory/src/db/api/properties/props.rs new file mode 100644 index 0000000000..8368a2afbf --- /dev/null +++ b/raphtory/src/db/api/properties/props.rs @@ -0,0 +1,98 @@ +use crate::{ + core::{ArcStr, Prop}, + db::api::properties::{ + constant_props::ConstProperties, internal::*, temporal_props::TemporalProperties, + }, +}; +use std::collections::HashMap; + +/// View of the properties of an entity (graph|vertex|edge) +#[derive(Clone)] +pub struct Properties { + pub(crate) props: P, +} + +impl Properties

{ + pub fn new(props: P) -> Properties

{ + Self { props } + } + + /// Get property value. + /// + /// First searches temporal properties and returns latest value if it exists. + /// If not, it falls back to static properties. + pub fn get(&self, key: &str) -> Option { + self.props + .get_temporal_prop_id(key) + .and_then(|k| self.props.temporal_value(k)) + .or_else(|| { + self.props + .get_const_prop_id(key) + .and_then(|id| self.props.get_const_prop(id)) + }) + } + + /// Check if property `key` exists. + pub fn contains(&self, key: &str) -> bool { + self.get(key).is_some() + } + + /// Iterate over all property keys + pub fn keys(&self) -> impl Iterator + '_ { + self.props.temporal_prop_keys().chain( + self.props + .const_prop_keys() + .filter(|k| self.props.get_temporal_prop_id(k).is_none()), + ) + } + + /// Iterate over all property values + pub fn values(&self) -> impl Iterator + '_ { + self.keys().map(|k| self.get(&k).unwrap()) + } + + /// Iterate over all property key-value pairs + pub fn iter(&self) -> impl Iterator + '_ { + self.keys().zip(self.values()) + } + + /// Get a view of the temporal properties only. + pub fn temporal(&self) -> TemporalProperties

{ + TemporalProperties::new(self.props.clone()) + } + + /// Get a view of the constant properties (meta-data) only. + pub fn constant(&self) -> ConstProperties

{ + ConstProperties::new(self.props.clone()) + } + + /// Collect properties into vector + pub fn as_vec(&self) -> Vec<(ArcStr, Prop)> { + self.iter().map(|(k, v)| (k, v)).collect() + } + + /// Collect properties into map + pub fn as_map(&self) -> HashMap { + self.iter().map(|(k, v)| (k.clone(), v)).collect() + } +} + +impl IntoIterator for Properties

{ + type Item = (ArcStr, Prop); + type IntoIter = Box>; + + fn into_iter(self) -> Self::IntoIter { + let keys: Vec<_> = self.keys().map(|k| k.clone()).collect(); + let vals: Vec<_> = self.values().collect(); + Box::new(keys.into_iter().zip(vals)) + } +} + +impl<'a, P: PropertiesOps + Clone + 'a> IntoIterator for &'a Properties

{ + type Item = (ArcStr, Prop); + type IntoIter = Box + 'a>; + + fn into_iter(self) -> Self::IntoIter { + Box::new(self.iter()) + } +} diff --git a/raphtory/src/db/api/properties/temporal_props.rs b/raphtory/src/db/api/properties/temporal_props.rs new file mode 100644 index 0000000000..798630f5c8 --- /dev/null +++ b/raphtory/src/db/api/properties/temporal_props.rs @@ -0,0 +1,167 @@ +use crate::{ + core::{ArcStr, Prop, PropUnwrap}, + db::api::properties::internal::PropertiesOps, + prelude::Graph, +}; +use chrono::NaiveDateTime; +use std::{collections::HashMap, iter::Zip, sync::Arc}; + +pub struct TemporalPropertyView { + pub(crate) id: usize, + pub(crate) props: P, +} + +impl TemporalPropertyView

{ + pub(crate) fn new(props: P, key: usize) -> Self { + TemporalPropertyView { props, id: key } + } + pub fn history(&self) -> Vec { + self.props.temporal_history(self.id) + } + pub fn values(&self) -> Vec { + self.props.temporal_values(self.id) + } + pub fn iter(&self) -> impl Iterator { + self.into_iter() + } + pub fn at(&self, t: i64) -> Option { + self.props.temporal_value_at(self.id, t) + } + pub fn latest(&self) -> Option { + self.props.temporal_value(self.id) + } +} + +impl IntoIterator for TemporalPropertyView

{ + type Item = (i64, Prop); + type IntoIter = Zip, std::vec::IntoIter>; + + fn into_iter(self) -> Self::IntoIter { + let hist = self.history(); + let vals = self.values(); + hist.into_iter().zip(vals) + } +} + +impl IntoIterator for &TemporalPropertyView

{ + type Item = (i64, Prop); + type IntoIter = Zip, std::vec::IntoIter>; + + fn into_iter(self) -> Self::IntoIter { + let hist = self.history(); + let vals = self.values(); + hist.into_iter().zip(vals) + } +} + +pub struct TemporalProperties { + pub(crate) props: P, +} + +impl IntoIterator for TemporalProperties

{ + type Item = (ArcStr, TemporalPropertyView

); + type IntoIter = Zip, std::vec::IntoIter>>; + + fn into_iter(self) -> Self::IntoIter { + let keys: Vec<_> = self.keys().map(|k| k.clone()).collect(); + let values: Vec<_> = self.values().collect(); + keys.into_iter().zip(values) + } +} + +impl TemporalProperties

{ + pub(crate) fn new(props: P) -> Self { + Self { props } + } + pub fn keys(&self) -> impl Iterator + '_ { + self.props.temporal_prop_keys() + } + + pub fn contains(&self, key: &str) -> bool { + self.props.get_temporal_prop_id(key).is_some() + } + + pub fn values(&self) -> impl Iterator> + '_ { + self.props + .temporal_prop_ids() + .map(|k| TemporalPropertyView::new(self.props.clone(), k)) + } + + pub fn iter_latest(&self) -> impl Iterator + '_ { + self.iter().flat_map(|(k, v)| v.latest().map(|v| (k, v))) + } + + pub fn iter(&self) -> impl Iterator)> + '_ { + self.keys().zip(self.values()) + } + + pub fn get(&self, key: &str) -> Option> { + self.props + .get_temporal_prop_id(key) + .map(|k| TemporalPropertyView::new(self.props.clone(), k)) + } + + pub fn collect_properties(self) -> Vec<(ArcStr, Prop)> { + self.iter() + .flat_map(|(k, v)| v.latest().map(|v| (k.clone(), v))) + .collect() + } +} + +impl PropUnwrap for TemporalPropertyView

{ + fn into_u8(self) -> Option { + self.latest().into_u8() + } + + fn into_u16(self) -> Option { + self.latest().into_u16() + } + + fn into_str(self) -> Option { + self.latest().into_str() + } + + fn into_i32(self) -> Option { + self.latest().into_i32() + } + + fn into_i64(self) -> Option { + self.latest().into_i64() + } + + fn into_u32(self) -> Option { + self.latest().into_u32() + } + + fn into_u64(self) -> Option { + self.latest().into_u64() + } + + fn into_f32(self) -> Option { + self.latest().into_f32() + } + + fn into_f64(self) -> Option { + self.latest().into_f64() + } + + fn into_bool(self) -> Option { + self.latest().into_bool() + } + + fn into_list(self) -> Option>> { + self.latest().into_list() + } + + fn into_map(self) -> Option>> { + self.latest().into_map() + } + + fn into_dtime(self) -> Option { + self.latest().into_dtime() + } + + fn into_graph(self) -> Option { + self.latest().into_graph() + } +} diff --git a/raphtory/src/db/api/view/edge.rs b/raphtory/src/db/api/view/edge.rs new file mode 100644 index 0000000000..2336217720 --- /dev/null +++ b/raphtory/src/db/api/view/edge.rs @@ -0,0 +1,253 @@ +use crate::{ + core::{ + entities::{edges::edge_ref::EdgeRef, VID}, + storage::timeindex::{AsTime, TimeIndexEntry}, + ArcStr, + }, + db::api::{ + properties::{ + internal::{ConstPropertiesOps, TemporalPropertiesOps, TemporalPropertyViewOps}, + Properties, + }, + view::{internal::*, *}, + }, +}; + +pub trait EdgeViewInternalOps> { + fn graph(&self) -> G; + + fn eref(&self) -> EdgeRef; + + fn new_vertex(&self, v: VID) -> V; + + fn new_edge(&self, e: EdgeRef) -> Self; +} + +pub trait EdgeViewOps: + EdgeViewInternalOps + + ConstPropertiesOps + + TemporalPropertiesOps + + TemporalPropertyViewOps + + Sized + + Clone +{ + type Graph: GraphViewOps; + type Vertex: VertexViewOps; + type EList: EdgeListOps; + + /// list the activation timestamps for the edge + fn history(&self) -> Vec { + let layer_ids = self.graph().layer_ids().constrain_from_edge(self.eref()); + 
self.graph() + .edge_exploded(self.eref(), layer_ids) + .map(|e| *e.time().expect("exploded").t()) + .collect() + } + + /// Return a view of the properties of the edge + fn properties(&self) -> Properties { + Properties::new(self.clone()) + } + + /// Returns the source vertex of the edge. + fn src(&self) -> Self::Vertex { + let vertex = self.eref().src(); + self.new_vertex(vertex) + } + + /// Returns the destination vertex of the edge. + fn dst(&self) -> Self::Vertex { + let vertex = self.eref().dst(); + self.new_vertex(vertex) + } + + /// Check if edge is active at a given time point + fn active(&self, t: i64) -> bool { + let layer_ids = self.graph().layer_ids().constrain_from_edge(self.eref()); + match self.eref().time() { + Some(tt) => *tt.t() <= t && t <= self.latest_time().unwrap_or(*tt.t()), + None => self.graph().include_edge_window( + &self.graph().core_edge(self.eref().pid()), + t..t.saturating_add(1), + &layer_ids, + ), + } + } + + /// Returns the id of the edge. + fn id( + &self, + ) -> ( + ::ValueType, + ::ValueType, + ) { + (self.src().id(), self.dst().id()) + } + + /// Explodes an edge and returns all instances it had been updated as seperate edges + fn explode(&self) -> Self::EList; + + fn explode_layers(&self) -> Self::EList; + + /// Gets the first time an edge was seen + fn earliest_time(&self) -> Option { + let layer_ids = self.graph().layer_ids().constrain_from_edge(self.eref()); + self.graph().edge_earliest_time(self.eref(), layer_ids) + } + + /// Gets the latest time an edge was updated + fn latest_time(&self) -> Option { + let layer_ids = self.graph().layer_ids().constrain_from_edge(self.eref()); + self.graph().edge_latest_time(self.eref(), layer_ids) + } + + /// Gets the time stamp of the edge if it is exploded + fn time(&self) -> Option { + self.eref().time().map(|ti| *ti.t()) + } + + /// Gets the layer name for the edge if it is restricted to a single layer + fn layer_name(&self) -> Option { + self.eref() + .layer() + .map(|l_id| 
self.graph().get_layer_name(*l_id)) + } + + /// Gets the TimeIndexEntry if the edge is exploded + fn time_and_index(&self) -> Option { + self.eref().time() + } + + /// Gets the name of the layer this edge belongs to + fn layer_names(&self) -> BoxedIter { + let layer_ids = self + .graph() + .edge_layer_ids(&self.graph().core_edge(self.eref().pid())) + .constrain_from_edge(self.eref()); + self.graph().get_layer_names_from_ids(layer_ids) + } +} + +/// This trait defines the operations that can be +/// performed on a list of edges in a temporal graph view. +pub trait EdgeListOps: + IntoIterator, IntoIter = Self::IterType> + Sized +{ + type Graph: GraphViewOps; + type Vertex: VertexViewOps; + type Edge: EdgeViewOps; + type ValueType; + + /// the type of list of vertices + type VList: VertexListOps; + + /// the type of iterator + type IterType: Iterator>; + fn properties(self) -> Self::IterType>; + + /// gets the source vertices of the edges in the list + fn src(self) -> Self::VList; + + /// gets the destination vertices of the edges in the list + fn dst(self) -> Self::VList; + + fn id(self) -> Self::IterType<(u64, u64)>; + + /// returns a list of exploded edges that include an edge at each point in time + fn explode(self) -> Self::IterType; + + /// Get the timestamp for the earliest activity of the edge + fn earliest_time(self) -> Self::IterType>; + + /// Get the timestamp for the latest activity of the edge + fn latest_time(self) -> Self::IterType>; + + /// Get the timestamps of the edges if they are exploded + fn time(self) -> Self::IterType>; + + /// Get the layer name for each edge if it is restricted to a single layer + fn layer_name(self) -> Self::IterType>; +} + +#[cfg(test)] +mod test_edge_view { + use crate::prelude::*; + + #[test] + fn test_exploded_edge_properties() { + let g = Graph::new(); + let actual_prop_values = vec![0, 1, 2, 3]; + for v in actual_prop_values.iter() { + g.add_edge(0, 1, 2, [("test", *v)], None).unwrap(); + } + + let prop_values: Vec<_> 
= g + .edge(1, 2) + .unwrap() + .explode() + .flat_map(|e| e.properties().get("test").into_i32()) + .collect(); + assert_eq!(prop_values, actual_prop_values) + } + + #[test] + fn test_exploded_edge_multilayer() { + let g = Graph::new(); + let expected_prop_values = vec![0, 1, 2, 3]; + for v in expected_prop_values.iter() { + g.add_edge(0, 1, 2, [("test", *v)], Some((v % 2).to_string().as_str())) + .unwrap(); + } + + let prop_values: Vec<_> = g + .edge(1, 2) + .unwrap() + .explode() + .flat_map(|e| e.properties().get("test").into_i32()) + .collect(); + let actual_layers: Vec<_> = g + .edge(1, 2) + .unwrap() + .explode() + .map(|e| e.layer_names().into_iter().next().unwrap()) + .collect(); + let expected_layers: Vec<_> = expected_prop_values + .iter() + .map(|v| (v % 2).to_string()) + .collect(); + assert_eq!(prop_values, expected_prop_values); + assert_eq!(actual_layers, expected_layers); + } + + #[test] + fn test_sorting_by_secondary_index() { + let g = Graph::new(); + g.add_edge(0, 2, 3, NO_PROPS, None).unwrap(); + g.add_edge(0, 1, 2, NO_PROPS, None).unwrap(); + g.add_edge(0, 1, 2, [("second", true)], None).unwrap(); + g.add_edge(0, 2, 3, [("second", true)], None).unwrap(); + + let mut exploded_edges: Vec<_> = g.edges().explode().collect(); + exploded_edges.sort_by_key(|a| a.time_and_index()); + + let res: Vec<_> = exploded_edges + .into_iter() + .map(|e| { + ( + e.src().id(), + e.dst().id(), + e.properties().get("second").into_bool(), + ) + }) + .collect(); + assert_eq!( + res, + vec![ + (2, 3, None), + (1, 2, None), + (1, 2, Some(true)), + (2, 3, Some(true)) + ] + ) + } +} diff --git a/raphtory/src/db/api/view/graph.rs b/raphtory/src/db/api/view/graph.rs new file mode 100644 index 0000000000..389bbe9019 --- /dev/null +++ b/raphtory/src/db/api/view/graph.rs @@ -0,0 +1,331 @@ +use crate::{ + core::{ + entities::{ + graph::tgraph::InnerTemporalGraph, vertices::vertex_ref::VertexRef, LayerIds, VID, + }, + utils::{errors::GraphError, time::IntoTime}, + ArcStr, + }, + 
db::{ + api::{ + mutation::{AdditionOps, PropertyAdditionOps}, + properties::Properties, + view::{internal::*, layer::LayerOps, *}, + }, + graph::{ + edge::EdgeView, + vertex::VertexView, + vertices::Vertices, + views::{ + layer_graph::LayeredGraph, vertex_subgraph::VertexSubgraph, + window_graph::WindowedGraph, + }, + }, + }, + prelude::{DeletionOps, NO_PROPS}, +}; +use rustc_hash::FxHashSet; + +/// This trait GraphViewOps defines operations for accessing +/// information about a graph. The trait has associated types +/// that are used to define the type of the vertices, edges +/// and the corresponding iterators. +pub trait GraphViewOps: BoxableGraphView + Clone + Sized { + fn subgraph, V: Into>( + &self, + vertices: I, + ) -> VertexSubgraph; + /// Return all the layer ids in the graph + fn unique_layers(&self) -> BoxedIter; + /// Timestamp of earliest activity in the graph + fn earliest_time(&self) -> Option; + /// Timestamp of latest activity in the graph + fn latest_time(&self) -> Option; + /// Return the number of vertices in the graph. + fn count_vertices(&self) -> usize; + + /// Check if the graph is empty. + fn is_empty(&self) -> bool { + self.count_vertices() == 0 + } + + /// Return the number of edges in the graph. + fn count_edges(&self) -> usize; + + // Return the number of temporal edges in the graph. + fn count_temporal_edges(&self) -> usize; + + /// Check if the graph contains a vertex `v`. + fn has_vertex>(&self, v: T) -> bool; + + /// Check if the graph contains an edge given a pair of vertices `(src, dst)`. + fn has_edge, L: Into>(&self, src: T, dst: T, layer: L) -> bool; + + /// Get a vertex `v`. + fn vertex>(&self, v: T) -> Option>; + + /// Return a View of the vertices in the Graph + fn vertices(&self) -> Vertices; + + /// Get an edge `(src, dst)`. + fn edge>(&self, src: T, dst: T) -> Option>; + + /// Return an iterator over all edges in the graph. + fn edges(&self) -> Box> + Send>; + + /// Get all property values of this graph. 
+ /// + /// # Returns + /// + /// A view of the properties of the graph + fn properties(&self) -> Properties; + + /// Get a graph clone + /// + /// # Arguments + /// + /// # Returns + /// Graph - Returns clone of the graph + fn materialize(&self) -> Result; +} + +impl GraphViewOps for G { + fn subgraph, V: Into>( + &self, + vertices: I, + ) -> VertexSubgraph { + let filter = self.edge_filter(); + let layer_ids = self.layer_ids(); + let vertices: FxHashSet = vertices + .into_iter() + .flat_map(|v| self.internal_vertex_ref(v.into(), &layer_ids, filter)) + .collect(); + VertexSubgraph::new(self.clone(), vertices) + } + + /// Return all the layer ids in the graph + fn unique_layers(&self) -> BoxedIter { + self.get_layer_names_from_ids(self.layer_ids()) + } + + fn earliest_time(&self) -> Option { + self.earliest_time_global() + } + + fn latest_time(&self) -> Option { + self.latest_time_global() + } + + fn count_vertices(&self) -> usize { + self.vertices_len(self.layer_ids(), self.edge_filter()) + } + + fn count_temporal_edges(&self) -> usize { + self.edges().explode().count() + } + + #[inline] + fn count_edges(&self) -> usize { + self.edges_len(self.layer_ids(), self.edge_filter()) + } + + fn has_vertex>(&self, v: T) -> bool { + self.has_vertex_ref(v.into(), &self.layer_ids(), self.edge_filter()) + } + + fn has_edge, L: Into>(&self, src: T, dst: T, layer: L) -> bool { + let src_ref = src.into(); + let dst_ref = dst.into(); + let layers = self.layer_ids_from_names(layer.into()); + if let Some(src) = self.internalise_vertex(src_ref) { + if let Some(dst) = self.internalise_vertex(dst_ref) { + return self.has_edge_ref(src, dst, &layers, self.edge_filter()); + } + } + false + } + + fn vertex>(&self, v: T) -> Option> { + let v = v.into(); + self.internal_vertex_ref(v, &self.layer_ids(), self.edge_filter()) + .map(|v| VertexView::new_internal(self.clone(), v)) + } + + fn vertices(&self) -> Vertices { + let graph = self.clone(); + Vertices::new(graph) + } + + fn edge>(&self, 
src: T, dst: T) -> Option> { + let layer_ids = self.layer_ids(); + let edge_filter = self.edge_filter(); + if let Some(src) = self.internal_vertex_ref(src.into(), &layer_ids, edge_filter) { + if let Some(dst) = self.internal_vertex_ref(dst.into(), &layer_ids, edge_filter) { + return self + .edge_ref(src, dst, &layer_ids, edge_filter) + .map(|e| EdgeView::new(self.clone(), e)); + } + } + None + } + + fn edges(&self) -> Box> + Send> { + Box::new(self.vertices().iter().flat_map(|v| v.out_edges())) + } + + fn properties(&self) -> Properties { + Properties::new(self.clone()) + } + + fn materialize(&self) -> Result { + let g = InnerTemporalGraph::default(); + // Add edges first so we definitely have all associated vertices (important in case of persistent edges) + for e in self.edges() { + // FIXME: this needs to be verified + for ee in e.explode_layers() { + let layer_id = *ee.edge.layer().expect("exploded layers"); + let layer_ids = LayerIds::One(layer_id); + let layer_name = self.get_layer_name(layer_id); + let layer_name: Option<&str> = if layer_id == 0 { + None + } else { + Some(&layer_name) + }; + + for ee in ee.explode() { + g.add_edge( + ee.time().expect("exploded edge"), + ee.src().id(), + ee.dst().id(), + ee.properties().temporal().collect_properties(), + layer_name, + )?; + } + + if self.include_deletions() { + for t in self.edge_deletion_history(e.edge, layer_ids) { + g.delete_edge(t, e.src().id(), e.dst().id(), layer_name)?; + } + } + + g.edge(ee.src().id(), ee.dst().id()) + .expect("edge added") + .add_constant_properties(ee.properties().constant(), layer_name)?; + } + } + + for v in self.vertices().iter() { + for h in v.history() { + g.add_vertex(h, v.id(), NO_PROPS)?; + } + for (name, prop_view) in v.properties().temporal().iter() { + for (t, prop) in prop_view.iter() { + g.add_vertex(t, v.id(), [(name.clone(), prop)])?; + } + } + g.vertex(v.id()) + .expect("vertex added") + .add_constant_properties(v.properties().constant())?; + } + + 
g.add_constant_properties(self.properties().constant())?; + + Ok(self.new_base_graph(g)) + } +} + +impl TimeOps for G { + type WindowedViewType = WindowedGraph; + + fn start(&self) -> Option { + self.view_start() + } + + fn end(&self) -> Option { + self.view_end() + } + + fn window(&self, t_start: T, t_end: T) -> WindowedGraph { + WindowedGraph::new(self.clone(), t_start, t_end) + } +} + +impl LayerOps for G { + type LayeredViewType = LayeredGraph; + + fn default_layer(&self) -> Self::LayeredViewType { + LayeredGraph::new(self.clone(), 0.into()) + } + + fn layer>(&self, layers: L) -> Option { + let layers = layers.into(); + let ids = self.layer_ids_from_names(layers); + match ids { + LayerIds::None => None, + _ => Some(LayeredGraph::new(self.clone(), ids)), + } + } +} + +#[cfg(test)] +mod test_exploded_edges { + use crate::prelude::*; + + #[test] + fn test_exploded_edges() { + let g: Graph = Graph::new(); + g.add_edge(0, 0, 1, NO_PROPS, None).unwrap(); + g.add_edge(1, 0, 1, NO_PROPS, None).unwrap(); + g.add_edge(2, 0, 1, NO_PROPS, None).unwrap(); + g.add_edge(3, 0, 1, NO_PROPS, None).unwrap(); + + assert_eq!(g.count_temporal_edges(), 4) + } +} + +#[cfg(test)] +mod test_materialize { + use crate::prelude::*; + + #[test] + fn test_materialize() { + let g = Graph::new(); + g.add_edge(0, 1, 2, [("layer1", "1")], Some("1")).unwrap(); + g.add_edge(0, 1, 2, [("layer2", "2")], Some("2")).unwrap(); + + let gm = g.materialize().unwrap(); + assert!(!g + .layer("2") + .unwrap() + .edge(1, 2) + .unwrap() + .properties() + .temporal() + .contains("layer1")); + assert!(!gm + .into_events() + .unwrap() + .layer("2") + .unwrap() + .edge(1, 2) + .unwrap() + .properties() + .temporal() + .contains("layer1")); + } + + #[test] + fn changing_property_type_errors() { + let g = Graph::new(); + let props_0 = [("test", Prop::U64(1))]; + let props_1 = [("test", Prop::F64(0.1))]; + g.add_properties(0, props_0.clone()).unwrap(); + assert!(g.add_properties(1, props_1.clone()).is_err()); + + 
g.add_vertex(0, 1, props_0.clone()).unwrap(); + assert!(g.add_vertex(1, 1, props_1.clone()).is_err()); + + g.add_edge(0, 1, 2, props_0.clone(), None).unwrap(); + assert!(g.add_edge(1, 1, 2, props_1.clone(), None).is_err()); + } +} diff --git a/raphtory/src/db/api/view/internal/core_deletion_ops.rs b/raphtory/src/db/api/view/internal/core_deletion_ops.rs new file mode 100644 index 0000000000..10abe08c7e --- /dev/null +++ b/raphtory/src/db/api/view/internal/core_deletion_ops.rs @@ -0,0 +1,48 @@ +use crate::{ + core::{ + entities::{edges::edge_ref::EdgeRef, LayerIds}, + storage::timeindex::{LockedLayeredIndex, TimeIndexEntry}, + }, + db::api::view::internal::Base, +}; +use enum_dispatch::enum_dispatch; + +#[enum_dispatch] +pub trait CoreDeletionOps { + /// Get all the deletion timestamps for an edge + /// (this should always be global and not affected by windowing as deletion semantics may need information outside the current view!) + fn edge_deletions( + &self, + eref: EdgeRef, + layer_ids: LayerIds, + ) -> LockedLayeredIndex<'_, TimeIndexEntry>; +} + +pub trait InheritCoreDeletionOps: Base {} + +impl DelegateCoreDeletionOps for G +where + G::Base: CoreDeletionOps, +{ + type Internal = G::Base; + + fn graph(&self) -> &Self::Internal { + self.base() + } +} + +pub trait DelegateCoreDeletionOps { + type Internal: CoreDeletionOps + ?Sized; + + fn graph(&self) -> &Self::Internal; +} + +impl CoreDeletionOps for G { + fn edge_deletions( + &self, + eref: EdgeRef, + layer_ids: LayerIds, + ) -> LockedLayeredIndex<'_, TimeIndexEntry> { + self.graph().edge_deletions(eref, layer_ids) + } +} diff --git a/raphtory/src/db/api/view/internal/core_ops.rs b/raphtory/src/db/api/view/internal/core_ops.rs new file mode 100644 index 0000000000..94d53be15c --- /dev/null +++ b/raphtory/src/db/api/view/internal/core_ops.rs @@ -0,0 +1,376 @@ +use crate::{ + core::{ + entities::{ + edges::{edge_ref::EdgeRef, edge_store::EdgeStore}, + properties::{ + graph_props::GraphProps, + props::Meta, + 
tprop::{LockedLayeredTProp, TProp}, + }, + vertices::{vertex_ref::VertexRef, vertex_store::VertexStore}, + LayerIds, EID, VID, + }, + storage::{ + locked_view::LockedView, + timeindex::{LockedLayeredIndex, TimeIndex, TimeIndexEntry}, + ArcEntry, + }, + ArcStr, Prop, + }, + db::api::view::{internal::Base, BoxedIter}, +}; +use enum_dispatch::enum_dispatch; + +/// Core functions that should (almost-)always be implemented by pointing at the underlying graph. +#[enum_dispatch] +pub trait CoreGraphOps { + /// get the number of vertices in the main graph + fn unfiltered_num_vertices(&self) -> usize; + + fn vertex_meta(&self) -> &Meta; + + fn edge_meta(&self) -> &Meta; + + fn graph_meta(&self) -> &GraphProps; + + fn get_layer_name(&self, layer_id: usize) -> ArcStr; + + fn get_layer_id(&self, name: &str) -> Option; + + /// Get the layer name for a given id + fn get_layer_names_from_ids(&self, layer_ids: LayerIds) -> BoxedIter; + + /// Returns the external ID for a vertex + fn vertex_id(&self, v: VID) -> u64; + + /// Returns the string name for a vertex + fn vertex_name(&self, v: VID) -> String; + + /// Get all the addition timestamps for an edge + /// (this should always be global and not affected by windowing as deletion semantics may need information outside the current view!) + fn edge_additions( + &self, + eref: EdgeRef, + layer_ids: LayerIds, + ) -> LockedLayeredIndex<'_, TimeIndexEntry>; + + /// Get all the addition timestamps for a vertex + /// (this should always be global and not affected by windowing as deletion semantics may need information outside the current view!) + fn vertex_additions(&self, v: VID) -> LockedView>; + + /// Gets the internal reference for an external vertex reference and keeps internal references unchanged. + fn internalise_vertex(&self, v: VertexRef) -> Option; + + /// Gets the internal reference for an external vertex reference and keeps internal references unchanged. Assumes vertex exists! 
+ fn internalise_vertex_unchecked(&self, v: VertexRef) -> VID; + + /// Gets a static graph property. + /// + /// # Arguments + /// + /// * `name` - The name of the property. + /// + /// # Returns + /// + /// Option - The property value if it exists. + fn constant_prop(&self, id: usize) -> Option; + + /// Gets a temporal graph property. + /// + /// # Arguments + /// + /// * `name` - The name of the property. + /// + /// # Returns + /// + /// Option> - The history of property values if it exists. + fn temporal_prop(&self, id: usize) -> Option>; + + /// Gets a static property of a given vertex given the name and vertex reference. + /// + /// # Arguments + /// + /// * `v` - A reference to the vertex for which the property is being queried. + /// * `name` - The name of the property. + /// + /// # Returns + /// + /// Option - The property value if it exists. + fn constant_vertex_prop(&self, v: VID, id: usize) -> Option; + + /// Gets the keys of constant properties of a given vertex + /// + /// # Arguments + /// + /// * `v` - A reference to the vertex for which the property is being queried. + /// + /// # Returns + /// + /// The keys of the constant properties. + fn constant_vertex_prop_ids(&self, v: VID) -> Box + '_>; + + /// Gets a temporal property of a given vertex given the name and vertex reference. + /// + /// # Arguments + /// + /// * `v` - A reference to the vertex for which the property is being queried. + /// * `name` - The name of the property. + /// + /// # Returns + /// + /// Option> - The history of property values if it exists. + fn temporal_vertex_prop(&self, v: VID, id: usize) -> Option>; + + /// Returns a vector of all ids of temporal properties within the given vertex + /// + /// # Arguments + /// + /// * `v` - A reference to the vertex for which to retrieve the names. 
+ /// + /// # Returns + /// + /// the ids of the temporal properties + fn temporal_vertex_prop_ids(&self, v: VID) -> Box + '_>; + + /// Returns the constant edge property with the given id for the + /// given edge reference. + /// + /// # Arguments + /// + /// * `e` - An `EdgeRef` reference to the edge of interest. + /// * `id` - The id of the constant property. + /// + /// # Returns + /// + /// A property if it exists + fn get_const_edge_prop(&self, e: EdgeRef, id: usize, layer_ids: LayerIds) -> Option; + + /// Returns the ids of the constant properties of the given edge reference. + /// + /// # Arguments + /// + /// * `e` - An `EdgeRef` reference to the edge of interest. + /// + /// # Returns + /// + /// the ids of the constant properties of the given edge. + fn const_edge_prop_ids( + &self, + e: EdgeRef, + layer_ids: LayerIds, + ) -> Box + '_>; + + /// Returns the temporal edge property with the given id for the + /// given edge reference. + /// + /// # Arguments + /// + /// * `e` - An `EdgeRef` reference to the edge of interest. + /// * `id` - The id of the temporal property. + /// + /// # Returns + /// + /// A property if it exists + fn temporal_edge_prop( + &self, + e: EdgeRef, + id: usize, + layer_ids: LayerIds, + ) -> Option; + + /// Returns the ids of the temporal properties of the given edge reference. + /// + /// # Arguments + /// + /// * `e` - An `EdgeRef` reference to the edge of interest. + /// + /// # Returns + /// + /// * ids of the temporal properties of the given edge.
+ fn temporal_edge_prop_ids( + &self, + e: EdgeRef, + layer_ids: LayerIds, + ) -> Box + '_>; + + fn core_edges(&self) -> Box>>; + + fn core_edge(&self, eid: EID) -> ArcEntry; + fn core_vertices(&self) -> Box>>; + + fn core_vertex(&self, vid: VID) -> ArcEntry; +} + +pub trait InheritCoreOps: Base {} + +impl DelegateCoreOps for G +where + G::Base: CoreGraphOps, +{ + type Internal = G::Base; + + #[inline] + fn graph(&self) -> &Self::Internal { + self.base() + } +} + +pub trait DelegateCoreOps { + type Internal: CoreGraphOps + ?Sized; + + fn graph(&self) -> &Self::Internal; +} + +impl CoreGraphOps for G { + #[inline] + fn unfiltered_num_vertices(&self) -> usize { + self.graph().unfiltered_num_vertices() + } + + #[inline] + fn vertex_meta(&self) -> &Meta { + self.graph().vertex_meta() + } + + #[inline] + fn edge_meta(&self) -> &Meta { + self.graph().edge_meta() + } + + #[inline] + fn graph_meta(&self) -> &GraphProps { + self.graph().graph_meta() + } + + #[inline] + fn get_layer_name(&self, layer_id: usize) -> ArcStr { + self.graph().get_layer_name(layer_id) + } + + #[inline] + fn get_layer_id(&self, name: &str) -> Option { + self.graph().get_layer_id(name) + } + + #[inline] + fn get_layer_names_from_ids(&self, layer_ids: LayerIds) -> BoxedIter { + self.graph().get_layer_names_from_ids(layer_ids) + } + + #[inline] + fn vertex_id(&self, v: VID) -> u64 { + self.graph().vertex_id(v) + } + + #[inline] + fn vertex_name(&self, v: VID) -> String { + self.graph().vertex_name(v) + } + + #[inline] + fn edge_additions( + &self, + eref: EdgeRef, + layer_ids: LayerIds, + ) -> LockedLayeredIndex<'_, TimeIndexEntry> { + self.graph().edge_additions(eref, layer_ids) + } + + #[inline] + fn vertex_additions(&self, v: VID) -> LockedView> { + self.graph().vertex_additions(v) + } + + #[inline] + fn internalise_vertex(&self, v: VertexRef) -> Option { + self.graph().internalise_vertex(v) + } + + #[inline] + fn internalise_vertex_unchecked(&self, v: VertexRef) -> VID { + 
self.graph().internalise_vertex_unchecked(v) + } + + #[inline] + fn constant_prop(&self, id: usize) -> Option { + self.graph().constant_prop(id) + } + + #[inline] + fn temporal_prop(&self, id: usize) -> Option> { + self.graph().temporal_prop(id) + } + + #[inline] + fn constant_vertex_prop(&self, v: VID, id: usize) -> Option { + self.graph().constant_vertex_prop(v, id) + } + + #[inline] + fn constant_vertex_prop_ids(&self, v: VID) -> Box + '_> { + self.graph().constant_vertex_prop_ids(v) + } + + #[inline] + fn temporal_vertex_prop(&self, v: VID, id: usize) -> Option> { + self.graph().temporal_vertex_prop(v, id) + } + + #[inline] + fn temporal_vertex_prop_ids(&self, v: VID) -> Box + '_> { + self.graph().temporal_vertex_prop_ids(v) + } + + #[inline] + fn get_const_edge_prop(&self, e: EdgeRef, id: usize, layer_ids: LayerIds) -> Option { + self.graph().get_const_edge_prop(e, id, layer_ids) + } + + #[inline] + fn const_edge_prop_ids( + &self, + e: EdgeRef, + layer_ids: LayerIds, + ) -> Box + '_> { + self.graph().const_edge_prop_ids(e, layer_ids) + } + + #[inline] + fn temporal_edge_prop( + &self, + e: EdgeRef, + id: usize, + layer_ids: LayerIds, + ) -> Option { + self.graph().temporal_edge_prop(e, id, layer_ids) + } + + #[inline] + fn temporal_edge_prop_ids( + &self, + e: EdgeRef, + layer_ids: LayerIds, + ) -> Box + '_> { + self.graph().temporal_edge_prop_ids(e, layer_ids) + } + + #[inline] + fn core_edges(&self) -> Box>> { + self.graph().core_edges() + } + + #[inline] + fn core_edge(&self, eid: EID) -> ArcEntry { + self.graph().core_edge(eid) + } + + #[inline] + fn core_vertices(&self) -> Box>> { + self.graph().core_vertices() + } + + #[inline] + fn core_vertex(&self, vid: VID) -> ArcEntry { + self.graph().core_vertex(vid) + } +} diff --git a/raphtory/src/db/api/view/internal/edge_filter_ops.rs b/raphtory/src/db/api/view/internal/edge_filter_ops.rs new file mode 100644 index 0000000000..4b16688012 --- /dev/null +++ b/raphtory/src/db/api/view/internal/edge_filter_ops.rs 
@@ -0,0 +1,57 @@ +use crate::{ + core::entities::{edges::edge_store::EdgeStore, LayerIds}, + db::api::view::internal::Base, +}; +use enum_dispatch::enum_dispatch; +use std::sync::Arc; + +pub fn extend_filter( + old: Option, + filter: impl Fn(&EdgeStore, &LayerIds) -> bool + Send + Sync + 'static, +) -> EdgeFilter { + match old { + Some(f) => Arc::new(move |e, l| f(e, l) && filter(e, l)), + None => Arc::new(filter), + } +} + +pub type EdgeFilter = Arc bool + Send + Sync>; + +#[enum_dispatch] +pub trait EdgeFilterOps { + /// Return the optional edge filter for the graph + fn edge_filter(&self) -> Option<&EdgeFilter>; + + /// Called by the windowed graph to get the edge filter (override if it should include more/different edges than a non-windowed graph) + #[inline] + fn edge_filter_window(&self) -> Option<&EdgeFilter> { + self.edge_filter() + } +} + +pub trait InheritEdgeFilterOps: Base {} + +impl DelegateEdgeFilterOps for G +where + G::Base: EdgeFilterOps, +{ + type Internal = G::Base; + + #[inline] + fn graph(&self) -> &Self::Internal { + self.base() + } +} + +pub trait DelegateEdgeFilterOps { + type Internal: EdgeFilterOps + ?Sized; + + fn graph(&self) -> &Self::Internal; +} + +impl EdgeFilterOps for G { + #[inline] + fn edge_filter(&self) -> Option<&EdgeFilter> { + self.graph().edge_filter() + } +} diff --git a/raphtory/src/db/api/view/internal/graph_ops.rs b/raphtory/src/db/api/view/internal/graph_ops.rs new file mode 100644 index 0000000000..8ed0751626 --- /dev/null +++ b/raphtory/src/db/api/view/internal/graph_ops.rs @@ -0,0 +1,286 @@ +use crate::{ + core::{ + entities::{edges::edge_ref::EdgeRef, vertices::vertex_ref::VertexRef, LayerIds, EID, VID}, + Direction, + }, + db::api::view::internal::{Base, EdgeFilter}, +}; +use enum_dispatch::enum_dispatch; + +/// The GraphViewInternalOps trait provides a set of methods to query a directed graph +/// represented by the raphtory_core::tgraph::TGraph struct. 
+#[enum_dispatch] +pub trait GraphOps: Send + Sync { + /// Check if a vertex exists and returns internal reference. + fn internal_vertex_ref( + &self, + v: VertexRef, + layer_ids: &LayerIds, + filter: Option<&EdgeFilter>, + ) -> Option; + + fn find_edge_id( + &self, + e_id: EID, + layer_ids: &LayerIds, + filter: Option<&EdgeFilter>, + ) -> Option; + + /// Returns the total number of vertices in the graph. + fn vertices_len(&self, layer_ids: LayerIds, filter: Option<&EdgeFilter>) -> usize; + + /// Returns the total number of edges in the graph. + fn edges_len(&self, layers: LayerIds, filter: Option<&EdgeFilter>) -> usize; + + /// Returns true if the graph contains an edge between the source vertex + /// (src) and the destination vertex (dst). + /// # Arguments + /// + /// * `src` - The source vertex of the edge. + /// * `dst` - The destination vertex of the edge. + fn has_edge_ref( + &self, + src: VID, + dst: VID, + layers: &LayerIds, + filter: Option<&EdgeFilter>, + ) -> bool { + self.edge_ref(src, dst, layers, filter).is_some() + } + + /// Returns true if the graph contains the specified vertex (v). + /// # Arguments + /// + /// * `v` - VertexRef of the vertex to check. + fn has_vertex_ref(&self, v: VertexRef, layers: &LayerIds, filter: Option<&EdgeFilter>) -> bool { + self.internal_vertex_ref(v, layers, filter).is_some() + } + + /// Returns the number of edges that point towards or from the specified vertex + /// (v) based on the direction (d). + /// # Arguments + /// + /// * `v` - VID of the vertex to check. + /// * `d` - Direction of the edges to count. + fn degree(&self, v: VID, d: Direction, layers: &LayerIds, filter: Option<&EdgeFilter>) + -> usize; + + /// Returns the VID that corresponds to the specified vertex ID (v). + /// Returns None if the vertex ID is not present in the graph. + /// # Arguments + /// + /// * `v` - The vertex ID to lookup. 
+ fn vertex_ref(&self, v: u64, layers: &LayerIds, filter: Option<&EdgeFilter>) -> Option { + self.internal_vertex_ref(v.into(), layers, filter) + } + + /// Returns all the vertex references in the graph. + /// # Returns + /// * A boxed iterator over all the vertex + /// references in the graph. + fn vertex_refs( + &self, + layers: LayerIds, + filter: Option<&EdgeFilter>, + ) -> Box + Send>; + + /// Returns the edge reference that corresponds to the specified src and dst vertex + /// # Arguments + /// + /// * `src` - The source vertex. + /// * `dst` - The destination vertex. + /// + /// # Returns + /// + /// * `Option` - The edge reference if it exists. + fn edge_ref( + &self, + src: VID, + dst: VID, + layer: &LayerIds, + filter: Option<&EdgeFilter>, + ) -> Option; + + /// Returns all the edge references in the graph. + /// + /// # Returns + /// + /// * A boxed iterator over all the edge references. + fn edge_refs( + &self, + layers: LayerIds, + filter: Option<&EdgeFilter>, + ) -> Box + Send>; + + /// Returns an iterator over the edges connected to a given vertex in a given direction. + /// + /// # Arguments + /// + /// * `v` - A reference to the vertex for which the edges are being queried. + /// * `d` - The direction in which to search for edges. + /// * `layer` - The layer ids to consider + /// + /// # Returns + /// + /// A boxed iterator that yields references to + /// the edges connected to the vertex. + fn vertex_edges( + &self, + v: VID, + d: Direction, + layer: LayerIds, + filter: Option<&EdgeFilter>, + ) -> Box + Send>; + + /// Returns an iterator over the neighbors of a given vertex in a given direction. + /// + /// # Arguments + /// + /// * `v` - A reference to the vertex for which the neighbors are being queried. + /// * `d` - The direction in which to search for neighbors. + /// + /// # Returns + /// + /// A boxed iterator that yields references to the neighboring vertices.
+ fn neighbours( + &self, + v: VID, + d: Direction, + layers: LayerIds, + filter: Option<&EdgeFilter>, + ) -> Box + Send>; +} + +pub trait InheritGraphOps: Base {} + +impl DelegateGraphOps for G +where + G::Base: GraphOps, +{ + type Internal = G::Base; + + fn graph(&self) -> &Self::Internal { + self.base() + } +} + +pub trait DelegateGraphOps { + type Internal: GraphOps + ?Sized; + + fn graph(&self) -> &Self::Internal; +} + +impl GraphOps for G { + #[inline] + fn internal_vertex_ref( + &self, + v: VertexRef, + layer_ids: &LayerIds, + filter: Option<&EdgeFilter>, + ) -> Option { + self.graph().internal_vertex_ref(v, layer_ids, filter) + } + + #[inline] + fn find_edge_id( + &self, + e_id: EID, + layer_ids: &LayerIds, + filter: Option<&EdgeFilter>, + ) -> Option { + self.graph().find_edge_id(e_id, layer_ids, filter) + } + + #[inline] + fn vertices_len(&self, layer_ids: LayerIds, filter: Option<&EdgeFilter>) -> usize { + self.graph().vertices_len(layer_ids, filter) + } + + #[inline] + fn edges_len(&self, layers: LayerIds, filter: Option<&EdgeFilter>) -> usize { + self.graph().edges_len(layers, filter) + } + + #[inline] + fn has_edge_ref( + &self, + src: VID, + dst: VID, + layers: &LayerIds, + filter: Option<&EdgeFilter>, + ) -> bool { + self.graph().has_edge_ref(src, dst, layers, filter) + } + + #[inline] + fn has_vertex_ref(&self, v: VertexRef, layers: &LayerIds, filter: Option<&EdgeFilter>) -> bool { + self.graph().has_vertex_ref(v, layers, filter) + } + + #[inline] + fn degree( + &self, + v: VID, + d: Direction, + layers: &LayerIds, + filter: Option<&EdgeFilter>, + ) -> usize { + self.graph().degree(v, d, layers, filter) + } + + #[inline] + fn vertex_ref(&self, v: u64, layers: &LayerIds, filter: Option<&EdgeFilter>) -> Option { + self.graph().vertex_ref(v, layers, filter) + } + + #[inline] + fn vertex_refs( + &self, + layers: LayerIds, + filter: Option<&EdgeFilter>, + ) -> Box + Send> { + self.graph().vertex_refs(layers, filter) + } + + #[inline] + fn edge_ref( + 
&self, + src: VID, + dst: VID, + layer: &LayerIds, + filter: Option<&EdgeFilter>, + ) -> Option { + self.graph().edge_ref(src, dst, layer, filter) + } + + #[inline] + fn edge_refs( + &self, + layers: LayerIds, + filter: Option<&EdgeFilter>, + ) -> Box + Send> { + self.graph().edge_refs(layers, filter) + } + + #[inline] + fn vertex_edges( + &self, + v: VID, + d: Direction, + layer: LayerIds, + filter: Option<&EdgeFilter>, + ) -> Box + Send> { + self.graph().vertex_edges(v, d, layer, filter) + } + + #[inline] + fn neighbours( + &self, + v: VID, + d: Direction, + layers: LayerIds, + filter: Option<&EdgeFilter>, + ) -> Box + Send> { + self.graph().neighbours(v, d, layers, filter) + } +} diff --git a/raphtory/src/db/api/view/internal/inherit.rs b/raphtory/src/db/api/view/internal/inherit.rs new file mode 100644 index 0000000000..c758814122 --- /dev/null +++ b/raphtory/src/db/api/view/internal/inherit.rs @@ -0,0 +1,18 @@ +use std::ops::Deref; + +/// Get a base for inheriting methods +pub trait Base { + type Base: ?Sized; + + fn base(&self) -> &Self::Base; +} + +/// Deref implies Base +impl Base for T { + type Base = T::Target; + + #[inline(always)] + fn base(&self) -> &Self::Base { + self.deref() + } +} diff --git a/raphtory/src/db/api/view/internal/into_dynamic.rs b/raphtory/src/db/api/view/internal/into_dynamic.rs new file mode 100644 index 0000000000..75b6308ed5 --- /dev/null +++ b/raphtory/src/db/api/view/internal/into_dynamic.rs @@ -0,0 +1,36 @@ +use crate::db::{ + api::view::{internal::DynamicGraph, GraphViewOps}, + graph::views::{ + layer_graph::LayeredGraph, vertex_subgraph::VertexSubgraph, window_graph::WindowedGraph, + }, +}; +use enum_dispatch::enum_dispatch; + +#[enum_dispatch] +pub trait IntoDynamic { + fn into_dynamic(self) -> DynamicGraph; +} + +impl IntoDynamic for WindowedGraph { + fn into_dynamic(self) -> DynamicGraph { + DynamicGraph::new(self) + } +} + +impl IntoDynamic for LayeredGraph { + fn into_dynamic(self) -> DynamicGraph { + 
DynamicGraph::new(self) + } +} + +impl IntoDynamic for DynamicGraph { + fn into_dynamic(self) -> DynamicGraph { + self + } +} + +impl IntoDynamic for VertexSubgraph { + fn into_dynamic(self) -> DynamicGraph { + DynamicGraph::new(self) + } +} diff --git a/raphtory/src/db/api/view/internal/layer_ops.rs b/raphtory/src/db/api/view/internal/layer_ops.rs new file mode 100644 index 0000000000..fe38b8e85e --- /dev/null +++ b/raphtory/src/db/api/view/internal/layer_ops.rs @@ -0,0 +1,55 @@ +use crate::{ + core::entities::{edges::edge_store::EdgeStore, LayerIds}, + db::api::view::internal::Base, + prelude::Layer, +}; +use enum_dispatch::enum_dispatch; + +#[enum_dispatch] +pub trait InternalLayerOps { + /// get the layer ids for the graph view + fn layer_ids(&self) -> LayerIds; + + /// Get the layer id for the given layer name + fn layer_ids_from_names(&self, key: Layer) -> LayerIds; + + /// get the layer ids for the given edge id + fn edge_layer_ids(&self, e: &EdgeStore) -> LayerIds; +} + +pub trait InheritLayerOps: Base {} + +impl DelegateLayerOps for G +where + G::Base: InternalLayerOps, +{ + type Internal = G::Base; + + #[inline] + fn graph(&self) -> &Self::Internal { + self.base() + } +} + +pub trait DelegateLayerOps { + type Internal: InternalLayerOps + ?Sized; + + fn graph(&self) -> &Self::Internal; +} + +impl InternalLayerOps for G { + #[inline] + fn layer_ids(&self) -> LayerIds { + self.graph().layer_ids() + } + + #[inline] + fn layer_ids_from_names(&self, key: Layer) -> LayerIds { + self.graph().layer_ids_from_names(key) + } + + #[inline] + fn edge_layer_ids(&self, e: &EdgeStore) -> LayerIds { + self.graph().edge_layer_ids(e) + } +} diff --git a/raphtory/src/db/api/view/internal/materialize.rs b/raphtory/src/db/api/view/internal/materialize.rs new file mode 100644 index 0000000000..331a797541 --- /dev/null +++ b/raphtory/src/db/api/view/internal/materialize.rs @@ -0,0 +1,172 @@ +use crate::{ + core::{ + entities::{ + edges::{edge_ref::EdgeRef, edge_store::EdgeStore}, 
+ properties::{ + graph_props::GraphProps, + props::Meta, + tprop::{LockedLayeredTProp, TProp}, + }, + vertices::{vertex_ref::VertexRef, vertex_store::VertexStore}, + LayerIds, EID, VID, + }, + storage::{ + locked_view::LockedView, + timeindex::{LockedLayeredIndex, TimeIndex, TimeIndexEntry}, + ArcEntry, + }, + utils::errors::GraphError, + ArcStr, Direction, PropType, + }, + db::{ + api::{ + mutation::internal::{InternalAdditionOps, InternalPropertyAdditionOps}, + properties::internal::{ + ConstPropertiesOps, TemporalPropertiesOps, TemporalPropertyViewOps, + }, + view::{internal::*, BoxedIter}, + }, + graph::{ + graph::{Graph, InternalGraph}, + views::deletion_graph::GraphWithDeletions, + }, + }, + prelude::{Layer, Prop}, +}; +use enum_dispatch::enum_dispatch; +use serde::{Deserialize, Serialize}; +use std::path::Path; + +#[enum_dispatch(CoreGraphOps)] +#[enum_dispatch(GraphOps)] +#[enum_dispatch(EdgeFilterOps)] +#[enum_dispatch(InternalLayerOps)] +#[enum_dispatch(IntoDynamic)] +#[enum_dispatch(TimeSemantics)] +#[enum_dispatch(InternalMaterialize)] +#[enum_dispatch(TemporalPropertiesOps)] +#[enum_dispatch(TemporalPropertyViewOps)] +#[enum_dispatch(ConstPropertiesOps)] +#[enum_dispatch(InternalAdditionOps)] +#[enum_dispatch(InternalPropertyAdditionOps)] +#[derive(Serialize, Deserialize, Clone)] +pub enum MaterializedGraph { + EventGraph(Graph), + PersistentGraph(GraphWithDeletions), +} + +impl MaterializedGraph { + pub fn into_events(self) -> Option { + match self { + MaterializedGraph::EventGraph(g) => Some(g), + MaterializedGraph::PersistentGraph(_) => None, + } + } + pub fn into_persistent(self) -> Option { + match self { + MaterializedGraph::EventGraph(_) => None, + MaterializedGraph::PersistentGraph(g) => Some(g), + } + } + + pub fn load_from_file>(path: P) -> Result { + let f = std::fs::File::open(path)?; + let mut reader = std::io::BufReader::new(f); + Ok(bincode::deserialize_from(&mut reader)?) 
+ } + + pub fn save_to_file>(&self, path: P) -> Result<(), GraphError> { + let f = std::fs::File::create(path)?; + let mut writer = std::io::BufWriter::new(f); + Ok(bincode::serialize_into(&mut writer, self)?) + } + + pub fn bincode(&self) -> Result, GraphError> { + let encoded = bincode::serialize(self)?; + Ok(encoded) + } + + pub fn from_bincode(b: &[u8]) -> Result { + let g = bincode::deserialize(b)?; + Ok(g) + } +} + +#[enum_dispatch] +pub trait InternalMaterialize { + fn new_base_graph(&self, graph: InternalGraph) -> MaterializedGraph; + + fn include_deletions(&self) -> bool; +} + +pub trait InheritMaterialize: Base {} + +impl InternalMaterialize for G +where + G::Base: InternalMaterialize, +{ + fn new_base_graph(&self, graph: InternalGraph) -> MaterializedGraph { + self.base().new_base_graph(graph) + } + + fn include_deletions(&self) -> bool { + self.base().include_deletions() + } +} + +#[cfg(test)] +mod test_materialised_graph_dispatch { + use crate::{ + core::entities::LayerIds, + db::api::view::internal::{ + CoreGraphOps, EdgeFilterOps, GraphOps, InternalLayerOps, InternalMaterialize, + MaterializedGraph, TimeSemantics, + }, + prelude::*, + }; + + #[test] + fn materialised_graph_has_core_ops() { + let mg = MaterializedGraph::from(Graph::new()); + assert_eq!(mg.unfiltered_num_vertices(), 0); + } + + #[test] + fn materialised_graph_has_graph_ops() { + let mg = MaterializedGraph::from(Graph::new()); + assert_eq!(mg.vertices_len(mg.layer_ids(), mg.edge_filter()), 0); + } + #[test] + fn materialised_graph_has_edge_filter_ops() { + let mg = MaterializedGraph::from(Graph::new()); + assert!(mg.edge_filter().is_none()); + } + + #[test] + fn materialised_graph_has_layer_ops() { + let mg = MaterializedGraph::from(Graph::new()); + assert!(matches!(mg.layer_ids(), LayerIds::All)); + } + + #[test] + fn materialised_graph_has_time_semantics() { + let mg = MaterializedGraph::from(Graph::new()); + assert!(mg.view_start().is_none()); + } + + #[test] + fn 
materialised_graph_has_internal_materialise() { + let mg = MaterializedGraph::from(Graph::new()); + assert!(!mg.include_deletions()); + } + + #[test] + fn materialised_graph_can_be_used_directly() { + let g = Graph::new(); + + let mg = g.materialize().unwrap(); + + let v = mg.add_vertex(0, 1, NO_PROPS).unwrap(); + assert_eq!(v.id(), 1) + } +} diff --git a/raphtory/src/db/api/view/internal/mod.rs b/raphtory/src/db/api/view/internal/mod.rs new file mode 100644 index 0000000000..5f973d5614 --- /dev/null +++ b/raphtory/src/db/api/view/internal/mod.rs @@ -0,0 +1,153 @@ +mod core_deletion_ops; +mod core_ops; +mod edge_filter_ops; +mod graph_ops; +mod inherit; +mod into_dynamic; +mod layer_ops; +mod materialize; +pub(crate) mod time_semantics; +mod wrapped_graph; + +use crate::{ + db::api::properties::internal::{ConstPropertiesOps, InheritPropertiesOps, PropertiesOps}, + prelude::GraphViewOps, +}; +pub use core_deletion_ops::*; +pub use core_ops::*; +pub use edge_filter_ops::*; +pub use graph_ops::*; +pub use inherit::Base; +pub use into_dynamic::IntoDynamic; +pub use layer_ops::{DelegateLayerOps, InheritLayerOps, InternalLayerOps}; +pub use materialize::*; +use std::{ + fmt::{Debug, Formatter}, + sync::Arc, +}; +pub use time_semantics::*; + +/// Marker trait to indicate that an object is a valid graph view +pub trait BoxableGraphView: + CoreGraphOps + + GraphOps + + EdgeFilterOps + + InternalLayerOps + + TimeSemantics + + InternalMaterialize + + PropertiesOps + + ConstPropertiesOps + + Send + + Sync + + 'static +{ +} + +impl< + G: CoreGraphOps + + GraphOps + + EdgeFilterOps + + InternalLayerOps + + TimeSemantics + + InternalMaterialize + + PropertiesOps + + ConstPropertiesOps + + Send + + Sync + + 'static + + ?Sized, + > BoxableGraphView for G +{ +} + +pub trait InheritViewOps: Base {} + +impl InheritCoreDeletionOps for G {} +impl InheritGraphOps for G {} +impl InheritEdgeFilterOps for G {} +impl InheritLayerOps for G {} +impl InheritTimeSemantics for G {} +impl 
InheritCoreOps for G {} +impl InheritMaterialize for G {} +impl InheritPropertiesOps for G {} + +/// Trait for marking a struct as not dynamically dispatched. +/// Used to avoid conflicts when implementing `From` for dynamic wrappers. +pub trait Static {} + +impl From for DynamicGraph { + fn from(value: G) -> Self { + DynamicGraph(Arc::new(value)) + } +} + +impl From> for DynamicGraph { + fn from(value: Arc) -> Self { + DynamicGraph(value) + } +} + +/// Trait for marking a graph view as immutable to avoid conflicts when implementing conversions for mutable and immutable views +pub trait Immutable {} + +#[derive(Clone)] +pub struct DynamicGraph(pub(crate) Arc); + +impl Debug for DynamicGraph { + fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result { + write!( + f, + "DynamicGraph(num_vertices={}, num_edges={})", + self.count_vertices(), + self.count_edges() + ) + } +} + +impl DynamicGraph { + pub fn new(graph: G) -> Self { + Self(Arc::new(graph)) + } + + pub fn new_from_arc(graph_arc: Arc) -> Self { + Self(graph_arc) + } +} + +impl Base for DynamicGraph { + type Base = dyn BoxableGraphView; + + #[inline(always)] + fn base(&self) -> &Self::Base { + &self.0 + } +} + +impl Immutable for DynamicGraph {} + +impl InheritViewOps for DynamicGraph {} + +#[cfg(test)] +mod test { + use crate::{ + db::{ + api::{ + mutation::AdditionOps, + view::{internal::BoxableGraphView, *}, + }, + graph::graph::Graph, + }, + prelude::NO_PROPS, + }; + use itertools::Itertools; + use std::sync::Arc; + + #[test] + fn test_boxing() { + // this tests that a boxed graph actually compiles + let g = Graph::new(); + g.add_vertex(0, 1, NO_PROPS).unwrap(); + let boxed: Arc = Arc::new(g); + assert_eq!(boxed.vertices().id().collect_vec(), vec![1]) + } +} diff --git a/raphtory/src/db/api/view/internal/time_semantics.rs b/raphtory/src/db/api/view/internal/time_semantics.rs new file mode 100644 index 0000000000..501ad648f6 --- /dev/null +++ b/raphtory/src/db/api/view/internal/time_semantics.rs @@ -0,0 
+1,567 @@ +use crate::{ + core::{ + entities::{ + edges::{edge_ref::EdgeRef, edge_store::EdgeStore}, + LayerIds, VID, + }, + storage::timeindex::TimeIndexOps, + Prop, + }, + db::api::view::{ + internal::{materialize::MaterializedGraph, Base, CoreGraphOps, EdgeFilter, GraphOps}, + BoxedIter, + }, +}; +use enum_dispatch::enum_dispatch; +use std::ops::Range; + +/// Methods for defining time windowing semantics for a graph +#[enum_dispatch] +pub trait TimeSemantics: GraphOps + CoreGraphOps { + /// Return the earliest time for a vertex + fn vertex_earliest_time(&self, v: VID) -> Option { + self.vertex_additions(v).first_t() + } + + /// Return the latest time for a vertex + fn vertex_latest_time(&self, v: VID) -> Option { + self.vertex_additions(v).last_t() + } + + /// Returns the default start time for perspectives over the view + #[inline] + fn view_start(&self) -> Option { + self.earliest_time_global() + } + + /// Returns the default end time for perspectives over the view + #[inline] + fn view_end(&self) -> Option { + self.latest_time_global().map(|v| v.saturating_add(1)) + } + + /// Returns the timestamp for the earliest activity + fn earliest_time_global(&self) -> Option; + /// Returns the timestamp for the latest activity + fn latest_time_global(&self) -> Option; + /// Returns the timestamp for the earliest activity in the window + fn earliest_time_window(&self, t_start: i64, t_end: i64) -> Option; + + /// Returns the timestamp for the latest activity in the window + fn latest_time_window(&self, t_start: i64, t_end: i64) -> Option; + + /// Return the earliest time for a vertex in a window + fn vertex_earliest_time_window(&self, v: VID, t_start: i64, t_end: i64) -> Option { + self.vertex_additions(v).range(t_start..t_end).first_t() + } + + /// Return the latest time for a vertex in a window + fn vertex_latest_time_window(&self, v: VID, t_start: i64, t_end: i64) -> Option { + self.vertex_additions(v).range(t_start..t_end).last_t() + } + /// check if vertex `v` 
should be included in window `w` + fn include_vertex_window( + &self, + v: VID, + w: Range, + layer_ids: &LayerIds, + edge_filter: Option<&EdgeFilter>, + ) -> bool; + + /// check if edge `e` should be included in window `w` + fn include_edge_window(&self, e: &EdgeStore, w: Range, layer_ids: &LayerIds) -> bool; + + /// Get the timestamps at which a vertex `v` is active (i.e has an edge addition) + fn vertex_history(&self, v: VID) -> Vec { + self.vertex_additions(v).iter_t().copied().collect() + } + + /// Get the timestamps at which a vertex `v` is active in window `w` (i.e has an edge addition) + fn vertex_history_window(&self, v: VID, w: Range) -> Vec { + self.vertex_additions(v) + .range(w) + .iter_t() + .copied() + .collect() + } + + /// Exploded edge iterator for edge `e` + fn edge_exploded(&self, e: EdgeRef, layer_ids: LayerIds) -> BoxedIter; + + /// Explode edge iterator for edge `e` for every layer + fn edge_layers(&self, e: EdgeRef, layer_ids: LayerIds) -> BoxedIter; + + /// Exploded edge iterator for edge`e` over window `w` + fn edge_window_exploded( + &self, + e: EdgeRef, + w: Range, + layer_ids: LayerIds, + ) -> BoxedIter; + + /// Exploded edge iterator for edge `e` over window `w` for every layer + fn edge_window_layers( + &self, + e: EdgeRef, + w: Range, + layer_ids: LayerIds, + ) -> BoxedIter; + + /// Get the time of the earliest activity of an edge + fn edge_earliest_time(&self, e: EdgeRef, layer_ids: LayerIds) -> Option; + + /// Get the time of the earliest activity of an edge `e` in window `w` + fn edge_earliest_time_window( + &self, + e: EdgeRef, + w: Range, + layer_ids: LayerIds, + ) -> Option; + + /// Get the time of the latest activity of an edge + fn edge_latest_time(&self, e: EdgeRef, layer_ids: LayerIds) -> Option; + + /// Get the time of the latest activity of an edge `e` in window `w` + fn edge_latest_time_window( + &self, + e: EdgeRef, + w: Range, + layer_ids: LayerIds, + ) -> Option; + + /// Get the edge deletions for use with materialize 
+ fn edge_deletion_history(&self, e: EdgeRef, layer_ids: LayerIds) -> Vec; + + /// Get the edge deletions for use with materialize restricted to window `w` + fn edge_deletion_history_window( + &self, + e: EdgeRef, + w: Range, + layer_ids: LayerIds, + ) -> Vec; + + /// Check if graph has temporal property with the given id + /// + /// # Arguments + /// + /// * `prop_id` - The id of the property to check. + fn has_temporal_prop(&self, prop_id: usize) -> bool; + + /// Returns a vector of all temporal values of the graph property with the given id + /// + /// # Arguments + /// + /// * `prop_id` - The id of the property to retrieve. + /// + /// # Returns + /// + /// A vector of tuples representing the temporal values of the property, + /// where the first element of each tuple is the timestamp + /// and the second element is the property value. + fn temporal_prop_vec(&self, prop_id: usize) -> Vec<(i64, Prop)>; + + /// Check if graph has temporal property with the given id in the window + /// + /// # Arguments + /// + /// * `prop_id` - The id of the property to check. + /// * `w` - time window + fn has_temporal_prop_window(&self, prop_id: usize, w: Range) -> bool; + + /// Returns a vector of all temporal values of the graph property with the given id + /// that fall within the specified time window. + /// + /// # Arguments + /// + /// * `prop_id` - The id of the property to retrieve. + /// * `t_start` - The start time of the window to consider. + /// * `t_end` - The end time of the window to consider. + /// + /// # Returns + /// + /// A vector of tuples representing the temporal values of the property + /// that fall within the specified time window, where the first element of each tuple is the timestamp + /// and the second element is the property value.
+ fn temporal_prop_vec_window( + &self, + prop_id: usize, + t_start: i64, + t_end: i64, + ) -> Vec<(i64, Prop)>; + + /// Check if vertex has temporal property with the given id + /// + /// # Arguments + /// + /// * `v` - The id of the vertex + /// * `prop_id` - The id of the property to check. + fn has_temporal_vertex_prop(&self, v: VID, prop_id: usize) -> bool; + + /// Returns a vector of all temporal values of the vertex property with the given id for the + /// given vertex + /// + /// # Arguments + /// + /// * `v` - A reference to the vertex for which to retrieve the temporal property vector. + /// * `id` - The id of the property to retrieve. + /// + /// # Returns + /// + /// A vector of tuples representing the temporal values of the property for the given vertex, + /// where the first element of each tuple is the timestamp + /// and the second element is the property value. + fn temporal_vertex_prop_vec(&self, v: VID, id: usize) -> Vec<(i64, Prop)>; + + /// Check if vertex has temporal property with the given id in the window + /// + /// # Arguments + /// + /// * `v` - the id of the vertex + /// * `prop_id` - The id of the property to check. + /// * `w` - time window + fn has_temporal_vertex_prop_window(&self, v: VID, prop_id: usize, w: Range) -> bool; + + /// Returns a vector of all temporal values of the vertex property with the given id for the given vertex + /// that fall within the specified time window. + /// + /// # Arguments + /// + /// * `v` - A reference to the vertex for which to retrieve the temporal property vector. + /// * `id` - The id of the property to retrieve. + /// * `t_start` - The start time of the window to consider. + /// * `t_end` - The end time of the window to consider.
+ /// + /// # Returns + /// + /// A vector of tuples representing the temporal values of the property for the given vertex + /// that fall within the specified time window, where the first element of each tuple is the timestamp + /// and the second element is the property value. + fn temporal_vertex_prop_vec_window( + &self, + v: VID, + id: usize, + t_start: i64, + t_end: i64, + ) -> Vec<(i64, Prop)>; + + /// Check if edge has temporal property with the given id in the window + /// + /// # Arguments + /// + /// * `e` - the id of the edge + /// * `prop_id` - The id of the property to retrieve. + /// * `w` - time window + fn has_temporal_edge_prop_window( + &self, + e: EdgeRef, + prop_id: usize, + w: Range, + layer_ids: LayerIds, + ) -> bool; + + /// Returns a vector of tuples containing the values of the temporal property with the given name + /// for the given edge reference within the specified time window. + /// + /// # Arguments + /// + /// * `e` - An `EdgeRef` reference to the edge of interest. + /// * `name` - A `String` containing the name of the temporal property. + /// * `t_start` - An `i64` containing the start time of the time window (inclusive). + /// * `t_end` - An `i64` containing the end time of the time window (exclusive). + /// + /// # Returns + /// + /// * A `Vec` of tuples containing the values of the temporal property with the given name for the given edge + /// within the specified time window. + /// + fn temporal_edge_prop_vec_window( + &self, + e: EdgeRef, + id: usize, + t_start: i64, + t_end: i64, + layer_ids: LayerIds, + ) -> Vec<(i64, Prop)>; + + /// Check if edge has temporal property with the given id + /// + /// # Arguments + /// + /// * `e` - The id of the edge + /// * `prop_id` - The id of the property to retrieve. 
+ fn has_temporal_edge_prop(&self, e: EdgeRef, prop_id: usize, layer_ids: LayerIds) -> bool; + + /// Returns a vector of tuples containing the values of the temporal property with the given name + /// for the given edge reference. + /// + /// # Arguments + /// + /// * `e` - An `EdgeRef` reference to the edge of interest. + /// * `name` - A `String` containing the name of the temporal property. + /// + /// # Returns + /// + /// * A `Vec` of tuples containing the values of the temporal property with the given name for the given edge. + fn temporal_edge_prop_vec( + &self, + e: EdgeRef, + id: usize, + layer_ids: LayerIds, + ) -> Vec<(i64, Prop)>; +} + +pub trait InheritTimeSemantics: Base + GraphOps + CoreGraphOps {} + +impl DelegateTimeSemantics for G +where + ::Base: TimeSemantics, +{ + type Internal = ::Base; + + fn graph(&self) -> &Self::Internal { + self.base() + } +} + +pub trait DelegateTimeSemantics: GraphOps + CoreGraphOps { + type Internal: TimeSemantics + ?Sized; + + fn graph(&self) -> &Self::Internal; +} + +impl TimeSemantics for G { + #[inline] + fn vertex_earliest_time(&self, v: VID) -> Option { + self.graph().vertex_earliest_time(v) + } + + #[inline] + fn vertex_latest_time(&self, v: VID) -> Option { + self.graph().vertex_latest_time(v) + } + + #[inline] + fn view_start(&self) -> Option { + self.graph().view_start() + } + #[inline] + fn view_end(&self) -> Option { + self.graph().view_end() + } + #[inline] + fn earliest_time_global(&self) -> Option { + self.graph().earliest_time_global() + } + #[inline] + fn latest_time_global(&self) -> Option { + self.graph().latest_time_global() + } + #[inline] + fn earliest_time_window(&self, t_start: i64, t_end: i64) -> Option { + self.graph().earliest_time_window(t_start, t_end) + } + #[inline] + fn latest_time_window(&self, t_start: i64, t_end: i64) -> Option { + self.graph().latest_time_window(t_start, t_end) + } + #[inline] + fn vertex_earliest_time_window(&self, v: VID, t_start: i64, t_end: i64) -> Option { + 
self.graph().vertex_earliest_time_window(v, t_start, t_end) + } + #[inline] + fn vertex_latest_time_window(&self, v: VID, t_start: i64, t_end: i64) -> Option { + self.graph().vertex_latest_time_window(v, t_start, t_end) + } + #[inline] + fn include_vertex_window( + &self, + v: VID, + w: Range, + layer_ids: &LayerIds, + edge_filter: Option<&EdgeFilter>, + ) -> bool { + self.graph() + .include_vertex_window(v, w, layer_ids, edge_filter) + } + + #[inline] + fn include_edge_window(&self, e: &EdgeStore, w: Range, layer_ids: &LayerIds) -> bool { + self.graph().include_edge_window(e, w, layer_ids) + } + + #[inline] + fn vertex_history(&self, v: VID) -> Vec { + self.graph().vertex_history(v) + } + + #[inline] + fn vertex_history_window(&self, v: VID, w: Range) -> Vec { + self.graph().vertex_history_window(v, w) + } + + #[inline] + fn edge_exploded(&self, e: EdgeRef, layer_ids: LayerIds) -> BoxedIter { + self.graph().edge_exploded(e, layer_ids) + } + + #[inline] + fn edge_layers(&self, e: EdgeRef, layer_ids: LayerIds) -> BoxedIter { + self.graph().edge_layers(e, layer_ids) + } + + #[inline] + fn edge_window_exploded( + &self, + e: EdgeRef, + w: Range, + layer_ids: LayerIds, + ) -> BoxedIter { + self.graph().edge_window_exploded(e, w, layer_ids) + } + + #[inline] + fn edge_window_layers( + &self, + e: EdgeRef, + w: Range, + layer_ids: LayerIds, + ) -> BoxedIter { + self.graph().edge_window_layers(e, w, layer_ids) + } + + #[inline] + fn edge_earliest_time(&self, e: EdgeRef, layer_ids: LayerIds) -> Option { + self.graph().edge_earliest_time(e, layer_ids) + } + + #[inline] + fn edge_earliest_time_window( + &self, + e: EdgeRef, + w: Range, + layer_ids: LayerIds, + ) -> Option { + self.graph().edge_earliest_time_window(e, w, layer_ids) + } + + #[inline] + fn edge_latest_time(&self, e: EdgeRef, layer_ids: LayerIds) -> Option { + self.graph().edge_latest_time(e, layer_ids) + } + + #[inline] + fn edge_latest_time_window( + &self, + e: EdgeRef, + w: Range, + layer_ids: LayerIds, + ) 
-> Option { + self.graph().edge_latest_time_window(e, w, layer_ids) + } + + #[inline] + fn edge_deletion_history(&self, e: EdgeRef, layer_ids: LayerIds) -> Vec { + self.graph().edge_deletion_history(e, layer_ids) + } + + #[inline] + fn edge_deletion_history_window( + &self, + e: EdgeRef, + w: Range, + layer_ids: LayerIds, + ) -> Vec { + self.graph().edge_deletion_history_window(e, w, layer_ids) + } + + #[inline] + fn has_temporal_prop(&self, prop_id: usize) -> bool { + self.graph().has_temporal_prop(prop_id) + } + + #[inline] + fn temporal_prop_vec(&self, prop_id: usize) -> Vec<(i64, Prop)> { + self.graph().temporal_prop_vec(prop_id) + } + + #[inline] + fn has_temporal_prop_window(&self, prop_id: usize, w: Range) -> bool { + self.graph().has_temporal_prop_window(prop_id, w) + } + + #[inline] + fn temporal_prop_vec_window( + &self, + prop_id: usize, + t_start: i64, + t_end: i64, + ) -> Vec<(i64, Prop)> { + self.graph() + .temporal_prop_vec_window(prop_id, t_start, t_end) + } + + #[inline] + fn has_temporal_vertex_prop(&self, v: VID, prop_id: usize) -> bool { + self.graph().has_temporal_vertex_prop(v, prop_id) + } + + #[inline] + fn temporal_vertex_prop_vec(&self, v: VID, prop_id: usize) -> Vec<(i64, Prop)> { + self.graph().temporal_vertex_prop_vec(v, prop_id) + } + + #[inline] + fn has_temporal_vertex_prop_window(&self, v: VID, prop_id: usize, w: Range) -> bool { + self.graph().has_temporal_vertex_prop_window(v, prop_id, w) + } + + #[inline] + fn temporal_vertex_prop_vec_window( + &self, + v: VID, + prop_id: usize, + t_start: i64, + t_end: i64, + ) -> Vec<(i64, Prop)> { + self.graph() + .temporal_vertex_prop_vec_window(v, prop_id, t_start, t_end) + } + + fn has_temporal_edge_prop_window( + &self, + e: EdgeRef, + prop_id: usize, + w: Range, + layer_ids: LayerIds, + ) -> bool { + self.graph() + .has_temporal_edge_prop_window(e, prop_id, w, layer_ids) + } + + #[inline] + fn temporal_edge_prop_vec_window( + &self, + e: EdgeRef, + prop_id: usize, + t_start: i64, + t_end: 
i64, + layer_ids: LayerIds, + ) -> Vec<(i64, Prop)> { + self.graph() + .temporal_edge_prop_vec_window(e, prop_id, t_start, t_end, layer_ids) + } + + fn has_temporal_edge_prop(&self, e: EdgeRef, prop_id: usize, layer_ids: LayerIds) -> bool { + self.graph().has_temporal_edge_prop(e, prop_id, layer_ids) + } + + #[inline] + fn temporal_edge_prop_vec( + &self, + e: EdgeRef, + prop_id: usize, + layer_ids: LayerIds, + ) -> Vec<(i64, Prop)> { + self.graph().temporal_edge_prop_vec(e, prop_id, layer_ids) + } +} diff --git a/raphtory/src/db/api/view/internal/wrapped_graph.rs b/raphtory/src/db/api/view/internal/wrapped_graph.rs new file mode 100644 index 0000000000..1b49794d60 --- /dev/null +++ b/raphtory/src/db/api/view/internal/wrapped_graph.rs @@ -0,0 +1,4 @@ +use crate::db::api::view::internal::{BoxableGraphView, InheritViewOps}; +use std::sync::Arc; + +impl InheritViewOps for Arc {} diff --git a/raphtory/src/db/api/view/layer.rs b/raphtory/src/db/api/view/layer.rs new file mode 100644 index 0000000000..ed622ef30b --- /dev/null +++ b/raphtory/src/db/api/view/layer.rs @@ -0,0 +1,83 @@ +use crate::core::ArcStr; +use std::sync::Arc; + +/// Trait defining layer operations +pub trait LayerOps { + type LayeredViewType; + + /// Return a graph containing only the default edge layer + fn default_layer(&self) -> Self::LayeredViewType; + + /// Return a graph containing the layer `name` + fn layer>(&self, name: L) -> Option; +} + +#[derive(Debug)] +pub enum Layer { + All, + Default, + One(ArcStr), + Multiple(Arc<[String]>), +} + +impl<'a, T: ToOwned + ?Sized> From> for Layer { + fn from(name: Option<&'a T>) -> Self { + match name { + Some(name) => Layer::One(name.to_owned().into()), + None => Layer::All, + } + } +} + +impl From> for Layer { + fn from(value: Option) -> Self { + match value { + Some(name) => Layer::One(name.into()), + None => Layer::All, + } + } +} + +impl From for Layer { + fn from(value: ArcStr) -> Self { + Layer::One(value) + } +} + +impl From for Layer { + fn 
from(value: String) -> Self { + Layer::One(value.into()) + } +} + +impl<'a, T: ToOwned + ?Sized> From<&'a T> for Layer { + fn from(name: &'a T) -> Self { + Layer::One(name.to_owned().into()) + } +} + +impl<'a, T: ToOwned + ?Sized> From> for Layer { + fn from(names: Vec<&'a T>) -> Self { + match names.len() { + 0 => Layer::All, + 1 => Layer::One(names[0].to_owned().into()), + _ => Layer::Multiple( + names + .into_iter() + .map(|s| s.to_owned()) + .collect::>() + .into(), + ), + } + } +} + +impl From> for Layer { + fn from(names: Vec) -> Self { + match names.len() { + 0 => Layer::All, + 1 => Layer::One(names.into_iter().next().expect("exists").into()), + _ => Layer::Multiple(names.into()), + } + } +} diff --git a/raphtory/src/db/api/view/mod.rs b/raphtory/src/db/api/view/mod.rs new file mode 100644 index 0000000000..6be1d0f853 --- /dev/null +++ b/raphtory/src/db/api/view/mod.rs @@ -0,0 +1,16 @@ +//! Defines the `ViewApi` trait, which represents the API for querying a view of the graph. + +mod edge; +mod graph; +pub mod internal; +mod layer; +mod time; +mod vertex; + +pub use edge::*; +pub use graph::*; +pub use layer::*; +pub use time::*; +pub use vertex::*; + +pub type BoxedIter = Box + Send>; diff --git a/raphtory/src/db/view_api/time.rs b/raphtory/src/db/api/view/time.rs similarity index 80% rename from raphtory/src/db/view_api/time.rs rename to raphtory/src/db/api/view/time.rs index 6f79cf5b73..b5569dbed0 100644 --- a/raphtory/src/db/view_api/time.rs +++ b/raphtory/src/db/api/view/time.rs @@ -1,5 +1,4 @@ -use crate::core::time::error::ParseTimeError; -use crate::core::time::{Interval, IntoTime}; +use crate::core::utils::time::{error::ParseTimeError, Interval, IntoTime}; /// Trait defining time query operations pub trait TimeOps { @@ -24,11 +23,17 @@ pub trait TimeOps { /// Create a view including all events until `end` (inclusive) fn at(&self, end: T) -> Self::WindowedViewType { - self.window(i64::MIN, end.into_time().saturating_add(1)) + let end = 
end.into_time(); + let start = self.start().unwrap_or(end); + if start > end { + self.window(end, end.saturating_add(1)) + } else { + self.window(start, end.saturating_add(1)) + } } - /// Creates a `WindowSet` with the given `step` size and optional `start` and `end` times, - /// using an expanding window. + /// Creates a `WindowSet` with the given `step` size + /// using an expanding window. The last window may fall partially outside the range of the data/view. /// /// An expanding window is a window that grows by `step` size at each iteration. fn expanding(&self, step: I) -> Result, ParseTimeError> @@ -47,8 +52,8 @@ pub trait TimeOps { } } - /// Creates a `WindowSet` with the given `window` size and optional `step`, `start` and `end` times, - /// using a rolling window. + /// Creates a `WindowSet` with the given `window` size and optional `step` + /// using a rolling window. The last window may fall partially outside the range of the data/view. /// /// A rolling window is a window that moves forward by `step` size at each iteration. 
fn rolling(&self, window: I, step: Option) -> Result, ParseTimeError> @@ -90,7 +95,7 @@ impl WindowSet { // } else { // timeline_start + step - 1 // }; - let cursor_start = start + step - 1; + let cursor_start = start + step; Self { view, cursor: cursor_start, @@ -145,9 +150,12 @@ impl Iterator for TimeIndex { impl Iterator for WindowSet { type Item = T::WindowedViewType; fn next(&mut self) -> Option { - if self.cursor < self.end { - let window_end = self.cursor + 1; - let window_start = self.window.map(|w| window_end - w).unwrap_or(i64::MIN); + if self.cursor < self.end + self.step { + let window_end = self.cursor; + let window_start = self + .window + .map(|w| window_end - w) + .unwrap_or(self.view.start().unwrap_or(window_end)); let window = self.view.window(window_start, window_end); self.cursor = self.cursor + self.step; Some(window) @@ -159,18 +167,24 @@ impl Iterator for WindowSet { #[cfg(test)] mod time_tests { - use crate::core::time::TryIntoTime; - use crate::db::graph::Graph; - use crate::db::view_api::internal::GraphViewInternalOps; - use crate::db::view_api::time::WindowSet; - use crate::db::view_api::{GraphViewOps, TimeOps}; + use crate::{ + core::utils::time::TryIntoTime, + db::{ + api::{ + mutation::AdditionOps, + view::{time::WindowSet, GraphViewOps, TimeOps}, + }, + graph::graph::Graph, + }, + prelude::NO_PROPS, + }; use itertools::Itertools; // start inclusive, end exclusive fn graph_with_timeline(start: i64, end: i64) -> Graph { - let g = Graph::new(4); - g.add_vertex(start, 0, &vec![]).unwrap(); - g.add_vertex(end - 1, 0, &vec![]).unwrap(); + let g = Graph::new(); + g.add_vertex(start, 0, NO_PROPS).unwrap(); + g.add_vertex(end - 1, 0, NO_PROPS).unwrap(); assert_eq!(g.start().unwrap(), start); assert_eq!(g.end().unwrap(), end); g @@ -178,7 +192,7 @@ mod time_tests { fn assert_bounds(windows: WindowSet, expected: Vec<(i64, i64)>) where - G: GraphViewOps + GraphViewInternalOps, + G: GraphViewOps, { let window_bounds = windows .map(|w| 
(w.start().unwrap(), w.end().unwrap())) @@ -195,7 +209,7 @@ mod time_tests { let g = graph_with_timeline(1, 6); let windows = g.rolling(3, Some(2)).unwrap(); - let expected = vec![(0, 3), (2, 5)]; + let expected = vec![(0, 3), (2, 5), (4, 7)]; assert_bounds(windows, expected.clone()); let g = graph_with_timeline(0, 9).window(1, 6); @@ -205,15 +219,14 @@ mod time_tests { #[test] fn expanding() { - let min = i64::MIN; let g = graph_with_timeline(1, 7); let windows = g.expanding(2).unwrap(); - let expected = vec![(min, 3), (min, 5), (min, 7)]; + let expected = vec![(1, 3), (1, 5), (1, 7)]; assert_bounds(windows, expected); let g = graph_with_timeline(1, 6); let windows = g.expanding(2).unwrap(); - let expected = vec![(min, 3), (min, 5)]; + let expected = vec![(1, 3), (1, 5), (1, 7)]; assert_bounds(windows, expected.clone()); let g = graph_with_timeline(0, 9).window(1, 6); @@ -227,10 +240,16 @@ mod time_tests { let end = "2020-06-07 23:59:59.999".try_into_time().unwrap(); let g = graph_with_timeline(start, end); let windows = g.rolling("1 day", None).unwrap(); - let expected = vec![( - "2020-06-06 00:00:00".try_into_time().unwrap(), // entire 2020-06-06 - "2020-06-07 00:00:00".try_into_time().unwrap(), - )]; + let expected = vec![ + ( + "2020-06-06 00:00:00".try_into_time().unwrap(), // entire 2020-06-06 + "2020-06-07 00:00:00".try_into_time().unwrap(), + ), + ( + "2020-06-07 00:00:00".try_into_time().unwrap(), // entire 2020-06-06 + "2020-06-08 00:00:00".try_into_time().unwrap(), + ), + ]; assert_bounds(windows, expected); let start = "2020-06-06 00:00:00".try_into_time().unwrap(); @@ -269,13 +288,14 @@ mod time_tests { #[test] fn expanding_dates() { - let min = i64::MIN; - let start = "2020-06-06 00:00:00".try_into_time().unwrap(); let end = "2020-06-07 23:59:59.999".try_into_time().unwrap(); let g = graph_with_timeline(start, end); let windows = g.expanding("1 day").unwrap(); - let expected = vec![(min, "2020-06-07 00:00:00".try_into_time().unwrap())]; + let 
expected = vec![ + (start, "2020-06-07 00:00:00".try_into_time().unwrap()), + (start, "2020-06-08 00:00:00".try_into_time().unwrap()), + ]; assert_bounds(windows, expected); let start = "2020-06-06 00:00:00".try_into_time().unwrap(); @@ -283,8 +303,8 @@ mod time_tests { let g = graph_with_timeline(start, end); let windows = g.expanding("1 day").unwrap(); let expected = vec![ - (min, "2020-06-07 00:00:00".try_into_time().unwrap()), - (min, "2020-06-08 00:00:00".try_into_time().unwrap()), + (start, "2020-06-07 00:00:00".try_into_time().unwrap()), + (start, "2020-06-08 00:00:00".try_into_time().unwrap()), ]; assert_bounds(windows, expected); } diff --git a/raphtory/src/db/view_api/vertex.rs b/raphtory/src/db/api/view/vertex.rs similarity index 60% rename from raphtory/src/db/view_api/vertex.rs rename to raphtory/src/db/api/view/vertex.rs index a9bc641eab..98a0eb4fc1 100644 --- a/raphtory/src/db/view_api/vertex.rs +++ b/raphtory/src/db/api/view/vertex.rs @@ -1,7 +1,10 @@ -use crate::core::Prop; -use crate::db::view_api::edge::EdgeListOps; -use crate::db::view_api::{GraphViewOps, TimeOps}; -use std::collections::HashMap; +use crate::db::{ + api::{ + properties::Properties, + view::{edge::EdgeListOps, GraphViewOps, TimeOps}, + }, + graph::vertex::VertexView, +}; /// Operations defined for a vertex pub trait VertexViewOps: TimeOps { @@ -28,88 +31,15 @@ pub trait VertexViewOps: TimeOps { /// Get the timestamp for the latest activity of the vertex fn latest_time(&self) -> Self::ValueType>; - /// Gets the property value of this vertex given the name of the property. - fn property(&self, name: String, include_static: bool) -> Self::ValueType>; - /// Gets the history of the vertex (time that the vertex was added and times when changes were made to the vertex) fn history(&self) -> Self::ValueType>; - /// Get the temporal property value of this vertex. - /// - /// # Arguments - /// - /// * `name` - The name of the property to retrieve. 
- /// - /// # Returns - /// - /// A vector of `(i64, Prop)` tuples where the `i64` value is the timestamp of the - /// property value and `Prop` is the value itself. - fn property_history(&self, name: String) -> Self::ValueType>; - - /// Get all property values of this vertex. - /// - /// # Arguments - /// - /// * `include_static` - If `true` then static properties are included in the result. - /// - /// # Returns - /// - /// A HashMap with the names of the properties as keys and the property values as values. - fn properties(&self, include_static: bool) -> Self::ValueType>; - - /// Get all temporal property values of this vertex. - /// - /// # Returns - /// - /// A HashMap with the names of the properties as keys and a vector of `(i64, Prop)` tuples - /// as values. The `i64` value is the timestamp of the property value and `Prop` - /// is the value itself. - fn property_histories(&self) -> Self::ValueType>>; - - /// Get the names of all properties of this vertex. - /// - /// # Arguments - /// - /// * `include_static` - If `true` then static properties are included in the result. - /// - /// # Returns - /// - /// A vector of the names of the properties of this vertex. - fn property_names(&self, include_static: bool) -> Self::ValueType>; - - /// Checks if a property exists on this vertex. - /// - /// # Arguments - /// - /// * `name` - The name of the property to check for. - /// * `include_static` - If `true` then static properties are included in the result. - /// - /// # Returns - /// - /// `true` if the property exists, otherwise `false`. - fn has_property(&self, name: String, include_static: bool) -> Self::ValueType; - - /// Checks if a static property exists on this vertex. - /// - /// # Arguments - /// - /// * `name` - The name of the property to check for. - /// - /// # Returns - /// - /// `true` if the property exists, otherwise `false`. - fn has_static_property(&self, name: String) -> Self::ValueType; - - /// Get the static property value of this vertex. 
- /// - /// # Arguments - /// - /// * `name` - The name of the property to retrieve. + /// Get a view of the temporal properties of this vertex. /// /// # Returns /// - /// The value of the property if it exists, otherwise `None`. - fn static_property(&self, name: String) -> Self::ValueType>; + /// A view with the names of the properties as keys and the property values as values. + fn properties(&self) -> Self::ValueType>>; /// Get the degree of this vertex (i.e., the number of edges that are incident to it). /// @@ -201,9 +131,7 @@ pub trait VertexListOps: ) -> Self::IterType<::WindowedViewType>; /// Create views for the vertices including all events until `end` (inclusive) - fn at(self, end: i64) -> Self::IterType<::WindowedViewType> { - self.window(i64::MIN, end.saturating_add(1)) - } + fn at(self, end: i64) -> Self::IterType<::WindowedViewType>; /// Returns the ids of vertices in the list. /// @@ -212,31 +140,10 @@ pub trait VertexListOps: fn id(self) -> Self::IterType; fn name(self) -> Self::IterType; - fn property(self, name: String, include_static: bool) -> Self::IterType>; + /// Returns an iterator over properties of the vertices + fn properties(self) -> Self::IterType>>; - /// Returns an iterator of the values of the given property name - /// including the times when it changed - /// - /// # Arguments - /// * `name` - The name of the property. - /// - /// # Returns - /// An iterator of the values of the given property name including the times when it changed - /// as a vector of tuples of the form (time, property). - fn property_history(self, name: String) -> Self::IterType>; - fn properties(self, include_static: bool) -> Self::IterType>; fn history(self) -> Self::IterType>; - /// Returns an iterator over all vertex properties. - /// - /// # Returns - /// An iterator over all vertex properties. 
- fn property_histories(self) -> Self::IterType>>; - fn property_names(self, include_static: bool) -> Self::IterType>; - fn has_property(self, name: String, include_static: bool) -> Self::IterType; - - fn has_static_property(self, name: String) -> Self::IterType; - - fn static_property(self, name: String) -> Self::IterType>; /// Returns an iterator over the degree of the vertices. /// diff --git a/raphtory/src/db/edge.rs b/raphtory/src/db/edge.rs deleted file mode 100644 index 3ae42e782b..0000000000 --- a/raphtory/src/db/edge.rs +++ /dev/null @@ -1,264 +0,0 @@ -//! Defines the `Edge` struct, which represents an edge in the graph. -//! -//! Edges are used to define directed connections between verticies in the graph. -//! Edges are identified by a unique ID, can have a direction (Ingoing, Outgoing, or Both) -//! and can have properties associated with them. -//! - -use crate::core::edge_ref::EdgeRef; -use crate::core::time::IntoTime; -use crate::core::vertex_ref::VertexRef; -use crate::core::Prop; -use crate::db::graph_window::WindowedGraph; -use crate::db::vertex::VertexView; -use crate::db::view_api::edge::{EdgeViewInternalOps, EdgeViewOps}; -use crate::db::view_api::*; -use std::collections::HashMap; -use std::fmt::{Debug, Formatter}; -use std::iter; - -/// A view of an edge in the graph. -#[derive(Clone)] -pub struct EdgeView { - /// A view of an edge in the graph. - pub graph: G, - /// A reference to the edge. 
- pub edge: EdgeRef, -} - -impl EdgeView { - pub fn new(graph: G, edge: EdgeRef) -> Self { - Self { graph, edge } - } -} - -impl EdgeViewInternalOps> for EdgeView { - fn graph(&self) -> G { - self.graph.clone() - } - - fn eref(&self) -> EdgeRef { - self.edge - } - - fn new_vertex(&self, v: VertexRef) -> VertexView { - VertexView::new(self.graph(), v) - } - - fn new_edge(&self, e: EdgeRef) -> Self { - Self { - graph: self.graph(), - edge: e, - } - } -} - -impl EdgeViewOps for EdgeView { - type Graph = G; - type Vertex = VertexView; - type EList = BoxedIter; - - fn explode(&self) -> Self::EList { - let ev = self.clone(); - match self.edge.time() { - Some(_) => Box::new(iter::once(ev)), - None => { - let e = self.edge; - let ts = self.graph.edge_timestamps(self.edge, None); - Box::new(ts.into_iter().map(move |t| ev.new_edge(e.at(t)))) - } - } - } -} - -impl Debug for EdgeView { - fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result { - write!( - f, - "EdgeView({}, {})", - self.graph.vertex(self.edge.src()).unwrap().id(), - self.graph.vertex(self.edge.dst()).unwrap().id() - ) - } -} - -impl From> for EdgeRef { - fn from(value: EdgeView) -> Self { - value.edge - } -} - -impl TimeOps for EdgeView { - type WindowedViewType = EdgeView>; - - fn start(&self) -> Option { - self.graph.start() - } - - fn end(&self) -> Option { - self.graph.end() - } - - fn window(&self, t_start: T, t_end: T) -> Self::WindowedViewType { - EdgeView { - graph: self.graph.window(t_start, t_end), - edge: self.edge, - } - } -} - -/// Implement `EdgeListOps` trait for an iterator of `EdgeView` objects. -/// -/// This implementation enables the use of the `src` and `dst` methods to retrieve the vertices -/// connected to the edges inside the iterator. -impl EdgeListOps for BoxedIter> { - type Graph = G; - type Vertex = VertexView; - type Edge = EdgeView; - type ValueType = T; - - /// Specifies the associated type for an iterator over vertices. 
- type VList = Box> + Send>; - - /// Specifies the associated type for the iterator over edges. - type IterType = Box + Send>; - - fn has_property(self, name: String, include_static: bool) -> BoxedIter { - Box::new(self.map(move |e| e.has_property(name.clone(), include_static))) - } - - fn property(self, name: String, include_static: bool) -> BoxedIter> { - Box::new(self.map(move |e| e.property(name.clone(), include_static))) - } - - fn properties(self, include_static: bool) -> BoxedIter> { - Box::new(self.map(move |e| e.properties(include_static))) - } - - fn property_names(self, include_static: bool) -> BoxedIter> { - Box::new(self.map(move |e| e.property_names(include_static))) - } - - fn has_static_property(self, name: String) -> BoxedIter { - Box::new(self.map(move |e| e.has_static_property(name.clone()))) - } - - fn static_property(self, name: String) -> BoxedIter> { - Box::new(self.map(move |e| e.static_property(name.clone()))) - } - - fn property_history(self, name: String) -> BoxedIter> { - Box::new(self.map(move |e| e.property_history(name.clone()))) - } - - fn property_histories(self) -> BoxedIter>> { - Box::new(self.map(|e| e.property_histories())) - } - - /// Returns an iterator over the source vertices of the edges in the iterator. - fn src(self) -> Self::VList { - Box::new(self.map(|e| e.src())) - } - - /// Returns an iterator over the destination vertices of the edges in the iterator. 
- fn dst(self) -> Self::VList { - Box::new(self.map(|e| e.dst())) - } - - fn id(self) -> Self::IterType<(u64, u64)> { - Box::new(self.map(|e| e.id())) - } - - /// returns an iterator of exploded edges that include an edge at each point in time - fn explode(self) -> Self { - Box::new(self.flat_map(move |e| e.explode())) - } - - /// Gets the earliest times of a list of edges - fn earliest_time(self) -> Self::IterType> { - Box::new(self.map(|e| e.earliest_time())) - } - - /// Gets the latest times of a list of edges - fn latest_time(self) -> Self::IterType> { - Box::new(self.map(|e| e.latest_time())) - } -} - -impl EdgeListOps for BoxedIter>> { - type Graph = G; - type Vertex = VertexView; - type Edge = EdgeView; - type ValueType = Box + Send>; - type VList = Box> + Send>> + Send>; - type IterType = Box + Send>> + Send>; - - fn has_property(self, name: String, include_static: bool) -> BoxedIter> { - Box::new(self.map(move |it| { - let name = name.clone(); - let iter: Self::ValueType = - Box::new(it.map(move |e| e.has_property(name.clone(), include_static))); - iter - })) - } - - fn property( - self, - name: String, - include_static: bool, - ) -> BoxedIter>> { - Box::new(self.map(move |it| it.property(name.clone(), include_static))) - } - - fn properties(self, include_static: bool) -> BoxedIter>> { - Box::new(self.map(move |it| it.properties(include_static))) - } - - fn property_names(self, include_static: bool) -> BoxedIter>> { - Box::new(self.map(move |it| it.property_names(include_static))) - } - - fn has_static_property(self, name: String) -> BoxedIter> { - Box::new(self.map(move |it| it.has_static_property(name.clone()))) - } - - fn static_property(self, name: String) -> BoxedIter>> { - Box::new(self.map(move |it| it.static_property(name.clone()))) - } - - fn property_history(self, name: String) -> BoxedIter>> { - Box::new(self.map(move |it| it.property_history(name.clone()))) - } - - fn property_histories(self) -> BoxedIter>>> { - Box::new(self.map(|it| 
it.property_histories())) - } - - fn src(self) -> Self::VList { - Box::new(self.map(|it| it.src())) - } - - fn dst(self) -> Self::VList { - Box::new(self.map(|it| it.dst())) - } - - fn id(self) -> Self::IterType<(u64, u64)> { - Box::new(self.map(|it| it.id())) - } - - fn explode(self) -> Self { - Box::new(self.map(move |it| it.explode())) - } - - /// Gets the earliest times of a list of edges - fn earliest_time(self) -> Self::IterType> { - Box::new(self.map(|e| e.earliest_time())) - } - - /// Gets the latest times of a list of edges - fn latest_time(self) -> Self::IterType> { - Box::new(self.map(|e| e.latest_time())) - } -} - -pub type EdgeList = Box> + Send>; diff --git a/raphtory/src/db/graph.rs b/raphtory/src/db/graph.rs deleted file mode 100644 index 40a92e995d..0000000000 --- a/raphtory/src/db/graph.rs +++ /dev/null @@ -1,2178 +0,0 @@ -//! Defines the `Graph` struct, which represents a raphtory graph in memory. -//! -//! This is the base class used to create a temporal graph, add vertices and edges, -//! create windows, and query the graph with a variety of algorithms. -//! It is a wrapper around a set of shards, which are the actual graph data structures. -//! -//! # Examples -//! -//! ```rust -//! use raphtory::db::graph::InternalGraph; -//! use raphtory::db::view_api::*; -//! let graph = InternalGraph::new(2); -//! graph.add_vertex(0, "Alice", &vec![]); -//! graph.add_vertex(1, "Bob", &vec![]); -//! graph.add_edge(2, "Alice", "Bob", &vec![], None); -//! graph.num_edges(); -//! ``` -//! 
- -use crate::core::tgraph::TemporalGraph; -use crate::core::tgraph_shard::TGraphShard; -use crate::core::time::{IntoTimeWithFormat, TryIntoTime}; -use crate::core::{ - edge_ref::EdgeRef, tgraph_shard::errors::GraphError, utils, vertex::InputVertex, - vertex_ref::VertexRef, Direction, Prop, -}; - -use crate::core::vertex_ref::LocalVertexRef; -use crate::db::graph_immutable::ImmutableGraph; -use crate::db::view_api::internal::{GraphViewInternalOps, WrappedGraph}; -use crate::db::view_api::*; -use itertools::Itertools; -use rayon::prelude::*; -use rustc_hash::FxHashMap; -use serde::{Deserialize, Serialize}; -use std::cmp::{max, min}; -use std::fmt::{Display, Formatter}; -use std::ops::{Deref, DerefMut}; -use std::{ - collections::HashMap, - iter, - ops::Range, - path::{Path, PathBuf}, - sync::Arc, -}; - -/// A temporal graph composed of multiple shards. -/// -/// This is the public facing struct used to create a temporal graph, add vertices and edges, -/// create windows, and query the graph with a variety of algorithms. -/// It is a wrapper around a set of shards, which are the actual graph data structures. -#[derive(Debug, Clone, Serialize, Deserialize)] -pub struct InternalGraph { - /// The number of shards in the graph. - pub(crate) nr_shards: usize, - /// A vector of `TGraphShard` representing the shards in the graph. 
- pub(crate) shards: Vec>, - /// Translates layer names to layer ids - pub(crate) layer_ids: Arc>>, -} - -#[repr(transparent)] -#[derive(Debug, Clone, Serialize, Deserialize, Default, PartialEq)] -pub struct Graph(Arc); - -impl Display for Graph { - fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result { - write!(f, "{}", self.0) - } -} - -impl Deref for Graph { - type Target = Arc; - - fn deref(&self) -> &Self::Target { - &self.0 - } -} - -impl DerefMut for Graph { - fn deref_mut(&mut self) -> &mut Self::Target { - &mut self.0 - } -} - -impl WrappedGraph for Graph { - type Internal = InternalGraph; - - fn as_graph(&self) -> &InternalGraph { - &self.0 - } -} - -impl Graph { - /// Create a new graph with the specified number of shards - /// - /// # Arguments - /// - /// * `nr_shards` - The number of shards - /// - /// # Returns - /// - /// A raphtory graph - /// - /// # Example - /// - /// ``` - /// use raphtory::db::graph::Graph; - /// let g = Graph::new(4); - /// ``` - pub fn new(nr_shards: usize) -> Self { - Self(Arc::new(InternalGraph::new(nr_shards))) - } - - pub(crate) fn new_from_frozen( - nr_shards: usize, - shards: Vec>, - layer_ids: Arc>>, - ) -> Self { - Self(Arc::new(InternalGraph { - nr_shards, - shards, - layer_ids, - })) - } - - /// Load a graph from a directory - /// - /// # Arguments - /// - /// * `path` - The path to the directory - /// - /// # Returns - /// - /// A raphtory graph - /// - /// # Example - /// - /// ``` - /// use raphtory::db::graph::InternalGraph; - /// // let g = Graph::load_from_file("path/to/graph"); - /// ``` - pub fn load_from_file>(path: P) -> Result> { - Ok(Self(Arc::new(InternalGraph::load_from_file(path)?))) - } - - /// Freezes the current mutable graph into an immutable graph. - /// - /// This removes the internal locks, allowing the graph to be queried in - /// a read-only fashion. - /// - /// # Returns - /// - /// An `ImmutableGraph` which is an immutable copy of the current graph. 
- /// - /// # Example - /// ``` - /// use raphtory::db::view_api::*; - /// use raphtory::db::graph::Graph; - /// - /// let mut mutable_graph = Graph::new(1); - /// // ... add vertices and edges to the graph - /// - /// // Freeze the mutable graph into an immutable graph - /// let immutable_graph = mutable_graph.freeze(); - /// ``` - pub fn freeze(self) -> ImmutableGraph { - ImmutableGraph { - nr_shards: self.nr_shards, - shards: self.shards.iter().map(|s| s.freeze()).collect_vec(), - layer_ids: Arc::new(self.layer_ids.read().clone()), - } - } - - pub fn as_arc(&self) -> Arc { - self.0.clone() - } -} - -impl Default for InternalGraph { - fn default() -> Self { - InternalGraph::new(1) - } -} - -impl Display for InternalGraph { - fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result { - write!( - f, - "Graph(num_vertices={}, num_edges={})", - self.num_vertices(), - self.num_edges() - ) - } -} - -impl PartialEq for InternalGraph { - fn eq(&self, other: &G) -> bool { - if self.num_vertices() == other.num_vertices() && self.num_edges() == other.num_edges() { - self.vertices().id().all(|v| other.has_vertex(v)) && // all vertices exist in other - self.edges().explode().count() == other.edges().explode().count() && // same number of exploded edges - self.edges().explode().all(|e| { // all exploded edges exist in other - other - .edge(e.src().id(), e.dst().id(), None) - .filter(|ee| ee.active(e.time().expect("exploded"))) - .is_some() - }) - } else { - false - } - } -} - -impl GraphViewInternalOps for InternalGraph { - fn local_vertex(&self, v: VertexRef) -> Option { - self.get_shard_from_v(v).local_vertex(v) - } - - fn local_vertex_window( - &self, - v: VertexRef, - t_start: i64, - t_end: i64, - ) -> Option { - self.get_shard_from_v(v) - .local_vertex_window(v, t_start..t_end) - } - - /// Return all the layer ids, included the id of the default layer, 0 - fn get_unique_layers_internal(&self) -> Vec { - 
Box::new(iter::once(0).chain(self.layer_ids.read().values().copied())).collect_vec() - } - - fn get_layer_name_by_id(&self, layer_id: usize) -> String { - let layer_ids = self.layer_ids.read(); - layer_ids - .iter() - .find_map(|(name, &id)| (layer_id == id).then_some(name)) - .expect(&format!("layer id '{layer_id}' doesn't exist")) - .to_string() - } - - fn get_layer(&self, key: Option<&str>) -> Option { - match key { - None => Some(0), - Some(key) => self.layer_ids.read().get(key).copied(), - } - } - - fn view_start(&self) -> Option { - self.earliest_time_global() - } - - fn view_end(&self) -> Option { - self.latest_time_global().map(|t| t + 1) // so it is exclusive - } - - fn earliest_time_global(&self) -> Option { - let min_from_shards = self.shards.iter().map(|shard| shard.earliest_time()).min(); - min_from_shards.filter(|&min| min != i64::MAX) - } - - fn earliest_time_window(&self, t_start: i64, t_end: i64) -> Option { - //FIXME: this is not correct, should actually be the earliest activity in window - let earliest = self.earliest_time_global()?; - if earliest > t_end { - None - } else { - Some(max(earliest, t_start)) - } - } - - fn latest_time_global(&self) -> Option { - let max_from_shards = self.shards.iter().map(|shard| shard.latest_time()).max(); - max_from_shards.filter(|&max| max != i64::MIN) - } - - fn latest_time_window(&self, t_start: i64, t_end: i64) -> Option { - //FIXME: this is not correct, should actually be the latest activity in window - let latest = self.latest_time_global()?; - if latest < t_start { - None - } else { - Some(min(latest, t_end)) - } - } - - fn vertices_len(&self) -> usize { - self.shards.iter().map(|shard| shard.len()).sum() - } - - fn vertices_len_window(&self, t_start: i64, t_end: i64) -> usize { - //FIXME: This nees to be optimised ideally - self.shards - .iter() - .map(|shard| shard.vertices_window(t_start..t_end).count()) - .sum() - } - - fn edges_len(&self, layer: Option) -> usize { - let vs: Vec = self - .shards - 
.iter() - .map(|shard| shard.out_edges_len(layer)) - .collect(); - vs.iter().sum() - } - - fn edges_len_window(&self, t_start: i64, t_end: i64, layer: Option) -> usize { - self.shards - .iter() - .map(|shard| shard.out_edges_len_window(&(t_start..t_end), layer)) - .sum() - } - - fn has_edge_ref(&self, src: VertexRef, dst: VertexRef, layer: usize) -> bool { - let (shard, src, dst) = self.localise_edge(src, dst); - self.shards[shard].has_edge(src, dst, layer) - } - - fn has_edge_ref_window( - &self, - src: VertexRef, - dst: VertexRef, - t_start: i64, - t_end: i64, - layer: usize, - ) -> bool { - let (shard, src, dst) = self.localise_edge(src, dst); - self.shards[shard].has_edge_window(src, dst, t_start..t_end, layer) - } - - fn has_vertex_ref(&self, v: VertexRef) -> bool { - self.get_shard_from_v(v).has_vertex(v) - } - - fn has_vertex_ref_window(&self, v: VertexRef, t_start: i64, t_end: i64) -> bool { - self.get_shard_from_v(v) - .has_vertex_window(v, t_start..t_end) - } - - fn degree(&self, v: LocalVertexRef, d: Direction, layer: Option) -> usize { - self.get_shard_from_local_v(v).degree(v, d, layer) - } - - fn degree_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - d: Direction, - layer: Option, - ) -> usize { - self.get_shard_from_local_v(v) - .degree_window(v, t_start..t_end, d, layer) - } - - fn vertex_ref(&self, v: u64) -> Option { - self.get_shard_from_id(v).vertex(v) - } - - fn vertex_id(&self, v: LocalVertexRef) -> u64 { - self.shards[v.shard_id].vertex_id(v) - } - - fn vertex_ref_window(&self, v: u64, t_start: i64, t_end: i64) -> Option { - self.get_shard_from_id(v).vertex_window(v, t_start..t_end) - } - - fn vertex_earliest_time(&self, v: LocalVertexRef) -> Option { - self.get_shard_from_local_v(v).vertex_earliest_time(v) - } - - fn vertex_earliest_time_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - ) -> Option { - self.get_shard_from_local_v(v) - .vertex_earliest_time_window(v, t_start..t_end) - } - - fn 
vertex_latest_time(&self, v: LocalVertexRef) -> Option { - self.get_shard_from_local_v(v).vertex_latest_time(v) - } - - fn vertex_latest_time_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - ) -> Option { - self.get_shard_from_local_v(v) - .vertex_latest_time_window(v, t_start..t_end) - } - - fn vertex_refs(&self) -> Box + Send> { - let shards = self.shards.clone(); - Box::new(shards.into_iter().flat_map(|s| s.vertices())) - } - - fn vertex_refs_window( - &self, - t_start: i64, - t_end: i64, - ) -> Box + Send> { - let shards = self.shards.clone(); - Box::new( - shards - .into_iter() - .flat_map(move |s| s.vertices_window(t_start..t_end)), - ) - } - - fn vertex_refs_shard(&self, shard: usize) -> Box + Send> { - let shard = self.shards[shard].clone(); - Box::new(shard.vertices()) - } - - fn vertex_refs_window_shard( - &self, - shard: usize, - t_start: i64, - t_end: i64, - ) -> Box + Send> { - let shard = self.shards[shard].clone(); - Box::new(shard.vertices_window(t_start..t_end)) - } - - fn edge_ref(&self, src: VertexRef, dst: VertexRef, layer: usize) -> Option { - let (shard_id, src, dst) = self.localise_edge(src, dst); - self.shards[shard_id].edge(src, dst, layer) - } - - fn edge_ref_window( - &self, - src: VertexRef, - dst: VertexRef, - t_start: i64, - t_end: i64, - layer: usize, - ) -> Option { - let (shard_id, src, dst) = self.localise_edge(src, dst); - self.shards[shard_id].edge_window(src, dst, t_start..t_end, layer) - } - - fn edge_refs(&self, layer: Option) -> Box + Send> { - //FIXME: needs low-level primitive - let g = self.clone(); - match layer { - Some(layer) => Box::new( - self.vertex_refs() - .flat_map(move |v| g.vertex_edges(v, Direction::OUT, Some(layer))), - ), - None => Box::new( - self.vertex_refs() - .flat_map(move |v| g.vertex_edges(v, Direction::OUT, None)), - ), - } - } - - fn edge_refs_window( - &self, - t_start: i64, - t_end: i64, - layer: Option, - ) -> Box + Send> { - //FIXME: needs low-level primitive - let g = 
self.clone(); - Box::new( - self.vertex_refs() - .flat_map(move |v| g.vertex_edges_window(v, t_start, t_end, Direction::OUT, layer)), - ) - } - - fn vertex_edges( - &self, - v: LocalVertexRef, - d: Direction, - layer: Option, - ) -> Box + Send> { - Box::new(self.get_shard_from_local_v(v).vertex_edges(v, d, layer)) - } - - fn vertex_edges_t( - &self, - v: LocalVertexRef, - d: Direction, - layer: Option, - ) -> Box + Send> { - // FIXME: missing low-level implementation - Box::new(self.get_shard_from_local_v(v).vertex_edges_window_t( - v, - i64::MIN..i64::MAX, - d, - layer, - )) - } - - fn vertex_edges_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - d: Direction, - layer: Option, - ) -> Box + Send> { - Box::new( - self.get_shard_from_local_v(v) - .vertex_edges_window(v, t_start..t_end, d, layer), - ) - } - - fn vertex_edges_window_t( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - d: Direction, - layer: Option, - ) -> Box + Send> { - Box::new( - self.get_shard_from_local_v(v) - .vertex_edges_window_t(v, t_start..t_end, d, layer), - ) - } - - fn neighbours( - &self, - v: LocalVertexRef, - d: Direction, - layer: Option, - ) -> Box + Send> { - Box::new(self.get_shard_from_local_v(v).neighbours(v, d, layer)) - } - - fn neighbours_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - d: Direction, - layer: Option, - ) -> Box + Send> { - Box::new( - self.get_shard_from_local_v(v) - .neighbours_window(v, t_start..t_end, d, layer), - ) - } - - fn static_vertex_prop(&self, v: LocalVertexRef, name: String) -> Option { - self.get_shard_from_local_v(v).static_vertex_prop(v, name) - } - - fn static_vertex_prop_names(&self, v: LocalVertexRef) -> Vec { - self.get_shard_from_local_v(v).static_vertex_prop_names(v) - } - - fn temporal_vertex_prop_names(&self, v: LocalVertexRef) -> Vec { - self.get_shard_from_local_v(v).temporal_vertex_prop_names(v) - } - - fn temporal_vertex_prop_vec(&self, v: LocalVertexRef, name: String) -> 
Vec<(i64, Prop)> { - self.get_shard_from_local_v(v) - .temporal_vertex_prop_vec(v, name) - } - - fn vertex_timestamps(&self, v: LocalVertexRef) -> Vec { - self.get_shard_from_local_v(v).vertex_timestamps(v) - } - - fn vertex_timestamps_window(&self, v: LocalVertexRef, t_start: i64, t_end: i64) -> Vec { - self.get_shard_from_local_v(v) - .vertex_timestamps_window(v, t_start..t_end) - } - - fn temporal_vertex_prop_vec_window( - &self, - v: LocalVertexRef, - name: String, - t_start: i64, - t_end: i64, - ) -> Vec<(i64, Prop)> { - self.get_shard_from_local_v(v) - .temporal_vertex_prop_vec_window(v, name, t_start..t_end) - } - - fn temporal_vertex_props(&self, v: LocalVertexRef) -> HashMap> { - self.get_shard_from_local_v(v).temporal_vertex_props(v) - } - - fn temporal_vertex_props_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - ) -> HashMap> { - self.get_shard_from_local_v(v) - .temporal_vertex_props_window(v, t_start..t_end) - } - - fn static_edge_prop(&self, e: EdgeRef, name: String) -> Option { - self.get_shard_from_e(e).static_edge_prop(e, name) - } - - fn static_edge_prop_names(&self, e: EdgeRef) -> Vec { - self.get_shard_from_e(e).static_edge_prop_names(e) - } - - fn temporal_edge_prop_names(&self, e: EdgeRef) -> Vec { - self.get_shard_from_e(e).temporal_edge_prop_names(e) - } - - fn temporal_edge_props_vec(&self, e: EdgeRef, name: String) -> Vec<(i64, Prop)> { - self.get_shard_from_e(e).temporal_edge_prop_vec(e, name) - } - - fn temporal_edge_props_vec_window( - &self, - e: EdgeRef, - name: String, - t_start: i64, - t_end: i64, - ) -> Vec<(i64, Prop)> { - self.get_shard_from_e(e) - .temporal_edge_props_vec_window(e, name, t_start..t_end) - } - - fn edge_timestamps(&self, e: EdgeRef, window: Option>) -> Vec { - self.get_shard_from_e(e).edge_timestamps(e, window) - } - - fn temporal_edge_props(&self, e: EdgeRef) -> HashMap> { - self.get_shard_from_e(e).temporal_edge_props(e) - } - - fn temporal_edge_props_window( - &self, - e: EdgeRef, - 
t_start: i64, - t_end: i64, - ) -> HashMap> { - self.get_shard_from_e(e) - .temporal_edge_props_window(e, t_start..t_end) - } - - fn num_shards(&self) -> usize { - self.nr_shards - } -} - -/// The implementation of a temporal graph composed of multiple shards. -impl InternalGraph { - /// Freezes the current mutable graph into an immutable graph. - /// - /// This removes the internal locks, allowing the graph to be queried in - /// a read-only fashion. - /// - /// # Returns - /// - /// An `ImmutableGraph` which is an immutable copy of the current graph. - /// - /// # Example - /// ``` - /// use raphtory::db::view_api::*; - /// use raphtory::db::graph::Graph; - /// - /// let mut mutable_graph = Graph::new(1); - /// // ... add vertices and edges to the graph - /// - /// // Freeze the mutable graph into an immutable graph - /// let immutable_graph = mutable_graph.freeze(); - /// ``` - pub fn freeze(self) -> ImmutableGraph { - ImmutableGraph { - nr_shards: self.nr_shards, - shards: self.shards.iter().map(|s| s.freeze()).collect_vec(), - layer_ids: Arc::new(self.layer_ids.read().clone()), - } - } - - fn localise_edge(&self, src: VertexRef, dst: VertexRef) -> (usize, VertexRef, VertexRef) { - match src { - VertexRef::Local(local_src) => match dst { - VertexRef::Local(local_dst) => { - if local_src.shard_id == local_dst.shard_id { - (local_src.shard_id, src, dst) - } else { - ( - local_src.shard_id, - src, - VertexRef::Remote(self.vertex_id(local_dst)), - ) - } - } - VertexRef::Remote(_) => (local_src.shard_id, src, dst), - }, - VertexRef::Remote(gid) => match dst { - VertexRef::Local(local_dst) => (local_dst.shard_id, src, dst), - VertexRef::Remote(_) => (self.shard_id(gid), src, dst), - }, - } - } - - /// Get the shard id from a global vertex id - /// - /// # Arguments - /// - /// * `g_id` - The global vertex id - /// - /// # Returns - /// - /// The shard id - fn shard_id(&self, g_id: u64) -> usize { - utils::get_shard_id_from_global_vid(g_id, self.nr_shards) - } - - /// 
Get the shard from a global vertex id - /// - /// # Arguments - /// - /// * `g_id` - The global vertex id - /// - /// # Returns - /// - /// The shard reference - fn get_shard_from_id(&self, g_id: u64) -> &TGraphShard { - &self.shards[self.shard_id(g_id)] - } - - /// Get the shard from a vertex reference - /// - /// # Arguments - /// - /// * `g_id` - The global vertex id - /// - /// # Returns - /// - /// The shard reference - fn get_shard_from_v(&self, v: VertexRef) -> &TGraphShard { - match v { - VertexRef::Local(v) => self.get_shard_from_local_v(v), - VertexRef::Remote(g_id) => self.get_shard_from_id(g_id), - } - } - - #[inline(always)] - fn get_shard_from_local_v(&self, v: LocalVertexRef) -> &TGraphShard { - &self.shards[v.shard_id] - } - - /// Get the shard from an edge reference - /// - /// # Arguments - /// - /// * `e` - The edge reference - /// - /// # Returns - /// - /// The shard reference - fn get_shard_from_e(&self, e: EdgeRef) -> &TGraphShard { - &self.shards[e.shard()] - } - - /// Create a new graph with the specified number of shards - /// - /// # Arguments - /// - /// * `nr_shards` - The number of shards - /// - /// # Returns - /// - /// A raphtory graph - /// - /// # Example - /// - /// ``` - /// use raphtory::db::graph::Graph; - /// let g = Graph::new(4); - /// ``` - pub fn new(nr_shards: usize) -> Self { - InternalGraph { - nr_shards, - shards: (0..nr_shards).map(|i| TGraphShard::new(i)).collect(), - layer_ids: Default::default(), - } - } - - /// Load a graph from a directory - /// - /// # Arguments - /// - /// * `path` - The path to the directory - /// - /// # Returns - /// - /// A raphtory graph - /// - /// # Example - /// - /// ``` - /// use raphtory::db::graph::InternalGraph; - /// // let g = Graph::load_from_file("path/to/graph"); - /// ``` - pub fn load_from_file>(path: P) -> Result> { - // use BufReader for better performance - - //TODO turn to logging? 
- println!("loading from {:?}", path.as_ref()); - let mut p = PathBuf::from(path.as_ref()); - p.push("graphdb_nr_shards"); - - let f = std::fs::File::open(p).unwrap(); - let mut reader = std::io::BufReader::new(f); - let (nr_shards, layer_ids) = bincode::deserialize_from(&mut reader)?; - - let mut shard_paths = vec![]; - for i in 0..nr_shards { - let mut p = PathBuf::from(path.as_ref()); - p.push(format!("shard_{}", i)); - shard_paths.push((i, p)); - } - let mut shards = shard_paths - .par_iter() - .map(|(i, path)| { - let shard = TGraphShard::load_from_file(path)?; - Ok((*i, shard)) - }) - .collect::, Box>>()?; - - shards.sort_by_cached_key(|(i, _)| *i); - - let shards = shards.into_iter().map(|(_, shard)| shard).collect(); - Ok(InternalGraph { - nr_shards, - shards, - layer_ids, - }) //TODO I need to put in the actual values here - } - - /// Save a graph to a directory - /// - /// # Arguments - /// - /// * `path` - The path to the directory - /// - /// # Returns - /// - /// A raphtory graph - /// - /// # Example - /// - /// ``` - /// use raphtory::db::graph::InternalGraph; - /// use std::fs::File; - /// let g = InternalGraph::new(4); - /// g.add_vertex(1, 1, &vec![]); - /// // g.save_to_file("path_str"); - /// ``` - pub fn save_to_file>(&self, path: P) -> Result<(), Box> { - // write each shard to a different file - - // crate directory path if it doesn't exist - std::fs::create_dir_all(path.as_ref())?; - - let mut shard_paths = vec![]; - for i in 0..self.nr_shards { - let mut p = PathBuf::from(path.as_ref()); - p.push(format!("shard_{}", i)); - //TODO turn to logging? 
- //println!("saving shard {} to {:?}", i, p); - shard_paths.push((i, p)); - } - shard_paths - .par_iter() - .try_for_each(|(i, path)| self.shards[*i].save_to_file(path))?; - - let mut p = PathBuf::from(path.as_ref()); - p.push("graphdb_nr_shards"); - - let f = std::fs::File::create(p)?; - let writer = std::io::BufWriter::new(f); - bincode::serialize_into(writer, &(self.nr_shards, self.layer_ids.clone()))?; - Ok(()) - } - - // TODO: Probably add vector reference here like add - /// Add a vertex to the graph - /// - /// # Arguments - /// - /// * `t` - The time - /// * `v` - The vertex (can be a string or integer) - /// * `props` - The properties of the vertex - /// - /// # Returns - /// - /// A result containing the vertex id - /// - /// # Example - /// - /// ``` - /// use raphtory::db::graph::InternalGraph; - /// let g = InternalGraph::new(1); - /// let v = g.add_vertex(0, "Alice", &vec![]); - /// let v = g.add_vertex(0, 5, &vec![]); - /// ``` - pub fn add_vertex( - &self, - t: T, - v: V, - props: &Vec<(String, Prop)>, - ) -> Result<(), GraphError> { - let shard_id = utils::get_shard_id_from_global_vid(v.id(), self.nr_shards); - self.shards[shard_id].add_vertex(t.try_into_time()?, v, props) - } - - pub fn add_vertex_with_custom_time_format( - &self, - t: &str, - fmt: &str, - v: V, - props: &Vec<(String, Prop)>, - ) -> Result<(), GraphError> { - let time: i64 = t.parse_time(fmt)?; - self.add_vertex(time, v, props) - } - - /// Adds properties to the given input vertex. - /// - /// # Arguments - /// - /// * `v` - A vertex - /// * `data` - A vector of tuples containing the property name and value pairs to add to the vertex. 
- /// - /// # Example - /// - /// ``` - /// use raphtory::db::graph::InternalGraph; - /// use raphtory::core::Prop; - /// let graph = InternalGraph::new(1); - /// graph.add_vertex(0, "Alice", &vec![]); - /// let properties = vec![("color".to_owned(), Prop::Str("blue".to_owned())), ("weight".to_owned(), Prop::I64(11))]; - /// let result = graph.add_vertex_properties("Alice", &properties); - /// ``` - pub fn add_vertex_properties( - &self, - v: V, - data: &Vec<(String, Prop)>, - ) -> Result<(), GraphError> { - let shard_id = utils::get_shard_id_from_global_vid(v.id(), self.nr_shards); - self.shards[shard_id].add_vertex_properties(v.id(), data) - } - - // TODO: Vertex.name which gets ._id property else numba as string - /// Adds an edge between the source and destination vertices with the given timestamp and properties. - /// - /// # Arguments - /// - /// * `t` - The timestamp of the edge. - /// * `src` - An instance of `T` that implements the `InputVertex` trait representing the source vertex. - /// * `dst` - An instance of `T` that implements the `InputVertex` trait representing the destination vertex. - /// * `props` - A vector of tuples containing the property name and value pairs to add to the edge. 
- /// - /// # Example - /// - /// ``` - /// use raphtory::db::graph::InternalGraph; - /// - /// let graph = InternalGraph::new(1); - /// graph.add_vertex(1, "Alice", &vec![]); - /// graph.add_vertex(2, "Bob", &vec![]); - /// graph.add_edge(3, "Alice", "Bob", &vec![], None); - /// ``` - pub fn add_edge( - &self, - t: T, - src: V, - dst: V, - props: &Vec<(String, Prop)>, - layer: Option<&str>, - ) -> Result<(), GraphError> { - let time = t.try_into_time()?; - let src_shard_id = utils::get_shard_id_from_global_vid(src.id(), self.nr_shards); - let dst_shard_id = utils::get_shard_id_from_global_vid(dst.id(), self.nr_shards); - - let layer_id = self.get_or_allocate_layer(layer); - - if src_shard_id == dst_shard_id { - self.shards[src_shard_id].add_edge(time, src, dst, props, layer_id) - } else { - // FIXME these are sort of connected, we need to hold both locks for - // the src partition and dst partition to add a remote edge between both - self.shards[src_shard_id].add_edge_remote_out( - time, - src.clone(), - dst.clone(), - props, - layer_id, - )?; - self.shards[dst_shard_id].add_edge_remote_into(time, src, dst, props, layer_id)?; - Ok(()) - } - } - - pub fn add_edge_with_custom_time_format( - &self, - t: &str, - fmt: &str, - src: V, - dst: V, - props: &Vec<(String, Prop)>, - layer: Option<&str>, - ) -> Result<(), GraphError> { - let time: i64 = t.parse_time(fmt)?; - self.add_edge(time, src, dst, props, layer) - } - - /// Adds properties to an existing edge between a source and destination vertices - /// - /// # Arguments - /// - /// * `src` - An instance of `T` that implements the `InputVertex` trait representing the source vertex. - /// * `dst` - An instance of `T` that implements the `InputVertex` trait representing the destination vertex. - /// * `props` - A vector of tuples containing the property name and value pairs to add to the edge. 
- /// - /// # Example - /// - /// ``` - /// use raphtory::db::graph::InternalGraph; - /// use raphtory::core::Prop; - /// let graph = InternalGraph::new(1); - /// graph.add_vertex(1, "Alice", &vec![]); - /// graph.add_vertex(2, "Bob", &vec![]); - /// graph.add_edge(3, "Alice", "Bob", &vec![], None); - /// let properties = vec![("price".to_owned(), Prop::I64(100))]; - /// let result = graph.add_edge_properties("Alice", "Bob", &properties, None); - /// ``` - pub fn add_edge_properties( - &self, - src: V, - dst: V, - props: &Vec<(String, Prop)>, - layer: Option<&str>, - ) -> Result<(), GraphError> { - let layer_id = self.get_layer(layer).unwrap(); // FIXME: bubble up instead - - // TODO: we don't add properties to dst shard, but may need to depending on the plans - self.get_shard_from_id(src.id()) - .add_edge_properties(src.id(), dst.id(), props, layer_id) - } - - fn get_or_allocate_layer(&self, key: Option<&str>) -> usize { - self.get_layer(key).unwrap_or_else(|| { - let mut layer_ids = self.layer_ids.write(); - let layer_id = layer_ids.len() + 1; // default layer not included in the hashmap - layer_ids.insert(key.unwrap().to_string(), layer_id); - for shard in &self.shards { - shard.allocate_layer(layer_id).unwrap() // FIXME: bubble up error - } - layer_id - }) - } -} - -#[cfg(test)] -mod db_tests { - use super::*; - use crate::db::edge::EdgeView; - use crate::db::path::PathFromVertex; - use crate::db::view_api::edge::EdgeViewOps; - use crate::db::view_api::layer::LayerOps; - use crate::graphgen::random_attachment::random_attachment; - use itertools::Itertools; - use std::fs; - use std::sync::Arc; - use tempdir::TempDir; - use uuid::Uuid; - - #[test] - fn cloning_vec() { - let mut vs = vec![]; - for i in 0..10 { - vs.push(Arc::new(i)) - } - let should_be_10: usize = vs.iter().map(Arc::strong_count).sum(); - assert_eq!(should_be_10, 10); - - let vs2 = vs.clone(); - - let should_be_10: usize = vs2.iter().map(Arc::strong_count).sum(); - assert_eq!(should_be_10, 20) - } 
- - #[quickcheck] - fn add_vertex_grows_graph_len(vs: Vec<(i64, u64)>) { - let g = Graph::new(2); - - let expected_len = vs.iter().map(|(_, v)| v).sorted().dedup().count(); - for (t, v) in vs { - g.add_vertex(t, v, &vec![]) - .map_err(|err| println!("{:?}", err)) - .ok(); - } - - assert_eq!(g.num_vertices(), expected_len) - } - - #[quickcheck] - fn add_edge_grows_graph_edge_len(edges: Vec<(i64, u64, u64)>) { - let nr_shards: usize = 2; - - let g = InternalGraph::new(nr_shards); - - let unique_vertices_count = edges - .iter() - .flat_map(|(_, src, dst)| vec![src, dst]) - .sorted() - .dedup() - .count(); - - let unique_edge_count = edges - .iter() - .map(|(_, src, dst)| (src, dst)) - .unique() - .count(); - - for (t, src, dst) in edges { - g.add_edge(t, src, dst, &vec![], None).unwrap(); - } - - assert_eq!(g.num_vertices(), unique_vertices_count); - assert_eq!(g.num_edges(), unique_edge_count); - } - - #[quickcheck] - fn add_edge_works(edges: Vec<(i64, u64, u64)>) -> bool { - let g = InternalGraph::new(3); - for &(t, src, dst) in edges.iter() { - g.add_edge(t, src, dst, &vec![], None).unwrap(); - } - - edges - .iter() - .all(|&(_, src, dst)| g.has_edge(src, dst, None)) - } - - #[quickcheck] - fn get_edge_works(edges: Vec<(i64, u64, u64)>) -> bool { - let g = InternalGraph::new(100); - for &(t, src, dst) in edges.iter() { - g.add_edge(t, src, dst, &vec![], None).unwrap(); - } - - edges - .iter() - .all(|&(_, src, dst)| g.edge(src, dst, None).is_some()) - } - - #[test] - fn graph_save_to_load_from_file() { - let vs = vec![ - (1, 1, 2), - (2, 1, 3), - (-1, 2, 1), - (0, 1, 1), - (7, 3, 2), - (1, 1, 1), - ]; - - let g = InternalGraph::new(2); - - for (t, src, dst) in &vs { - g.add_edge(*t, *src, *dst, &vec![], None).unwrap(); - } - - let rand_dir = Uuid::new_v4(); - let tmp_raphtory_path: TempDir = TempDir::new("raphtory").unwrap(); - let shards_path = - format!("{:?}/{}", tmp_raphtory_path.path().display(), rand_dir).replace('\"', ""); - - println!("shards_path: {}", 
shards_path); - - // Save to files - let mut expected = vec![ - format!("{}/shard_1", shards_path), - format!("{}/shard_0", shards_path), - format!("{}/graphdb_nr_shards", shards_path), - ] - .iter() - .map(Path::new) - .map(PathBuf::from) - .collect::>(); - - expected.sort(); - - match g.save_to_file(&shards_path) { - Ok(()) => { - let mut actual = fs::read_dir(&shards_path) - .unwrap() - .map(|f| f.unwrap().path()) - .collect::>(); - - actual.sort(); - - assert_eq!(actual, expected); - } - Err(e) => panic!("{e}"), - } - - // Load from files - match InternalGraph::load_from_file(Path::new(&shards_path)) { - Ok(g) => { - assert!(g.has_vertex_ref(1.into())); - assert_eq!(g.nr_shards, 2); - } - Err(e) => panic!("{e}"), - } - - let _ = tmp_raphtory_path.close(); - } - - #[test] - fn has_edge() { - let g = InternalGraph::new(2); - g.add_edge(1, 7, 8, &vec![], None).unwrap(); - - assert!(!g.has_edge(8, 7, None)); - assert!(g.has_edge(7, 8, None)); - - g.add_edge(1, 7, 9, &vec![], None).unwrap(); - - assert!(!g.has_edge(9, 7, None)); - assert!(g.has_edge(7, 9, None)); - - g.add_edge(2, "haaroon", "northLondon", &vec![], None) - .unwrap(); - assert!(g.has_edge("haaroon", "northLondon", None)); - } - - #[test] - fn graph_edge() { - let g = InternalGraph::new(2); - let es = vec![ - (1, 1, 2), - (2, 1, 3), - (-1, 2, 1), - (0, 1, 1), - (7, 3, 2), - (1, 1, 1), - ]; - for (t, src, dst) in es { - g.add_edge(t, src, dst, &vec![], None).unwrap() - } - - let e = g - .edge_ref_window(1.into(), 3.into(), i64::MIN, i64::MAX, 0) - .unwrap(); - assert_eq!(g.vertex_id(g.localise_vertex_unchecked(e.src())), 1u64); - assert_eq!(g.vertex_id(g.localise_vertex_unchecked(e.dst())), 3u64); - } - - #[test] - fn graph_degree_window() { - let vs = vec![ - (1, 1, 2), - (2, 1, 3), - (-1, 2, 1), - (0, 1, 1), - (7, 3, 2), - (1, 1, 1), - ]; - - let g = InternalGraph::new(1); - - for (t, src, dst) in &vs { - g.add_edge(*t, *src, *dst, &vec![], None).unwrap(); - } - - let expected = vec![(2, 3, 1), (1, 
0, 0), (1, 0, 0)]; - let actual = (1..=3) - .map(|i| { - let i = g.vertex_ref(i).unwrap(); - ( - g.degree_window(i, -1, 7, Direction::IN, None), - g.degree_window(i, 1, 7, Direction::OUT, None), - g.degree_window(i, 0, 1, Direction::BOTH, None), - ) - }) - .collect::>(); - - assert_eq!(actual, expected); - - // Check results from multiple graphs with different number of shards - let g = InternalGraph::new(3); - - for (t, src, dst) in &vs { - g.add_edge(*t, *src, *dst, &vec![], None).unwrap(); - } - - let expected = (1..=3) - .map(|i| { - let i = g.vertex_ref(i).unwrap(); - ( - g.degree_window(i, -1, 7, Direction::IN, None), - g.degree_window(i, 1, 7, Direction::OUT, None), - g.degree_window(i, 0, 1, Direction::BOTH, None), - ) - }) - .collect::>(); - - assert_eq!(actual, expected); - } - - #[test] - fn graph_edges_window() { - let vs = vec![ - (1, 1, 2), - (2, 1, 3), - (-1, 2, 1), - (0, 1, 1), - (7, 3, 2), - (1, 1, 1), - ]; - - let g = InternalGraph::new(1); - - for (t, src, dst) in &vs { - g.add_edge(*t, *src, *dst, &vec![], None).unwrap(); - } - - let expected = vec![(2, 3, 2), (1, 0, 0), (1, 0, 0)]; - let actual = (1..=3) - .map(|i| { - let i = g.vertex_ref(i).unwrap(); - ( - g.vertex_edges_window(i, -1, 7, Direction::IN, None) - .collect::>() - .len(), - g.vertex_edges_window(i, 1, 7, Direction::OUT, None) - .collect::>() - .len(), - g.vertex_edges_window(i, 0, 1, Direction::BOTH, None) - .collect::>() - .len(), - ) - }) - .collect::>(); - - assert_eq!(actual, expected); - - // Check results from multiple graphs with different number of shards - let g = InternalGraph::new(10); - - for (t, src, dst) in &vs { - g.add_edge(*t, *src, *dst, &vec![], None).unwrap(); - } - - let expected = (1..=3) - .map(|i| { - let i = g.vertex_ref(i).unwrap(); - ( - g.vertex_edges_window(i, -1, 7, Direction::IN, None) - .collect::>() - .len(), - g.vertex_edges_window(i, 1, 7, Direction::OUT, None) - .collect::>() - .len(), - g.vertex_edges_window(i, 0, 1, Direction::BOTH, None) - 
.collect::>() - .len(), - ) - }) - .collect::>(); - - assert_eq!(actual, expected); - } - - #[test] - fn graph_edges_window_t() { - let vs = vec![ - (1, 1, 2), - (2, 1, 3), - (-1, 2, 1), - (0, 1, 1), - (7, 3, 2), - (1, 1, 1), - ]; - - let g = InternalGraph::new(1); - - for (t, src, dst) in &vs { - g.add_edge(*t, *src, *dst, &vec![], None).unwrap(); - } - - let in_actual = (1..=3) - .map(|i| { - let i = g.vertex_ref(i).unwrap(); - g.vertex_edges_window_t(i, -1, 7, Direction::IN, None) - .map(|e| e.time().unwrap()) - .sorted() // sorted by neighbour first and then time but neighbour order can be arbitrary so normalise - .collect::>() - }) - .collect::>(); - assert_eq!(vec![vec![-1, 0, 1], vec![1], vec![2]], in_actual); - - let out_actual = (1..=3) - .map(|i| { - let i = g.vertex_ref(i).unwrap(); - g.vertex_edges_window_t(i, 1, 7, Direction::OUT, None) - .map(|e| e.time().unwrap()) - .sorted() - .collect::>() - }) - .collect::>(); - assert_eq!(vec![vec![1, 1, 2], vec![], vec![]], out_actual); - - let both_actual = (1..=3) - .map(|i| { - let i = g.vertex_ref(i).unwrap(); - g.vertex_edges_window_t(i, 0, 1, Direction::BOTH, None) - .map(|e| e.time().unwrap()) - .sorted() - .collect::>() - }) - .collect::>(); - assert_eq!(vec![vec![0, 0], vec![], vec![]], both_actual); - - // Check results from multiple graphs with different number of shards - let g = InternalGraph::new(4); - - for (src, dst, t) in &vs { - g.add_edge(*src, *dst, *t, &vec![], None).unwrap(); - } - } - - #[test] - fn time_test() { - let g = Graph::new(4); - - assert_eq!(g.latest_time(), None); - assert_eq!(g.earliest_time(), None); - - g.add_vertex(5, 1, &vec![]) - .map_err(|err| println!("{:?}", err)) - .ok(); - - assert_eq!(g.latest_time(), Some(5)); - assert_eq!(g.earliest_time(), Some(5)); - - let g = Graph::new(4); - - g.add_edge(10, 1, 2, &vec![], None).unwrap(); - assert_eq!(g.latest_time(), Some(10)); - assert_eq!(g.earliest_time(), Some(10)); - - g.add_vertex(5, 1, &vec![]) - .map_err(|err| 
println!("{:?}", err)) - .ok(); - assert_eq!(g.latest_time(), Some(10)); - assert_eq!(g.earliest_time(), Some(5)); - - g.add_edge(20, 3, 4, &vec![], None).unwrap(); - assert_eq!(g.latest_time(), Some(20)); - assert_eq!(g.earliest_time(), Some(5)); - - random_attachment(&g, 100, 10); - assert_eq!(g.latest_time(), Some(126)); - assert_eq!(g.earliest_time(), Some(5)); - } - - #[test] - fn static_properties() { - let g = Graph::new(100); // big enough so all edges are very likely remote - g.add_edge(0, 11, 22, &vec![], None).unwrap(); - g.add_edge( - 0, - 11, - 11, - &vec![("temp".to_string(), Prop::Bool(true))], - None, - ) - .unwrap(); - g.add_edge(0, 22, 33, &vec![], None).unwrap(); - g.add_edge(0, 33, 11, &vec![], None).unwrap(); - g.add_vertex(0, 11, &vec![("temp".to_string(), Prop::Bool(true))]) - .unwrap(); - let v11 = g.vertex_ref(11).unwrap(); - let v22 = g.vertex_ref(22).unwrap(); - let v33 = g.vertex_ref(33).unwrap(); - let edge1111 = g.edge_ref(11.into(), 11.into(), 0).unwrap(); - let edge2233 = g.edge_ref(v22.into(), v33.into(), 0).unwrap(); - let edge3311 = g.edge_ref(v33.into(), v11.into(), 0).unwrap(); - - g.add_vertex_properties( - 11, - &vec![ - ("a".to_string(), Prop::U64(11)), - ("b".to_string(), Prop::I64(11)), - ], - ) - .unwrap(); - g.add_vertex_properties(11, &vec![("c".to_string(), Prop::U32(11))]) - .unwrap(); - g.add_vertex_properties(22, &vec![("b".to_string(), Prop::U64(22))]) - .unwrap(); - g.add_edge_properties(11, 11, &vec![("d".to_string(), Prop::U64(1111))], None) - .unwrap(); - g.add_edge_properties(33, 11, &vec![("a".to_string(), Prop::U64(3311))], None) - .unwrap(); - - assert_eq!(g.static_vertex_prop_names(v11), vec!["a", "b", "c"]); - assert_eq!(g.static_vertex_prop_names(v22), vec!["b"]); - assert!(g.static_vertex_prop_names(v33).is_empty()); - assert_eq!(g.static_edge_prop_names(edge1111), vec!["d"]); - assert_eq!(g.static_edge_prop_names(edge3311), vec!["a"]); - assert!(g.static_edge_prop_names(edge2233).is_empty()); - - 
assert_eq!( - g.static_vertex_prop(v11, "a".to_string()), - Some(Prop::U64(11)) - ); - assert_eq!( - g.static_vertex_prop(v11, "b".to_string()), - Some(Prop::I64(11)) - ); - assert_eq!( - g.static_vertex_prop(v11, "c".to_string()), - Some(Prop::U32(11)) - ); - assert_eq!( - g.static_vertex_prop(v22, "b".to_string()), - Some(Prop::U64(22)) - ); - assert_eq!(g.static_vertex_prop(v22, "a".to_string()), None); - assert_eq!( - g.static_edge_prop(edge1111, "d".to_string()), - Some(Prop::U64(1111)) - ); - assert_eq!( - g.static_edge_prop(edge3311, "a".to_string()), - Some(Prop::U64(3311)) - ); - assert_eq!(g.static_edge_prop(edge2233, "a".to_string()), None); - } - - #[test] - #[should_panic] - fn changing_property_type_for_vertex_panics() { - let g = InternalGraph::new(4); - g.add_vertex(0, 11, &vec![("test".to_string(), Prop::Bool(true))]) - .unwrap(); - g.add_vertex_properties(11, &vec![("test".to_string(), Prop::Bool(true))]) - .unwrap(); - } - - #[test] - #[should_panic] - fn changing_property_type_for_edge_panics() { - let g = InternalGraph::new(4); - g.add_edge( - 0, - 11, - 22, - &vec![("test".to_string(), Prop::Bool(true))], - None, - ) - .unwrap(); - g.add_edge_properties(11, 22, &vec![("test".to_string(), Prop::Bool(true))], None) - .unwrap(); - } - - #[test] - fn graph_neighbours_window() { - let vs = vec![ - (1, 1, 2), - (2, 1, 3), - (-1, 2, 1), - (0, 1, 1), - (7, 3, 2), - (1, 1, 1), - ]; - - let g = InternalGraph::new(2); - - for (t, src, dst) in &vs { - g.add_edge(*t, *src, *dst, &vec![], None).unwrap(); - } - - let local_1 = VertexRef::new_local(0, 1); - let remote_2 = VertexRef::Remote(2); - let local_3 = VertexRef::new_local(1, 1); - - let expected = [ - ( - vec![local_1, remote_2], - vec![local_1, local_3, remote_2], - vec![local_1], - ), - (vec![VertexRef::Remote(1)], vec![], vec![]), - (vec![local_1], vec![], vec![]), - ]; - let actual = (1..=3) - .map(|i| { - let i = g.vertex_ref(i).unwrap(); - ( - g.neighbours_window(i, -1, 7, Direction::IN, None) - 
.collect::>(), - g.neighbours_window(i, 1, 7, Direction::OUT, None) - .collect::>(), - g.neighbours_window(i, 0, 1, Direction::BOTH, None) - .collect::>(), - ) - }) - .collect::>(); - - assert_eq!(actual, expected); - } - - #[test] - fn test_time_range_on_empty_graph() { - let g = InternalGraph::new(1); - - let rolling = g.rolling(1, None).unwrap().collect_vec(); - assert!(rolling.is_empty()); - - let expanding = g.expanding(1).unwrap().collect_vec(); - assert!(expanding.is_empty()); - } - - #[test] - fn test_add_vertex_with_strings() { - let g = InternalGraph::new(1); - - g.add_vertex(0, "haaroon", &vec![]).unwrap(); - g.add_vertex(1, "hamza", &vec![]).unwrap(); - g.add_vertex(1, 831, &vec![]).unwrap(); - - assert!(g.has_vertex(831)); - assert!(g.has_vertex("haaroon")); - assert!(g.has_vertex("hamza")); - - assert_eq!(g.num_vertices(), 3); - } - - #[test] - fn layers() { - let g = InternalGraph::new(4); - g.add_edge(0, 11, 22, &vec![], None).unwrap(); - g.add_edge(0, 11, 33, &vec![], None).unwrap(); - g.add_edge(0, 33, 11, &vec![], None).unwrap(); - g.add_edge(0, 11, 22, &vec![], Some("layer1")).unwrap(); - g.add_edge(0, 11, 33, &vec![], Some("layer2")).unwrap(); - g.add_edge(0, 11, 44, &vec![], Some("layer2")).unwrap(); - - assert_eq!(g.has_edge(11, 22, None), true); - assert_eq!(g.has_edge(11, 44, None), false); - assert_eq!(g.has_edge(11, 22, Some("layer2")), false); - assert_eq!(g.has_edge(11, 44, Some("layer2")), true); - - assert!(g.edge(11, 22, None).is_some()); - assert!(g.edge(11, 44, None).is_none()); - assert!(g.edge(11, 22, Some("layer2")).is_none()); - assert!(g.edge(11, 44, Some("layer2")).is_some()); - - let dft_layer = g.default_layer(); - let layer1 = g.layer("layer1").unwrap(); - let layer2 = g.layer("layer2").unwrap(); - assert!(g.layer("missing layer").is_none()); - - assert_eq!(g.num_edges(), 4); - assert_eq!(dft_layer.num_edges(), 3); - assert_eq!(layer1.num_edges(), 1); - assert_eq!(layer2.num_edges(), 2); - - let vertex = 
g.vertex(11).unwrap(); - let vertex_dft = dft_layer.vertex(11).unwrap(); - let vertex1 = layer1.vertex(11).unwrap(); - let vertex2 = layer2.vertex(11).unwrap(); - - assert_eq!(vertex.degree(), 3); - assert_eq!(vertex_dft.degree(), 2); - assert_eq!(vertex1.degree(), 1); - assert_eq!(vertex2.degree(), 2); - - assert_eq!(vertex.out_degree(), 3); - assert_eq!(vertex_dft.out_degree(), 2); - assert_eq!(vertex1.out_degree(), 1); - assert_eq!(vertex2.out_degree(), 2); - - assert_eq!(vertex.in_degree(), 1); - assert_eq!(vertex_dft.in_degree(), 1); - assert_eq!(vertex1.in_degree(), 0); - assert_eq!(vertex2.in_degree(), 0); - - fn to_tuples>>( - edges: I, - ) -> Vec<(u64, u64)> { - edges - .map(|e| (e.src().id(), e.dst().id())) - .sorted() - .collect_vec() - } - - assert_eq!( - to_tuples(vertex.edges()), - vec![(11, 22), (11, 22), (11, 33), (11, 33), (11, 44), (33, 11)] - ); - assert_eq!( - to_tuples(vertex_dft.edges()), - vec![(11, 22), (11, 33), (33, 11)] - ); - assert_eq!(to_tuples(vertex1.edges()), vec![(11, 22)]); - assert_eq!(to_tuples(vertex2.edges()), vec![(11, 33), (11, 44)]); - - assert_eq!(to_tuples(vertex.in_edges()), vec![(33, 11)]); - assert_eq!(to_tuples(vertex_dft.in_edges()), vec![(33, 11)]); - assert_eq!(to_tuples(vertex1.in_edges()), vec![]); - assert_eq!(to_tuples(vertex2.in_edges()), vec![]); - - assert_eq!( - to_tuples(vertex.out_edges()), - vec![(11, 22), (11, 22), (11, 33), (11, 33), (11, 44)] - ); - assert_eq!(to_tuples(vertex_dft.out_edges()), vec![(11, 22), (11, 33)]); - assert_eq!(to_tuples(vertex1.out_edges()), vec![(11, 22)]); - assert_eq!(to_tuples(vertex2.out_edges()), vec![(11, 33), (11, 44)]); - - fn to_ids(neighbours: PathFromVertex) -> Vec { - neighbours.iter().map(|n| n.id()).sorted().collect_vec() - } - - assert_eq!(to_ids(vertex.neighbours()), vec![22, 33, 44]); - assert_eq!(to_ids(vertex_dft.neighbours()), vec![22, 33]); - assert_eq!(to_ids(vertex1.neighbours()), vec![22]); - assert_eq!(to_ids(vertex2.neighbours()), vec![33, 44]); - - 
assert_eq!(to_ids(vertex.out_neighbours()), vec![22, 33, 44]); - assert_eq!(to_ids(vertex_dft.out_neighbours()), vec![22, 33]); - assert_eq!(to_ids(vertex1.out_neighbours()), vec![22]); - assert_eq!(to_ids(vertex2.out_neighbours()), vec![33, 44]); - - assert_eq!(to_ids(vertex.in_neighbours()), vec![33]); - assert_eq!(to_ids(vertex_dft.in_neighbours()), vec![33]); - assert!(to_ids(vertex1.in_neighbours()).is_empty()); - assert!(to_ids(vertex2.in_neighbours()).is_empty()); - } - - #[test] - fn test_exploded_edge() { - let g = InternalGraph::new(1); - g.add_edge(0, 1, 2, &vec![("weight".to_string(), Prop::I64(1))], None) - .unwrap(); - g.add_edge(1, 1, 2, &vec![("weight".to_string(), Prop::I64(2))], None) - .unwrap(); - g.add_edge(2, 1, 2, &vec![("weight".to_string(), Prop::I64(3))], None) - .unwrap(); - - let exploded = g.edge(1, 2, None).unwrap().explode(); - - let res = exploded.map(|e| e.properties(false)).collect_vec(); - - let mut expected = Vec::new(); - for i in 1..4 { - let mut map = HashMap::new(); - map.insert("weight".to_string(), Prop::I64(i)); - expected.push(map); - } - - assert_eq!(res, expected); - - let e = g - .vertex(1) - .unwrap() - .edges() - .explode() - .map(|e| e.properties(false)) - .collect_vec(); - assert_eq!(e, expected); - } - - #[test] - fn test_edge_earliest_latest() { - let g = InternalGraph::new(1); - g.add_edge(0, 1, 2, &vec![], None).unwrap(); - g.add_edge(1, 1, 2, &vec![], None).unwrap(); - g.add_edge(2, 1, 2, &vec![], None).unwrap(); - g.add_edge(0, 1, 3, &vec![], None).unwrap(); - g.add_edge(1, 1, 3, &vec![], None).unwrap(); - g.add_edge(2, 1, 3, &vec![], None).unwrap(); - - let mut res = g.edge(1, 2, None).unwrap().earliest_time().unwrap(); - assert_eq!(res, 0); - - res = g.edge(1, 2, None).unwrap().latest_time().unwrap(); - assert_eq!(res, 2); - - res = g.at(1).edge(1, 2, None).unwrap().earliest_time().unwrap(); - assert_eq!(res, 0); - - res = g.at(1).edge(1, 2, None).unwrap().latest_time().unwrap(); - assert_eq!(res, 1); - - 
let res_list: Vec = g - .vertex(1) - .unwrap() - .edges() - .earliest_time() - .flatten() - .collect(); - assert_eq!(res_list, vec![0, 0]); - - let res_list: Vec = g - .vertex(1) - .unwrap() - .edges() - .latest_time() - .flatten() - .collect(); - assert_eq!(res_list, vec![2, 2]); - - let res_list: Vec = g - .vertex(1) - .unwrap() - .at(1) - .edges() - .earliest_time() - .flatten() - .collect(); - assert_eq!(res_list, vec![0, 0]); - - let res_list: Vec = g - .vertex(1) - .unwrap() - .at(1) - .edges() - .latest_time() - .flatten() - .collect(); - assert_eq!(res_list, vec![1, 1]); - } - - #[test] - fn check_vertex_history() { - let g = InternalGraph::new(1); - - g.add_vertex(1, 1, &vec![]).unwrap(); - g.add_vertex(2, 1, &vec![]).unwrap(); - g.add_vertex(3, 1, &vec![]).unwrap(); - g.add_vertex(4, 1, &vec![]).unwrap(); - g.add_vertex(8, 1, &vec![]).unwrap(); - - g.add_vertex(4, "Lord Farquaad", &vec![]).unwrap(); - g.add_vertex(6, "Lord Farquaad", &vec![]).unwrap(); - g.add_vertex(7, "Lord Farquaad", &vec![]).unwrap(); - g.add_vertex(8, "Lord Farquaad", &vec![]).unwrap(); - - let times_of_one = g.vertex(1).unwrap().history(); - let times_of_farquaad = g.vertex("Lord Farquaad").unwrap().history(); - - assert_eq!(times_of_one, [1, 2, 3, 4, 8]); - assert_eq!(times_of_farquaad, [4, 6, 7, 8]); - - let view = g.window(1, 8); - - let windowed_times_of_one = view.vertex(1).unwrap().history(); - let windowed_times_of_farquaad = view.vertex("Lord Farquaad").unwrap().history(); - assert_eq!(windowed_times_of_one, [1, 2, 3, 4]); - assert_eq!(windowed_times_of_farquaad, [4, 6, 7]); - } - - #[test] - fn check_edge_history() { - let g = InternalGraph::new(1); - - g.add_edge(1, 1, 2, &vec![], None).unwrap(); - g.add_edge(2, 1, 3, &vec![], None).unwrap(); - g.add_edge(3, 1, 2, &vec![], None).unwrap(); - g.add_edge(4, 1, 4, &vec![], None).unwrap(); - - let times_of_onetwo = g.edge(1, 2, None).unwrap().history(); - let times_of_four = g.edge(1, 4, None).unwrap().window(1, 5).history(); - 
let view = g.window(2, 5); - let windowed_times_of_four = view.edge(1, 4, None).unwrap().window(2, 4).history(); - - assert_eq!(times_of_onetwo, [1, 3]); - assert_eq!(times_of_four, [4]); - assert!(windowed_times_of_four.is_empty()); - } - - #[test] - fn check_edge_history_on_multiple_shards() { - let g = InternalGraph::new(10); - - g.add_edge(1, 1, 2, &vec![], None).unwrap(); - g.add_edge(2, 1, 3, &vec![], None).unwrap(); - g.add_edge(3, 1, 2, &vec![], None).unwrap(); - g.add_edge(4, 1, 4, &vec![], None).unwrap(); - g.add_edge(5, 1, 4, &vec![], None).unwrap(); - g.add_edge(6, 1, 4, &vec![], None).unwrap(); - g.add_edge(7, 1, 4, &vec![], None).unwrap(); - g.add_edge(8, 1, 4, &vec![], None).unwrap(); - g.add_edge(9, 1, 4, &vec![], None).unwrap(); - g.add_edge(10, 1, 4, &vec![], None).unwrap(); - - let times_of_onetwo = g.edge(1, 2, None).unwrap().history(); - let times_of_four = g.edge(1, 4, None).unwrap().window(1, 5).history(); - let times_of_outside_window = g.edge(1, 4, None).unwrap().window(1, 4).history(); - let times_of_four_higher = g.edge(1, 4, None).unwrap().window(6, 11).history(); - - let view = g.window(1, 11); - let windowed_times_of_four = view.edge(1, 4, None).unwrap().window(2, 5).history(); - let windowed_times_of_four_higher = view.edge(1, 4, None).unwrap().window(8, 11).history(); - - assert_eq!(times_of_onetwo, [1, 3]); - assert_eq!(times_of_four, [4]); - assert_eq!(times_of_four_higher, [6, 7, 8, 9, 10]); - assert!(times_of_outside_window.is_empty()); - assert_eq!(windowed_times_of_four, [4]); - assert_eq!(windowed_times_of_four_higher, [8, 9, 10]); - } - - #[test] - fn check_vertex_history_multiple_shards() { - let g = InternalGraph::new(10); - - g.add_vertex(1, 1, &vec![]).unwrap(); - g.add_vertex(2, 1, &vec![]).unwrap(); - g.add_vertex(3, 1, &vec![]).unwrap(); - g.add_vertex(4, 1, &vec![]).unwrap(); - g.add_vertex(5, 2, &vec![]).unwrap(); - g.add_vertex(6, 2, &vec![]).unwrap(); - g.add_vertex(7, 2, &vec![]).unwrap(); - g.add_vertex(8, 1, 
&vec![]).unwrap(); - g.add_vertex(9, 2, &vec![]).unwrap(); - g.add_vertex(10, 2, &vec![]).unwrap(); - - g.add_vertex(4, "Lord Farquaad", &vec![]).unwrap(); - g.add_vertex(6, "Lord Farquaad", &vec![]).unwrap(); - g.add_vertex(7, "Lord Farquaad", &vec![]).unwrap(); - g.add_vertex(8, "Lord Farquaad", &vec![]).unwrap(); - - let times_of_one = g.vertex(1).unwrap().history(); - let times_of_farquaad = g.vertex("Lord Farquaad").unwrap().history(); - let times_of_upper = g.vertex(2).unwrap().history(); - - assert_eq!(times_of_one, [1, 2, 3, 4, 8]); - assert_eq!(times_of_farquaad, [4, 6, 7, 8]); - assert_eq!(times_of_upper, [5, 6, 7, 9, 10]); - - let view = g.window(1, 8); - let windowed_times_of_one = view.vertex(1).unwrap().history(); - let windowed_times_of_two = view.vertex(2).unwrap().history(); - let windowed_times_of_farquaad = view.vertex("Lord Farquaad").unwrap().history(); - - assert_eq!(windowed_times_of_one, [1, 2, 3, 4]); - assert_eq!(windowed_times_of_farquaad, [4, 6, 7]); - assert_eq!(windowed_times_of_two, [5, 6, 7]); - } - - #[test] - fn test_ingesting_timestamps() { - let earliest_time = "2022-06-06 12:34:00".try_into_time().unwrap(); - let latest_time = "2022-06-07 12:34:00".try_into_time().unwrap(); - - let g = InternalGraph::new(4); - g.add_vertex("2022-06-06T12:34:00.000", 0, &vec![]).unwrap(); - g.add_edge("2022-06-07T12:34:00", 1, 2, &vec![], None) - .unwrap(); - assert_eq!(g.earliest_time().unwrap(), earliest_time); - assert_eq!(g.latest_time().unwrap(), latest_time); - - let g = InternalGraph::new(4); - let fmt = "%Y-%m-%d %H:%M"; - g.add_vertex_with_custom_time_format("2022-06-06 12:34", fmt, 0, &vec![]) - .unwrap(); - g.add_edge_with_custom_time_format("2022-06-07 12:34", fmt, 1, 2, &vec![], None) - .unwrap(); - assert_eq!(g.earliest_time().unwrap(), earliest_time); - assert_eq!(g.latest_time().unwrap(), latest_time); - } - - #[test] - fn test_prop_display_str() { - let mut prop = Prop::Str(String::from("hello")); - assert_eq!(format!("{}", 
prop), "hello"); - - prop = Prop::I32(42); - assert_eq!(format!("{}", prop), "42"); - - prop = Prop::I64(9223372036854775807); - assert_eq!(format!("{}", prop), "9223372036854775807"); - - prop = Prop::U32(4294967295); - assert_eq!(format!("{}", prop), "4294967295"); - - prop = Prop::U64(18446744073709551615); - assert_eq!(format!("{}", prop), "18446744073709551615"); - - prop = Prop::F32(3.14159); - assert_eq!(format!("{}", prop), "3.14159"); - - prop = Prop::F64(3.141592653589793); - assert_eq!(format!("{}", prop), "3.141592653589793"); - - prop = Prop::Bool(true); - assert_eq!(format!("{}", prop), "true"); - } - - #[test] - fn test_temporral_edge_props_window() { - let g = Graph::new(1); - g.add_edge(1, 1, 2, &vec![("weight".to_string(), Prop::I64(1))], None) - .unwrap(); - g.add_edge(2, 1, 2, &vec![("weight".to_string(), Prop::I64(2))], None) - .unwrap(); - g.add_edge(3, 1, 2, &vec![("weight".to_string(), Prop::I64(3))], None) - .unwrap(); - - let e = g.vertex(1).unwrap().out_edges().next().unwrap(); - - let res = g.temporal_edge_props_window(EdgeRef::from(e), 1, 3); - let mut exp = HashMap::new(); - exp.insert( - "weight".to_string(), - vec![(1, Prop::I64(1)), (2, Prop::I64(2))], - ); - assert_eq!(res, exp); - } - - #[test] - fn test_vertex_early_late_times() { - let g = InternalGraph::new(1); - g.add_vertex(1, 1, &vec![]).unwrap(); - g.add_vertex(2, 1, &vec![]).unwrap(); - g.add_vertex(3, 1, &vec![]).unwrap(); - - assert_eq!(g.vertex(1).unwrap().earliest_time(), Some(1)); - assert_eq!(g.vertex(1).unwrap().latest_time(), Some(3)); - - assert_eq!(g.at(2).vertex(1).unwrap().earliest_time(), Some(1)); - assert_eq!(g.at(2).vertex(1).unwrap().latest_time(), Some(2)); - } - - #[test] - fn test_vertex_ids() { - let g = InternalGraph::new(1); - g.add_vertex(1, 1, &vec![]).unwrap(); - g.add_vertex(1, 2, &vec![]).unwrap(); - g.add_vertex(2, 3, &vec![]).unwrap(); - - assert_eq!(g.vertices().id().collect::>(), vec![1, 2, 3]); - - let g_at = g.at(1); - 
assert_eq!(g_at.vertices().id().collect::>(), vec![1, 2]); - } - - #[test] - fn test_edge_layer_name() -> Result<(), GraphError> { - let g = InternalGraph::new(4); - g.add_edge(0, 0, 1, &vec![], None)?; - g.add_edge(0, 0, 1, &vec![], Some("awesome name"))?; - - let layer_names = g.edges().map(|e| e.layer_name()).sorted().collect_vec(); - assert_eq!(layer_names, vec!["awesome name", "default layer"]); - Ok(()) - } - - #[test] - fn test_edge_from_single_layer() { - let g = InternalGraph::new(4); - g.add_edge(0, 1, 2, &vec![], Some("layer")).unwrap(); - - assert!(g.edge(1, 2, None).is_none()); - assert!(g.layer("layer").unwrap().edge(1, 2, None).is_some()) - } - - #[test] - fn test_unique_layers() { - let g = InternalGraph::new(4); - g.add_edge(0, 1, 2, &vec![], Some("layer1")).unwrap(); - g.add_edge(0, 1, 2, &vec![], Some("layer2")).unwrap(); - assert_eq!( - g.layer("layer2").unwrap().get_unique_layers(), - vec!["layer2"] - ) - } - - #[quickcheck] - fn vertex_from_id_is_consistent(vertices: Vec) -> bool { - let g = InternalGraph::new(1); - for v in vertices.iter() { - g.add_vertex(0, *v, &vec![]).unwrap(); - } - g.vertices() - .name() - .map(|name| g.vertex(name)) - .all(|v| v.is_some()) - } - - #[quickcheck] - fn exploded_edge_times_is_consistent(edges: Vec<(u64, u64, Vec)>, offset: i64) -> bool { - let mut correct = true; - let mut check = |condition: bool, message: String| { - if !condition { - println!("Failed: {}", message); - } - correct = correct && condition; - }; - // checks that exploded edges are preserved with correct timestamps - let mut edges: Vec<(u64, u64, Vec)> = - edges.into_iter().filter(|e| !e.2.is_empty()).collect(); - // discard edges without timestamps - for e in edges.iter_mut() { - e.2.sort(); - // FIXME: Should not have to do this, see issue https://github.com/Pometry/Raphtory/issues/973 - e.2.dedup(); // add each timestamp only once (multi-edge per timestamp currently not implemented) - } - edges.sort(); - edges.dedup_by_key(|(src, dst, _)| 
(*src, *dst)); - - let g = Graph::new(1); - for (src, dst, times) in edges.iter() { - for t in times.iter() { - g.add_edge(*t, *src, *dst, &vec![], None).unwrap(); - } - } - - let mut actual_edges: Vec<(u64, u64, Vec)> = g - .edges() - .map(|e| { - ( - e.src().id(), - e.dst().id(), - e.explode() - .map(|ee| { - check( - ee.earliest_time() == ee.latest_time(), - format!("times mismatched for {:?}", ee), - ); // times are the same for exploded edge - let t = ee.earliest_time().unwrap(); - check( - ee.active(t), - format!("exploded edge {:?} inactive at {}", ee, t), - ); - if t < i64::MAX { - // window is broken at MAX! - check(e.active(t), format!("edge {:?} inactive at {}", e, t)); - } - let t_test = t.saturating_add(offset); - if t_test != t && t_test < i64::MAX && t_test > i64::MIN { - check( - !ee.active(t_test), - format!("exploded edge {:?} active at {}", ee, t_test), - ); - } - t - }) - .collect(), - ) - }) - .collect(); - - for e in actual_edges.iter_mut() { - e.2.sort(); - } - actual_edges.sort(); - check( - actual_edges == edges, - format!( - "actual edges didn't match input actual: {:?}, expected: {:?}", - actual_edges, edges - ), - ); - correct - } -} diff --git a/raphtory/src/db/graph/edge.rs b/raphtory/src/db/graph/edge.rs new file mode 100644 index 0000000000..3622d68940 --- /dev/null +++ b/raphtory/src/db/graph/edge.rs @@ -0,0 +1,561 @@ +//! Defines the `Edge` struct, which represents an edge in the graph. +//! +//! Edges are used to define directed connections between verticies in the graph. +//! Edges are identified by a unique ID, can have a direction (Ingoing, Outgoing, or Both) +//! and can have properties associated with them. +//! 
+ +use super::views::layer_graph::LayeredGraph; +use crate::{ + core::{ + entities::{edges::edge_ref::EdgeRef, LayerIds, VID}, + storage::timeindex::TimeIndexEntry, + utils::{errors::GraphError, time::IntoTime}, + ArcStr, + }, + db::{ + api::{ + mutation::{ + internal::{InternalAdditionOps, InternalDeletionOps, InternalPropertyAdditionOps}, + CollectProperties, TryIntoInputTime, + }, + properties::{ + internal::{ConstPropertiesOps, TemporalPropertiesOps, TemporalPropertyViewOps}, + Properties, + }, + view::{internal::Static, BoxedIter, EdgeViewInternalOps, LayerOps}, + }, + graph::{vertex::VertexView, views::window_graph::WindowedGraph}, + }, + prelude::*, +}; +use std::{ + fmt::{Debug, Formatter}, + iter, +}; + +/// A view of an edge in the graph. +#[derive(Clone)] +pub struct EdgeView { + /// A view of an edge in the graph. + pub graph: G, + /// A reference to the edge. + pub edge: EdgeRef, +} + +impl Static for EdgeView {} + +impl EdgeView { + pub fn new(graph: G, edge: EdgeRef) -> Self { + Self { graph, edge } + } + + pub(crate) fn layer_ids(&self) -> LayerIds { + self.graph.layer_ids().constrain_from_edge(self.edge) + } +} + +impl + EdgeView +{ + pub fn delete(&self, t: T, layer: Option<&str>) -> Result<(), GraphError> { + let t = TimeIndexEntry::from_input(&self.graph, t)?; + let layer = self.resolve_layer(layer)?; + self.graph + .internal_delete_edge(t, self.edge.src(), self.edge.dst(), layer) + } +} + +impl PartialEq for EdgeView { + fn eq(&self, other: &Self) -> bool { + self.id() == other.id() + } +} + +impl EdgeViewInternalOps> for EdgeView { + fn graph(&self) -> G { + self.graph.clone() + } + + fn eref(&self) -> EdgeRef { + self.edge + } + + fn new_vertex(&self, v: VID) -> VertexView { + VertexView::new_internal(self.graph(), v) + } + + fn new_edge(&self, e: EdgeRef) -> Self { + Self { + graph: self.graph(), + edge: e, + } + } +} + +impl EdgeView { + fn resolve_layer(&self, layer: Option<&str>) -> Result { + match layer { + Some(name) => match 
self.edge.layer() { + Some(l_id) => self + .graph + .get_layer_id(name) + .filter(|id| id == l_id) + .ok_or_else(|| GraphError::InvalidLayer(name.to_owned())), + None => Ok(self.graph.resolve_layer(layer)), + }, + None => Ok(self.edge.layer().copied().unwrap_or(0)), + } + } + + /// Add constant properties for the edge + /// + /// Returns a person with the name given them + /// + /// # Arguments + /// + /// * `props` - Property key-value pairs to add + /// * `layer` - The layer to which properties should be added. If the edge view is restricted to a + /// single layer, 'None' will add the properties to that layer and 'Some("name")' + /// fails unless the layer matches the edge view. If the edge view is not restricted + /// to a single layer, 'None' sets the properties on the default layer and 'Some("name")' + /// sets the properties on layer '"name"' and fails if that layer doesn't exist. + pub fn add_constant_properties( + &self, + props: C, + layer: Option<&str>, + ) -> Result<(), GraphError> { + let properties: Vec<(usize, Prop)> = props.collect_properties( + |name, dtype| self.graph.resolve_edge_property(name, dtype, true), + |prop| self.graph.process_prop_value(prop), + )?; + let input_layer_id = self.resolve_layer(layer)?; + + self.graph.internal_add_constant_edge_properties( + self.edge.pid(), + input_layer_id, + properties, + ) + } + + pub fn add_updates( + &self, + time: T, + props: C, + layer: Option<&str>, + ) -> Result<(), GraphError> { + let t = TimeIndexEntry::from_input(&self.graph, time)?; + let layer_id = self.resolve_layer(layer)?; + let properties: Vec<(usize, Prop)> = props.collect_properties( + |name, dtype| self.graph.resolve_edge_property(name, dtype, false), + |prop| self.graph.process_prop_value(prop), + )?; + + self.graph + .internal_add_edge(t, self.edge.src(), self.edge.dst(), properties, layer_id)?; + Ok(()) + } +} + +impl ConstPropertiesOps for EdgeView { + fn get_const_prop_id(&self, name: &str) -> Option { + 
self.graph.edge_meta().const_prop_meta().get_id(name) + } + + fn get_const_prop_name(&self, id: usize) -> ArcStr { + self.graph.edge_meta().const_prop_meta().get_name(id) + } + + fn const_prop_ids(&self) -> Box + '_> { + self.graph + .const_edge_prop_ids(self.edge, self.graph.layer_ids()) + } + + fn const_prop_keys(&self) -> Box + '_> { + let reverse_map = self.graph.edge_meta().const_prop_meta().get_keys(); + Box::new(self.const_prop_ids().map(move |id| reverse_map[id].clone())) + } + + fn get_const_prop(&self, id: usize) -> Option { + self.graph + .get_const_edge_prop(self.edge, id, self.graph.layer_ids()) + } +} + +impl TemporalPropertyViewOps for EdgeView { + fn temporal_history(&self, id: usize) -> Vec { + self.graph + .temporal_edge_prop_vec(self.edge, id, self.graph.layer_ids()) + .into_iter() + .map(|(t, _)| t) + .collect() + } + + fn temporal_values(&self, id: usize) -> Vec { + let layer_ids = self.graph.layer_ids().constrain_from_edge(self.edge); + self.graph + .temporal_edge_prop_vec(self.edge, id, layer_ids) + .into_iter() + .map(|(_, v)| v) + .collect() + } +} + +impl TemporalPropertiesOps for EdgeView { + fn get_temporal_prop_id(&self, name: &str) -> Option { + self.graph + .edge_meta() + .temporal_prop_meta() + .get_id(name) + .filter(|id| { + self.graph + .has_temporal_edge_prop(self.edge, *id, self.layer_ids()) + }) + } + + fn get_temporal_prop_name(&self, id: usize) -> ArcStr { + self.graph.edge_meta().temporal_prop_meta().get_name(id) + } + + fn temporal_prop_ids(&self) -> Box + '_> { + Box::new( + self.graph + .temporal_edge_prop_ids(self.edge, self.layer_ids()) + .filter(|id| { + self.graph + .has_temporal_edge_prop(self.edge, *id, self.layer_ids()) + }), + ) + } + + fn temporal_prop_keys(&self) -> Box + '_> { + let reverse_map = self.graph.edge_meta().temporal_prop_meta().get_keys(); + Box::new( + self.temporal_prop_ids() + .map(move |id| reverse_map[id].clone()), + ) + } +} + +impl EdgeViewOps for EdgeView { + type Graph = G; + type Vertex = 
VertexView; + type EList = BoxedIter; + + fn explode(&self) -> Self::EList { + let ev = self.clone(); + match self.edge.time() { + Some(_) => Box::new(iter::once(ev)), + None => { + let layer_ids = self.graph.layer_ids().constrain_from_edge(self.edge); + let e = self.edge; + let ex_iter = self.graph.edge_exploded(e, layer_ids); + // FIXME: use duration + Box::new(ex_iter.map(move |ex| ev.new_edge(ex))) + } + } + } + + fn explode_layers(&self) -> Self::EList { + let ev = self.clone(); + match self.edge.layer() { + Some(_) => Box::new(iter::once(ev)), + None => { + let e = self.edge; + let ex_iter = self.graph.edge_layers(e, self.graph.layer_ids()); + Box::new(ex_iter.map(move |ex| ev.new_edge(ex))) + } + } + } +} + +impl Debug for EdgeView { + fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result { + write!( + f, + "EdgeView({}, {})", + self.graph.vertex(self.edge.src()).unwrap().id(), + self.graph.vertex(self.edge.dst()).unwrap().id() + ) + } +} + +impl From> for EdgeRef { + fn from(value: EdgeView) -> Self { + value.edge + } +} + +impl TimeOps for EdgeView { + type WindowedViewType = EdgeView>; + + fn start(&self) -> Option { + self.graph.start() + } + + fn end(&self) -> Option { + self.graph.end() + } + + fn window(&self, t_start: T, t_end: T) -> Self::WindowedViewType { + EdgeView { + graph: self.graph.window(t_start, t_end), + edge: self.edge, + } + } +} + +impl LayerOps for EdgeView { + type LayeredViewType = EdgeView>; + + fn default_layer(&self) -> Self::LayeredViewType { + EdgeView { + graph: self.graph.default_layer(), + edge: self.edge, + } + } + + fn layer>(&self, name: L) -> Option { + let layer_ids = self + .graph + .layer_ids_from_names(name.into()) + .constrain_from_edge(self.edge); + self.graph + .has_edge_ref( + self.edge.src(), + self.edge.dst(), + &layer_ids, + self.graph.edge_filter(), + ) + .then(|| EdgeView { + graph: LayeredGraph::new(self.graph.clone(), layer_ids), + edge: self.edge, + }) + } +} + +/// Implement `EdgeListOps` trait for an 
iterator of `EdgeView` objects. +/// +/// This implementation enables the use of the `src` and `dst` methods to retrieve the vertices +/// connected to the edges inside the iterator. +impl EdgeListOps for BoxedIter> { + type Graph = G; + type Vertex = VertexView; + type Edge = EdgeView; + type ValueType = T; + + /// Specifies the associated type for an iterator over vertices. + type VList = Box> + Send>; + + /// Specifies the associated type for the iterator over edges. + type IterType = Box + Send>; + + fn properties(self) -> Self::IterType> { + Box::new(self.map(move |e| e.properties())) + } + + /// Returns an iterator over the source vertices of the edges in the iterator. + fn src(self) -> Self::VList { + Box::new(self.map(|e| e.src())) + } + + /// Returns an iterator over the destination vertices of the edges in the iterator. + fn dst(self) -> Self::VList { + Box::new(self.map(|e| e.dst())) + } + + fn id(self) -> Self::IterType<(u64, u64)> { + Box::new(self.map(|e| e.id())) + } + + /// returns an iterator of exploded edges that include an edge at each point in time + fn explode(self) -> Self { + Box::new(self.flat_map(move |e| e.explode())) + } + + /// Gets the earliest times of a list of edges + fn earliest_time(self) -> Self::IterType> { + Box::new(self.map(|e| e.earliest_time())) + } + + /// Gets the latest times of a list of edges + fn latest_time(self) -> Self::IterType> { + Box::new(self.map(|e| e.latest_time())) + } + + fn time(self) -> Self::IterType> { + Box::new(self.map(|e| e.time())) + } + + fn layer_name(self) -> Self::IterType> { + Box::new(self.map(|e| e.layer_name().map(|v| v.clone()))) + } +} + +impl EdgeListOps for BoxedIter>> { + type Graph = G; + type Vertex = VertexView; + type Edge = EdgeView; + type ValueType = Box + Send>; + type VList = Box> + Send>> + Send>; + type IterType = Box + Send>> + Send>; + + fn properties(self) -> Self::IterType> { + Box::new(self.map(move |it| it.properties())) + } + + fn src(self) -> Self::VList { + 
Box::new(self.map(|it| it.src())) + } + + fn dst(self) -> Self::VList { + Box::new(self.map(|it| it.dst())) + } + + fn id(self) -> Self::IterType<(u64, u64)> { + Box::new(self.map(|it| it.id())) + } + + fn explode(self) -> Self { + Box::new(self.map(move |it| it.explode())) + } + + /// Gets the earliest times of a list of edges + fn earliest_time(self) -> Self::IterType> { + Box::new(self.map(|e| e.earliest_time())) + } + + /// Gets the latest times of a list of edges + fn latest_time(self) -> Self::IterType> { + Box::new(self.map(|e| e.latest_time())) + } + + fn time(self) -> Self::IterType> { + Box::new(self.map(|it| it.time())) + } + + fn layer_name(self) -> Self::IterType> { + Box::new(self.map(|it| it.layer_name())) + } +} + +pub type EdgeList = Box> + Send>; + +#[cfg(test)] +mod test_edge { + use crate::{ + core::{ArcStr, IntoPropMap}, + prelude::*, + }; + use itertools::Itertools; + use std::collections::HashMap; + + #[test] + fn test_properties() { + let g = Graph::new(); + let props = [(ArcStr::from("test"), "test".into_prop())]; + g.add_edge(0, 1, 2, NO_PROPS, None).unwrap(); + g.add_edge(2, 1, 2, props.clone(), None).unwrap(); + + let e1 = g.edge(1, 2).unwrap(); + let e1_w = g.window(0, 1).edge(1, 2).unwrap(); + assert_eq!(HashMap::from_iter(e1.properties().as_vec()), props.into()); + assert!(e1_w.properties().as_vec().is_empty()) + } + + #[test] + fn test_constant_properties() { + let g = Graph::new(); + g.add_edge(1, 1, 2, NO_PROPS, Some("layer 1")) + .unwrap() + .add_constant_properties([("test_prop", "test_val")], Some("layer 1")) + .unwrap(); + g.add_edge(1, 2, 3, NO_PROPS, Some("layer 2")) + .unwrap() + .add_constant_properties([("test_prop", "test_val")], Some("layer 2")) + .unwrap(); + + assert_eq!( + g.edge(1, 2) + .unwrap() + .properties() + .constant() + .get("test_prop"), + Some([("layer 1", "test_val")].into_prop_map()) + ); + assert_eq!( + g.edge(2, 3) + .unwrap() + .properties() + .constant() + .get("test_prop"), + Some([("layer 2", 
"test_val")].into_prop_map()) + ); + for e in g.edges() { + for ee in e.explode() { + assert_eq!( + ee.properties().constant().get("test_prop"), + Some("test_val".into()) + ) + } + } + } + + #[test] + fn test_property_additions() { + let g = Graph::new(); + let props = [("test", "test")]; + let e1 = g.add_edge(0, 1, 2, NO_PROPS, None).unwrap(); + e1.add_updates(2, props, None).unwrap(); // same layer works + assert!(e1.add_updates(2, props, Some("test2")).is_err()); // different layer is error + let e = g.edge(1, 2).unwrap(); + e.add_updates(2, props, Some("test2")).unwrap(); // non-restricted edge view can create new layers + let layered_views = e.explode_layers().collect_vec(); + for ev in layered_views { + let layer = ev.layer_name().unwrap(); + assert!(ev.add_updates(1, props, Some("test")).is_err()); // restricted edge view cannot create updates in different layer + ev.add_updates(1, [("test2", layer)], None).unwrap() // this will add an update to the same layer as the view (not the default layer) + } + let e1_w = e1.window(0, 1); + assert_eq!( + e1.properties().as_map(), + props + .into_iter() + .map(|(k, v)| (ArcStr::from(k), v.into_prop())) + .chain([(ArcStr::from("test2"), "_default".into_prop())]) + .collect() + ); + assert_eq!( + e.layer("test2").unwrap().properties().as_map(), + props + .into_iter() + .map(|(k, v)| (ArcStr::from(k), v.into_prop())) + .chain([(ArcStr::from("test2"), "test2".into_prop())]) + .collect() + ); + assert_eq!(e1_w.properties().as_map(), HashMap::default()) + } + + #[test] + fn test_constant_property_additions() { + let g = Graph::new(); + let e = g.add_edge(0, 1, 2, NO_PROPS, Some("test")).unwrap(); + assert!(e + .add_constant_properties([("test1", "test1")], None) + .is_ok()); // adds properties to layer `"test"` + assert!(e + .add_constant_properties([("test", "test")], Some("test2")) + .is_err()); // cannot add properties to a different layer + e.add_constant_properties([("test", "test")], Some("test")) + .unwrap(); // layer 
is consistent + assert_eq!(e.properties().get("test"), Some("test".into())); + assert_eq!(e.properties().get("test1"), Some("test1".into())); + } + + #[test] + fn test_layers_earliest_time() { + let g = Graph::new(); + let e = g.add_edge(1, 1, 2, NO_PROPS, Some("test")).unwrap(); + assert_eq!(e.earliest_time(), Some(1)); + } +} diff --git a/raphtory/src/db/graph/graph.rs b/raphtory/src/db/graph/graph.rs new file mode 100644 index 0000000000..332a5ec18a --- /dev/null +++ b/raphtory/src/db/graph/graph.rs @@ -0,0 +1,1577 @@ +//! Defines the `Graph` struct, which represents a raphtory graph in memory. +//! +//! This is the base class used to create a temporal graph, add vertices and edges, +//! create windows, and query the graph with a variety of algorithms. +//! It is a wrapper around a set of shards, which are the actual graph data structures. +//! +//! # Examples +//! +//! ```rust +//! use raphtory::prelude::*; +//! let graph = Graph::new(); +//! graph.add_vertex(0, "Alice", NO_PROPS).unwrap(); +//! graph.add_vertex(1, "Bob", NO_PROPS).unwrap(); +//! graph.add_edge(2, "Alice", "Bob", NO_PROPS, None).unwrap(); +//! graph.count_edges(); +//! ``` +//! 
+ +use crate::{ + core::{entities::graph::tgraph::InnerTemporalGraph, utils::errors::GraphError}, + db::api::{ + mutation::internal::{InheritAdditionOps, InheritPropertyAdditionOps}, + view::internal::{Base, DynamicGraph, InheritViewOps, IntoDynamic, MaterializedGraph}, + }, + prelude::*, +}; +use serde::{Deserialize, Serialize}; +use std::{ + fmt::{Display, Formatter}, + path::Path, + sync::Arc, +}; + +const SEG: usize = 16; +pub(crate) type InternalGraph = InnerTemporalGraph; + +#[repr(transparent)] +#[derive(Debug, Clone, Serialize, Deserialize, Default)] +pub struct Graph(pub Arc); + +pub fn graph_equal(g1: &G1, g2: &G2) -> bool { + if g1.count_vertices() == g2.count_vertices() && g1.count_edges() == g2.count_edges() { + g1.vertices().id().all(|v| g2.has_vertex(v)) && // all vertices exist in other + g1.edges().explode().count() == g2.edges().explode().count() && // same number of exploded edges + g1.edges().explode().all(|e| { // all exploded edges exist in other + g2 + .edge(e.src().id(), e.dst().id()) + .filter(|ee| ee.active(e.time().expect("exploded"))) + .is_some() + }) + } else { + false + } +} + +impl Display for Graph { + fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result { + write!(f, "{}", self.0) + } +} + +impl From for Graph { + fn from(value: InternalGraph) -> Self { + Self(Arc::new(value)) + } +} + +impl PartialEq for Graph { + fn eq(&self, other: &G) -> bool { + graph_equal(self, other) + } +} + +impl Base for Graph { + type Base = InternalGraph; + + #[inline(always)] + fn base(&self) -> &InternalGraph { + &self.0 + } +} + +impl InheritAdditionOps for Graph {} +impl InheritPropertyAdditionOps for Graph {} +impl InheritViewOps for Graph {} + +impl Graph { + /// Create a new graph with the specified number of shards + /// + /// # Returns + /// + /// A raphtory graph + /// + /// # Example + /// + /// ``` + /// use raphtory::prelude::Graph; + /// let g = Graph::new(); + /// ``` + pub fn new() -> Self { + 
Self(Arc::new(InternalGraph::default())) + } + + pub(crate) fn new_from_inner(inner: Arc) -> Self { + Self(inner) + } + + /// Load a graph from a directory + /// + /// # Arguments + /// + /// * `path` - The path to the directory + /// + /// # Returns + /// + /// A raphtory graph + /// + /// # Example + /// + /// ```no_run + /// use raphtory::prelude::Graph; + /// let g = Graph::load_from_file("path/to/graph"); + /// ``` + pub fn load_from_file>(path: P) -> Result { + let g = MaterializedGraph::load_from_file(path)?; + g.into_events().ok_or(GraphError::GraphLoadError) + } + + /// Save a graph to a directory + pub fn save_to_file>(&self, path: P) -> Result<(), GraphError> { + MaterializedGraph::from(self.clone()).save_to_file(path) + } + + pub fn as_arc(&self) -> Arc { + self.0.clone() + } +} + +impl IntoDynamic for Graph { + fn into_dynamic(self) -> DynamicGraph { + DynamicGraph::new(self) + } +} + +#[cfg(test)] +mod db_tests { + use super::*; + use crate::{ + core::{ + utils::time::{error::ParseTimeError, TryIntoTime}, + ArcStr, Prop, + }, + db::{ + api::view::{ + EdgeListOps, EdgeViewOps, GraphViewOps, Layer, LayerOps, TimeOps, VertexViewOps, + }, + graph::{edge::EdgeView, path::PathFromVertex}, + }, + graphgen::random_attachment::random_attachment, + prelude::{AdditionOps, PropertyAdditionOps}, + }; + use chrono::NaiveDateTime; + use itertools::Itertools; + use quickcheck::Arbitrary; + use rayon::prelude::*; + use std::collections::{HashMap, HashSet}; + use tempdir::TempDir; + + #[quickcheck] + fn test_multithreaded_add_edge(edges: Vec<(u64, u64)>) -> bool { + let g = Graph::new(); + edges.par_iter().enumerate().for_each(|(t, (i, j))| { + g.add_edge(t as i64, *i, *j, NO_PROPS, None).unwrap(); + }); + edges + .iter() + .all(|(i, j)| g.has_edge(*i, *j, Layer::Default)) + && g.count_temporal_edges() == edges.len() + } + + #[quickcheck] + fn add_vertex_grows_graph_len(vs: Vec<(i64, u64)>) { + let g = Graph::new(); + + let expected_len = vs.iter().map(|(_, v)| 
v).sorted().dedup().count(); + for (t, v) in vs { + g.add_vertex(t, v, NO_PROPS) + .map_err(|err| println!("{:?}", err)) + .ok(); + } + + assert_eq!(g.count_vertices(), expected_len) + } + + #[quickcheck] + fn add_vertex_gets_names(vs: Vec) -> bool { + let g = Graph::new(); + + let expected_len = vs.iter().sorted().dedup().count(); + for (t, name) in vs.iter().enumerate() { + g.add_vertex(t as i64, name.clone(), NO_PROPS) + .map_err(|err| println!("{:?}", err)) + .ok(); + } + + assert_eq!(g.count_vertices(), expected_len); + + vs.iter().all(|name| { + let v = g.vertex(name.clone()).unwrap(); + v.name() == name.clone() + }) + } + + #[quickcheck] + fn add_edge_grows_graph_edge_len(edges: Vec<(i64, u64, u64)>) { + let g = Graph::new(); + + let unique_vertices_count = edges + .iter() + .flat_map(|(_, src, dst)| vec![src, dst]) + .sorted() + .dedup() + .count(); + + let unique_edge_count = edges + .iter() + .map(|(_, src, dst)| (src, dst)) + .unique() + .count(); + + for (t, src, dst) in edges { + g.add_edge(t, src, dst, NO_PROPS, None).unwrap(); + } + + assert_eq!(g.count_vertices(), unique_vertices_count); + assert_eq!(g.count_edges(), unique_edge_count); + } + + #[quickcheck] + fn add_edge_works(edges: Vec<(i64, u64, u64)>) -> bool { + let g = Graph::new(); + for &(t, src, dst) in edges.iter() { + g.add_edge(t, src, dst, NO_PROPS, None).unwrap(); + } + + edges + .iter() + .all(|&(_, src, dst)| g.has_edge(src, dst, Layer::All)) + } + + #[quickcheck] + fn get_edge_works(edges: Vec<(i64, u64, u64)>) -> bool { + let g = Graph::new(); + for &(t, src, dst) in edges.iter() { + g.add_edge(t, src, dst, NO_PROPS, None).unwrap(); + } + + edges + .iter() + .all(|&(_, src, dst)| g.edge(src, dst).is_some()) + } + + #[test] + fn graph_save_to_load_from_file() { + let vs = vec![ + (1, 1, 2), + (2, 1, 3), + (-1, 2, 1), + (0, 1, 1), + (7, 3, 2), + (1, 1, 1), + ]; + + let g = Graph::new(); + + for (t, src, dst) in &vs { + g.add_edge(*t, *src, *dst, NO_PROPS, None).unwrap(); + } + + let 
tmp_raphtory_path: TempDir = + TempDir::new("raphtory").expect("Failed to create tempdir"); + + let graph_path = format!("{}/graph.bin", tmp_raphtory_path.path().display()); + g.save_to_file(&graph_path).expect("Failed to save graph"); + + // Load from files + let g2 = Graph::load_from_file(&graph_path).expect("Failed to load graph"); + + assert_eq!(g, g2); + + let _ = tmp_raphtory_path.close(); + } + + #[test] + fn has_edge() { + let g = Graph::new(); + g.add_edge(1, 7, 8, NO_PROPS, None).unwrap(); + + assert!(!g.has_edge(8, 7, Layer::All)); + assert!(g.has_edge(7, 8, Layer::All)); + + g.add_edge(1, 7, 9, NO_PROPS, None).unwrap(); + + assert!(!g.has_edge(9, 7, Layer::All)); + assert!(g.has_edge(7, 9, Layer::All)); + + g.add_edge(2, "haaroon", "northLondon", NO_PROPS, None) + .unwrap(); + assert!(g.has_edge("haaroon", "northLondon", Layer::All)); + } + + #[test] + fn graph_edge() { + let g = Graph::new(); + let es = vec![ + (1, 1, 2), + (2, 1, 3), + (-1, 2, 1), + (0, 1, 1), + (7, 3, 2), + (1, 1, 1), + ]; + for (t, src, dst) in es { + g.add_edge(t, src, dst, NO_PROPS, None).unwrap(); + } + + let e = g + .window(i64::MIN, i64::MAX) + .layer(Layer::Default) + .unwrap() + .edge(1, 3) + .unwrap(); + assert_eq!(e.src().id(), 1u64); + assert_eq!(e.dst().id(), 3u64); + } + + #[test] + fn graph_degree_window() { + let vs = vec![ + (1, 1, 2), + (2, 1, 3), + (-1, 2, 1), + (0, 1, 1), + (7, 3, 2), + (1, 1, 1), + ]; + + let g = Graph::new(); + + for (t, src, dst) in &vs { + g.add_edge(*t, *src, *dst, NO_PROPS, None).unwrap(); + } + + let expected = vec![(2, 3, 1), (1, 0, 0), (1, 0, 0)]; + let actual = (1..=3) + .map(|i| { + let v = g.vertex(i).unwrap(); + ( + v.window(-1, 7).in_degree(), + v.window(1, 7).out_degree(), + v.window(0, 1).degree(), + ) + }) + .collect::>(); + + assert_eq!(actual, expected); + } + + #[test] + fn graph_edges_window() { + let vs = vec![ + (1, 1, 2), + (2, 1, 3), + (-1, 2, 1), + (0, 1, 1), + (7, 3, 2), + (1, 1, 1), + ]; + + let g = Graph::new(); + + for 
(t, src, dst) in &vs { + g.add_edge(*t, *src, *dst, NO_PROPS, None).unwrap(); + } + + let expected = vec![(2, 3, 2), (1, 0, 0), (1, 0, 0)]; + let actual = (1..=3) + .map(|i| { + let v = g.vertex(i).unwrap(); + ( + v.window(-1, 7).in_edges().collect::>().len(), + v.window(1, 7).out_edges().collect::>().len(), + v.window(0, 1).edges().collect::>().len(), + ) + }) + .collect::>(); + + assert_eq!(actual, expected); + } + + #[test] + fn time_test() { + let g = Graph::new(); + + assert_eq!(g.latest_time(), None); + assert_eq!(g.earliest_time(), None); + + g.add_vertex(5, 1, NO_PROPS) + .map_err(|err| println!("{:?}", err)) + .ok(); + + assert_eq!(g.latest_time(), Some(5)); + assert_eq!(g.earliest_time(), Some(5)); + + let g = Graph::new(); + + g.add_edge(10, 1, 2, NO_PROPS, None).unwrap(); + assert_eq!(g.latest_time(), Some(10)); + assert_eq!(g.earliest_time(), Some(10)); + + g.add_vertex(5, 1, NO_PROPS) + .map_err(|err| println!("{:?}", err)) + .ok(); + assert_eq!(g.latest_time(), Some(10)); + assert_eq!(g.earliest_time(), Some(5)); + + g.add_edge(20, 3, 4, NO_PROPS, None).unwrap(); + assert_eq!(g.latest_time(), Some(20)); + assert_eq!(g.earliest_time(), Some(5)); + + random_attachment(&g, 100, 10); + assert_eq!(g.latest_time(), Some(126)); + assert_eq!(g.earliest_time(), Some(5)); + } + + #[test] + fn static_properties() { + let g = Graph::new(); + g.add_edge(0, 11, 22, NO_PROPS, None).unwrap(); + g.add_edge( + 0, + 11, + 11, + vec![("temp".to_string(), Prop::Bool(true))], + None, + ) + .unwrap(); + g.add_edge(0, 22, 33, NO_PROPS, None).unwrap(); + g.add_edge(0, 33, 11, NO_PROPS, None).unwrap(); + g.add_vertex(0, 11, vec![("temp".to_string(), Prop::Bool(true))]) + .unwrap(); + g.add_edge(0, 44, 55, NO_PROPS, None).unwrap(); + let v11 = g.vertex(11).unwrap(); + let v22 = g.vertex(22).unwrap(); + let v33 = g.vertex(33).unwrap(); + let v44 = g.vertex(44).unwrap(); + let v55 = g.vertex(55).unwrap(); + let edge1111 = g.edge(&v11, &v11).unwrap(); + let edge2233 = 
g.edge(&v22, &v33).unwrap(); + let edge3311 = g.edge(&v33, &v11).unwrap(); + + v11.add_constant_properties(vec![("a", Prop::U64(11)), ("b", Prop::I64(11))]) + .unwrap(); + v11.add_constant_properties(vec![("c", Prop::U32(11))]) + .unwrap(); + + v44.add_constant_properties(vec![("e", Prop::U8(1))]) + .unwrap(); + v55.add_constant_properties(vec![("f", Prop::U16(1))]) + .unwrap(); + edge1111 + .add_constant_properties(vec![("d", Prop::U64(1111))], None) + .unwrap(); + edge3311 + .add_constant_properties(vec![("a", Prop::U64(3311))], None) + .unwrap(); + + // cannot change property type + assert!(v22 + .add_constant_properties(vec![("b", Prop::U64(22))]) + .is_err()); + + assert_eq!(v11.properties().constant().keys(), vec!["a", "b", "c"]); + assert!(v22.properties().constant().keys().is_empty()); + assert!(v33.properties().constant().keys().is_empty()); + assert_eq!(v44.properties().constant().keys(), vec!["e"]); + assert_eq!(v55.properties().constant().keys(), vec!["f"]); + assert_eq!(edge1111.properties().constant().keys(), vec!["d"]); + assert_eq!(edge3311.properties().constant().keys(), vec!["a"]); + assert!(edge2233.properties().constant().keys().is_empty()); + + assert_eq!(v11.properties().constant().get("a"), Some(Prop::U64(11))); + assert_eq!(v11.properties().constant().get("b"), Some(Prop::I64(11))); + assert_eq!(v11.properties().constant().get("c"), Some(Prop::U32(11))); + assert_eq!(v22.properties().constant().get("b"), None); + assert_eq!(v44.properties().constant().get("e"), Some(Prop::U8(1))); + assert_eq!(v55.properties().constant().get("f"), Some(Prop::U16(1))); + assert_eq!(v22.properties().constant().get("a"), None); + assert_eq!( + edge1111.properties().constant().get("d"), + Some(Prop::U64(1111)) + ); + assert_eq!( + edge3311.properties().constant().get("a"), + Some(Prop::U64(3311)) + ); + assert_eq!(edge2233.properties().constant().get("a"), None); + } + + #[test] + fn temporal_props_vertex() { + let g = Graph::new(); + + g.add_vertex(0, 1, 
[("cool".to_string(), Prop::Bool(true))]) + .unwrap(); + + let v = g.vertex(1).unwrap(); + + let actual = v.properties().get("cool"); + assert_eq!(actual, Some(Prop::Bool(true))); + + // we flip cool from true to false after t 3 + g.add_vertex(3, 1, [("cool".to_string(), Prop::Bool(false))]) + .unwrap(); + + let wg = g.window(3, 15); + let v = wg.vertex(1).unwrap(); + + let actual = v.properties().get("cool"); + assert_eq!(actual, Some(Prop::Bool(false))); + + let hist: Vec<_> = v + .properties() + .temporal() + .get("cool") + .unwrap() + .iter() + .collect(); + assert_eq!(hist, vec![(3, Prop::Bool(false))]); + + let v = g.vertex(1).unwrap(); + + let hist: Vec<_> = v + .properties() + .temporal() + .get("cool") + .unwrap() + .iter() + .collect(); + assert_eq!(hist, vec![(0, Prop::Bool(true)), (3, Prop::Bool(false))]); + } + + #[test] + fn temporal_props_edge() { + let g = Graph::new(); + + g.add_edge(1, 0, 1, vec![("distance".to_string(), Prop::U32(5))], None) + .expect("add edge"); + + let e = g.edge(0, 1).unwrap(); + + let prop = e.properties().get("distance").unwrap(); + assert_eq!(prop, Prop::U32(5)); + } + + #[test] + fn graph_neighbours_window() { + let vs = vec![ + (1, 1, 2), + (2, 1, 3), + (-1, 2, 1), + (0, 1, 1), + (7, 3, 2), + (1, 1, 1), + ]; + + let g = Graph::new(); + + for (t, src, dst) in &vs { + g.add_edge(*t, *src, *dst, NO_PROPS, None).unwrap(); + } + + let expected = vec![ + (vec![1, 2], vec![1, 2, 3], vec![1]), + (vec![1], vec![], vec![]), + (vec![1], vec![], vec![]), + ]; + let actual = (1..=3) + .map(|i| { + let v = g.vertex(i).unwrap(); + ( + v.window(-1, 7).in_neighbours().id().collect::>(), + v.window(1, 7).out_neighbours().id().collect::>(), + v.window(0, 1).neighbours().id().collect::>(), + ) + }) + .collect::>(); + + assert_eq!(actual, expected); + } + + #[test] + fn test_time_range_on_empty_graph() { + let g = Graph::new(); + + let rolling = g.rolling(1, None).unwrap().collect_vec(); + assert!(rolling.is_empty()); + + let expanding = 
g.expanding(1).unwrap().collect_vec(); + assert!(expanding.is_empty()); + } + + #[test] + fn test_add_vertex_with_strings() { + let g = Graph::new(); + + g.add_vertex(0, "haaroon", NO_PROPS).unwrap(); + g.add_vertex(1, "hamza", NO_PROPS).unwrap(); + g.add_vertex(1, 831, NO_PROPS).unwrap(); + + assert!(g.has_vertex(831)); + assert!(g.has_vertex("haaroon")); + assert!(g.has_vertex("hamza")); + + assert_eq!(g.count_vertices(), 3); + } + + #[test] + fn layers() -> Result<(), GraphError> { + let g = Graph::new(); + g.add_edge(0, 11, 22, NO_PROPS, None)?; + g.add_edge(0, 11, 33, NO_PROPS, None)?; + g.add_edge(0, 33, 11, NO_PROPS, None)?; + g.add_edge(0, 11, 22, NO_PROPS, Some("layer1"))?; + g.add_edge(0, 11, 33, NO_PROPS, Some("layer2"))?; + g.add_edge(0, 11, 44, NO_PROPS, Some("layer2"))?; + + assert!(g.has_edge(11, 22, Layer::All)); + assert!(g.has_edge(11, 22, Layer::Default)); + assert!(!g.has_edge(11, 44, Layer::Default)); + assert!(!g.has_edge(11, 22, "layer2")); + assert!(g.has_edge(11, 44, "layer2")); + + assert!(g.edge(11, 22).is_some()); + assert!(g.layer(Layer::Default).unwrap().edge(11, 44).is_none()); + assert!(g.edge(11, 22).unwrap().layer("layer2").is_none()); + assert!(g.edge(11, 44).unwrap().layer("layer2").is_some()); + + let dft_layer = g.default_layer(); + let layer1 = g.layer("layer1").expect("layer1"); + let layer2 = g.layer("layer2").expect("layer2"); + assert!(g.layer("missing layer").is_none()); + + assert_eq!(g.count_vertices(), 4); + assert_eq!(g.count_edges(), 4); + assert_eq!(dft_layer.count_edges(), 3); + assert_eq!(layer1.count_edges(), 1); + assert_eq!(layer2.count_edges(), 2); + + let vertex = g.vertex(11).unwrap(); + let vertex_dft = dft_layer.vertex(11).unwrap(); + let vertex1 = layer1.vertex(11).unwrap(); + let vertex2 = layer2.vertex(11).unwrap(); + + assert_eq!(vertex.degree(), 3); + assert_eq!(vertex_dft.degree(), 2); + assert_eq!(vertex1.degree(), 1); + assert_eq!(vertex2.degree(), 2); + + assert_eq!(vertex.out_degree(), 3); + 
assert_eq!(vertex_dft.out_degree(), 2); + assert_eq!(vertex1.out_degree(), 1); + assert_eq!(vertex2.out_degree(), 2); + + assert_eq!(vertex.in_degree(), 1); + assert_eq!(vertex_dft.in_degree(), 1); + assert_eq!(vertex1.in_degree(), 0); + assert_eq!(vertex2.in_degree(), 0); + + fn to_tuples>>( + edges: I, + ) -> Vec<(u64, u64)> { + edges + .map(|e| (e.src().id(), e.dst().id())) + .sorted() + .collect_vec() + } + + assert_eq!( + to_tuples(vertex.edges()), + vec![(11, 22), (11, 33), (11, 44), (33, 11)] + ); + assert_eq!( + to_tuples(vertex_dft.edges()), + vec![(11, 22), (11, 33), (33, 11)] + ); + assert_eq!(to_tuples(vertex1.edges()), vec![(11, 22)]); + assert_eq!(to_tuples(vertex2.edges()), vec![(11, 33), (11, 44)]); + + assert_eq!(to_tuples(vertex.in_edges()), vec![(33, 11)]); + assert_eq!(to_tuples(vertex_dft.in_edges()), vec![(33, 11)]); + assert_eq!(to_tuples(vertex1.in_edges()), vec![]); + assert_eq!(to_tuples(vertex2.in_edges()), vec![]); + + assert_eq!( + to_tuples(vertex.out_edges()), + vec![(11, 22), (11, 33), (11, 44)] + ); + assert_eq!(to_tuples(vertex_dft.out_edges()), vec![(11, 22), (11, 33)]); + assert_eq!(to_tuples(vertex1.out_edges()), vec![(11, 22)]); + assert_eq!(to_tuples(vertex2.out_edges()), vec![(11, 33), (11, 44)]); + + fn to_ids(neighbours: PathFromVertex) -> Vec { + neighbours.iter().map(|n| n.id()).sorted().collect_vec() + } + + assert_eq!(to_ids(vertex.neighbours()), vec![22, 33, 44]); + assert_eq!(to_ids(vertex_dft.neighbours()), vec![22, 33]); + assert_eq!(to_ids(vertex1.neighbours()), vec![22]); + assert_eq!(to_ids(vertex2.neighbours()), vec![33, 44]); + + assert_eq!(to_ids(vertex.out_neighbours()), vec![22, 33, 44]); + assert_eq!(to_ids(vertex_dft.out_neighbours()), vec![22, 33]); + assert_eq!(to_ids(vertex1.out_neighbours()), vec![22]); + assert_eq!(to_ids(vertex2.out_neighbours()), vec![33, 44]); + + assert_eq!(to_ids(vertex.in_neighbours()), vec![33]); + assert_eq!(to_ids(vertex_dft.in_neighbours()), vec![33]); + 
assert!(to_ids(vertex1.in_neighbours()).is_empty()); + assert!(to_ids(vertex2.in_neighbours()).is_empty()); + Ok(()) + } + + #[test] + fn test_exploded_edge() { + let g = Graph::new(); + g.add_edge(0, 1, 2, [("weight", Prop::I64(1))], None) + .unwrap(); + g.add_edge(1, 1, 2, [("weight", Prop::I64(2))], None) + .unwrap(); + g.add_edge(2, 1, 2, [("weight", Prop::I64(3))], None) + .unwrap(); + + let exploded = g.edge(1, 2).unwrap().explode(); + + let res = exploded.map(|e| e.properties().as_vec()).collect_vec(); + + let mut expected = Vec::new(); + for i in 1..4 { + expected.push(vec![("weight".into(), Prop::I64(i))]); + } + + assert_eq!(res, expected); + + let e = g + .vertex(1) + .unwrap() + .edges() + .explode() + .map(|e| e.properties().as_vec()) + .collect_vec(); + assert_eq!(e, expected); + } + + #[test] + fn test_edge_earliest_latest() { + let g = Graph::new(); + g.add_edge(0, 1, 2, NO_PROPS, None).unwrap(); + g.add_edge(1, 1, 2, NO_PROPS, None).unwrap(); + g.add_edge(2, 1, 2, NO_PROPS, None).unwrap(); + g.add_edge(0, 1, 3, NO_PROPS, None).unwrap(); + g.add_edge(1, 1, 3, NO_PROPS, None).unwrap(); + g.add_edge(2, 1, 3, NO_PROPS, None).unwrap(); + + let mut res = g.edge(1, 2).unwrap().earliest_time().unwrap(); + assert_eq!(res, 0); + + res = g.edge(1, 2).unwrap().latest_time().unwrap(); + assert_eq!(res, 2); + + res = g.at(1).edge(1, 2).unwrap().earliest_time().unwrap(); + assert_eq!(res, 0); + + res = g.at(1).edge(1, 2).unwrap().latest_time().unwrap(); + assert_eq!(res, 1); + + let res_list: Vec = g + .vertex(1) + .unwrap() + .edges() + .earliest_time() + .flatten() + .collect(); + assert_eq!(res_list, vec![0, 0]); + + let res_list: Vec = g + .vertex(1) + .unwrap() + .edges() + .latest_time() + .flatten() + .collect(); + assert_eq!(res_list, vec![2, 2]); + + let res_list: Vec = g + .vertex(1) + .unwrap() + .at(1) + .edges() + .earliest_time() + .flatten() + .collect(); + assert_eq!(res_list, vec![0, 0]); + + let res_list: Vec = g + .vertex(1) + .unwrap() + 
.at(1) + .edges() + .latest_time() + .flatten() + .collect(); + assert_eq!(res_list, vec![1, 1]); + } + + #[test] + fn check_vertex_history() { + let g = Graph::new(); + + g.add_vertex(1, 1, NO_PROPS).unwrap(); + g.add_vertex(2, 1, NO_PROPS).unwrap(); + g.add_vertex(3, 1, NO_PROPS).unwrap(); + g.add_vertex(4, 1, NO_PROPS).unwrap(); + g.add_vertex(8, 1, NO_PROPS).unwrap(); + + g.add_vertex(4, "Lord Farquaad", NO_PROPS).unwrap(); + g.add_vertex(6, "Lord Farquaad", NO_PROPS).unwrap(); + g.add_vertex(7, "Lord Farquaad", NO_PROPS).unwrap(); + g.add_vertex(8, "Lord Farquaad", NO_PROPS).unwrap(); + + let times_of_one = g.vertex(1).unwrap().history(); + let times_of_farquaad = g.vertex("Lord Farquaad").unwrap().history(); + + assert_eq!(times_of_one, [1, 2, 3, 4, 8]); + assert_eq!(times_of_farquaad, [4, 6, 7, 8]); + + let view = g.window(1, 8); + + let windowed_times_of_one = view.vertex(1).unwrap().history(); + let windowed_times_of_farquaad = view.vertex("Lord Farquaad").unwrap().history(); + assert_eq!(windowed_times_of_one, [1, 2, 3, 4]); + assert_eq!(windowed_times_of_farquaad, [4, 6, 7]); + } + + #[test] + fn check_edge_history() { + let g = Graph::new(); + + g.add_edge(1, 1, 2, NO_PROPS, None).unwrap(); + g.add_edge(2, 1, 3, NO_PROPS, None).unwrap(); + g.add_edge(3, 1, 2, NO_PROPS, None).unwrap(); + g.add_edge(4, 1, 4, NO_PROPS, None).unwrap(); + + let times_of_onetwo = g.edge(1, 2).unwrap().history(); + let times_of_four = g.edge(1, 4).unwrap().window(1, 5).history(); + let view = g.window(2, 5); + let windowed_times_of_four = view.edge(1, 4).unwrap().window(2, 4).history(); + + assert_eq!(times_of_onetwo, [1, 3]); + assert_eq!(times_of_four, [4]); + assert!(windowed_times_of_four.is_empty()); + } + + #[test] + fn check_edge_history_on_multiple_shards() { + let g = Graph::new(); + + g.add_edge(1, 1, 2, NO_PROPS, None).unwrap(); + g.add_edge(2, 1, 3, NO_PROPS, None).unwrap(); + g.add_edge(3, 1, 2, NO_PROPS, None).unwrap(); + g.add_edge(4, 1, 4, NO_PROPS, 
None).unwrap(); + g.add_edge(5, 1, 4, NO_PROPS, None).unwrap(); + g.add_edge(6, 1, 4, NO_PROPS, None).unwrap(); + g.add_edge(7, 1, 4, NO_PROPS, None).unwrap(); + g.add_edge(8, 1, 4, NO_PROPS, None).unwrap(); + g.add_edge(9, 1, 4, NO_PROPS, None).unwrap(); + g.add_edge(10, 1, 4, NO_PROPS, None).unwrap(); + + let times_of_onetwo = g.edge(1, 2).unwrap().history(); + let times_of_four = g.edge(1, 4).unwrap().window(1, 5).history(); + let times_of_outside_window = g.edge(1, 4).unwrap().window(1, 4).history(); + let times_of_four_higher = g.edge(1, 4).unwrap().window(6, 11).history(); + + let view = g.window(1, 11); + let windowed_times_of_four = view.edge(1, 4).unwrap().window(2, 5).history(); + let windowed_times_of_four_higher = view.edge(1, 4).unwrap().window(8, 11).history(); + + assert_eq!(times_of_onetwo, [1, 3]); + assert_eq!(times_of_four, [4]); + assert_eq!(times_of_four_higher, [6, 7, 8, 9, 10]); + assert!(times_of_outside_window.is_empty()); + assert_eq!(windowed_times_of_four, [4]); + assert_eq!(windowed_times_of_four_higher, [8, 9, 10]); + } + + #[test] + fn check_vertex_history_multiple_shards() { + let g = Graph::new(); + + g.add_vertex(1, 1, NO_PROPS).unwrap(); + g.add_vertex(2, 1, NO_PROPS).unwrap(); + g.add_vertex(3, 1, NO_PROPS).unwrap(); + g.add_vertex(4, 1, NO_PROPS).unwrap(); + g.add_vertex(5, 2, NO_PROPS).unwrap(); + g.add_vertex(6, 2, NO_PROPS).unwrap(); + g.add_vertex(7, 2, NO_PROPS).unwrap(); + g.add_vertex(8, 1, NO_PROPS).unwrap(); + g.add_vertex(9, 2, NO_PROPS).unwrap(); + g.add_vertex(10, 2, NO_PROPS).unwrap(); + + g.add_vertex(4, "Lord Farquaad", NO_PROPS).unwrap(); + g.add_vertex(6, "Lord Farquaad", NO_PROPS).unwrap(); + g.add_vertex(7, "Lord Farquaad", NO_PROPS).unwrap(); + g.add_vertex(8, "Lord Farquaad", NO_PROPS).unwrap(); + + let times_of_one = g.vertex(1).unwrap().history(); + let times_of_farquaad = g.vertex("Lord Farquaad").unwrap().history(); + let times_of_upper = g.vertex(2).unwrap().history(); + + assert_eq!(times_of_one, [1, 
2, 3, 4, 8]); + assert_eq!(times_of_farquaad, [4, 6, 7, 8]); + assert_eq!(times_of_upper, [5, 6, 7, 9, 10]); + + let view = g.window(1, 8); + let windowed_times_of_one = view.vertex(1).unwrap().history(); + let windowed_times_of_two = view.vertex(2).unwrap().history(); + let windowed_times_of_farquaad = view.vertex("Lord Farquaad").unwrap().history(); + + assert_eq!(windowed_times_of_one, [1, 2, 3, 4]); + assert_eq!(windowed_times_of_farquaad, [4, 6, 7]); + assert_eq!(windowed_times_of_two, [5, 6, 7]); + } + + #[derive(Debug)] + struct CustomTime<'a>(&'a str, &'a str); + + impl<'a> TryIntoTime for CustomTime<'a> { + fn try_into_time(self) -> Result { + let CustomTime(time, fmt) = self; + let time = NaiveDateTime::parse_from_str(time, fmt)?; + let time = time.timestamp_millis(); + Ok(time) + } + } + + #[test] + fn test_ingesting_timestamps() { + let earliest_time = "2022-06-06 12:34:00".try_into_time().unwrap(); + let latest_time = "2022-06-07 12:34:00".try_into_time().unwrap(); + + let g = Graph::new(); + g.add_vertex("2022-06-06T12:34:00.000", 0, NO_PROPS) + .unwrap(); + g.add_edge("2022-06-07T12:34:00", 1, 2, NO_PROPS, None) + .unwrap(); + assert_eq!(g.earliest_time().unwrap(), earliest_time); + assert_eq!(g.latest_time().unwrap(), latest_time); + + let g = Graph::new(); + let fmt = "%Y-%m-%d %H:%M"; + + g.add_vertex(CustomTime("2022-06-06 12:34", fmt), 0, NO_PROPS) + .unwrap(); + g.add_edge(CustomTime("2022-06-07 12:34", fmt), 1, 2, NO_PROPS, None) + .unwrap(); + assert_eq!(g.earliest_time().unwrap(), earliest_time); + assert_eq!(g.latest_time().unwrap(), latest_time); + } + + #[test] + fn test_prop_display_str() { + let mut prop = Prop::Str("hello".into()); + assert_eq!(format!("{}", prop), "hello"); + + prop = Prop::I32(42); + assert_eq!(format!("{}", prop), "42"); + + prop = Prop::I64(9223372036854775807); + assert_eq!(format!("{}", prop), "9223372036854775807"); + + prop = Prop::U32(4294967295); + assert_eq!(format!("{}", prop), "4294967295"); + + prop = 
Prop::U64(18446744073709551615); + assert_eq!(format!("{}", prop), "18446744073709551615"); + + prop = Prop::U8(255); + assert_eq!(format!("{}", prop), "255"); + + prop = Prop::U16(65535); + assert_eq!(format!("{}", prop), "65535"); + + prop = Prop::F32(3.14159); + assert_eq!(format!("{}", prop), "3.14159"); + + prop = Prop::F64(3.141592653589793); + assert_eq!(format!("{}", prop), "3.141592653589793"); + + prop = Prop::Bool(true); + assert_eq!(format!("{}", prop), "true"); + } + + #[quickcheck] + fn test_graph_constant_props(u64_props: HashMap) -> bool { + let g = Graph::new(); + + let as_props = u64_props + .into_iter() + .map(|(name, value)| (name, Prop::U64(value))) + .collect::>(); + + g.add_constant_properties(as_props.clone()).unwrap(); + + let props_map = as_props.into_iter().collect::>(); + + props_map + .into_iter() + .all(|(name, value)| g.properties().constant().get(&name).unwrap() == value) + } + + #[quickcheck] + fn test_graph_constant_props_names(u64_props: HashMap) -> bool { + let g = Graph::new(); + + let as_props = u64_props + .into_iter() + .map(|(name, value)| (name.into(), Prop::U64(value))) + .collect::>(); + + g.add_constant_properties(as_props.clone()).unwrap(); + + let props_names = as_props + .into_iter() + .map(|(name, _)| name) + .collect::>(); + + g.properties() + .constant() + .keys() + .into_iter() + .collect::>() + == props_names + } + + #[quickcheck] + fn test_graph_temporal_props(str_props: HashMap) -> bool { + let g = Graph::new(); + + let (t0, t1) = (1, 2); + + let (t0_props, t1_props): (Vec<_>, Vec<_>) = str_props + .iter() + .enumerate() + .map(|(i, props)| { + let (name, value) = props; + let value = Prop::from(value); + (name.as_str().into(), value, i % 2) + }) + .partition(|(_, _, i)| *i == 0); + + let t0_props: HashMap = t0_props + .into_iter() + .map(|(name, value, _)| (name, value)) + .collect(); + + let t1_props: HashMap = t1_props + .into_iter() + .map(|(name, value, _)| (name, value)) + .collect(); + + 
g.add_properties(t0, t0_props.clone()).unwrap(); + g.add_properties(t1, t1_props.clone()).unwrap(); + + let check = t0_props.iter().all(|(name, value)| { + g.properties().temporal().get(name).unwrap().at(t0) == Some(value.clone()) + }) && t1_props.iter().all(|(name, value)| { + g.properties().temporal().get(name).unwrap().at(t1) == Some(value.clone()) + }); + if !check { + println!("failed time-specific comparison for {:?}", str_props); + return false; + } + let check = check + && g.at(t0) + .properties() + .temporal() + .iter_latest() + .map(|(k, v)| (k.clone(), v)) + .collect::>() + == t0_props; + if !check { + println!("failed latest value comparison for {:?} at t0", str_props); + return false; + } + let check = check + && t1_props.iter().all(|(k, ve)| { + g.at(t1) + .properties() + .temporal() + .get(k) + .and_then(|v| v.latest()) + == Some(ve.clone()) + }); + if !check { + println!("failed latest value comparison for {:?} at t1", str_props); + return false; + } + check + } + + #[test] + fn test_temporral_edge_props_window() { + let g = Graph::new(); + g.add_edge(1, 1, 2, vec![("weight".to_string(), Prop::I64(1))], None) + .unwrap(); + g.add_edge(2, 1, 2, vec![("weight".to_string(), Prop::I64(2))], None) + .unwrap(); + g.add_edge(3, 1, 2, vec![("weight".to_string(), Prop::I64(3))], None) + .unwrap(); + + let e = g.vertex(1).unwrap().out_edges().next().unwrap(); + let res: HashMap> = e + .window(1, 3) + .properties() + .temporal() + .iter() + .map(|(k, v)| (k.clone(), v.iter().collect())) + .collect(); + + let mut exp = HashMap::new(); + exp.insert( + ArcStr::from("weight"), + vec![(1, Prop::I64(1)), (2, Prop::I64(2))], + ); + assert_eq!(res, exp); + } + + #[test] + fn test_vertex_early_late_times() { + let g = Graph::new(); + g.add_vertex(1, 1, NO_PROPS).unwrap(); + g.add_vertex(2, 1, NO_PROPS).unwrap(); + g.add_vertex(3, 1, NO_PROPS).unwrap(); + + assert_eq!(g.vertex(1).unwrap().earliest_time(), Some(1)); + assert_eq!(g.vertex(1).unwrap().latest_time(), 
Some(3)); + + assert_eq!(g.at(2).vertex(1).unwrap().earliest_time(), Some(1)); + assert_eq!(g.at(2).vertex(1).unwrap().latest_time(), Some(2)); + } + + #[test] + fn test_vertex_ids() { + let g = Graph::new(); + g.add_vertex(1, 1, NO_PROPS).unwrap(); + g.add_vertex(1, 2, NO_PROPS).unwrap(); + g.add_vertex(2, 3, NO_PROPS).unwrap(); + + assert_eq!(g.vertices().id().collect::>(), vec![1, 2, 3]); + + let g_at = g.at(1); + assert_eq!(g_at.vertices().id().collect::>(), vec![1, 2]); + } + + #[test] + fn test_edge_layer_name() -> Result<(), GraphError> { + let g = Graph::new(); + g.add_edge(0, 0, 1, NO_PROPS, None)?; + g.add_edge(0, 0, 1, NO_PROPS, Some("awesome name"))?; + + let what = g + .edges() + .map(|e| (e.src().id(), e.dst().id())) + .collect_vec(); + assert_eq!(what, vec![(0, 1)]); + + let layer_names = g + .edges() + .flat_map(|e| e.layer_names()) + .sorted() + .collect_vec(); + assert_eq!(layer_names, vec!["_default", "awesome name"]); + Ok(()) + } + + #[test] + fn test_edge_from_single_layer() { + let g = Graph::new(); + g.add_edge(0, 1, 2, NO_PROPS, Some("layer")).unwrap(); + + assert!(g.edge(1, 2).is_some()); + assert!(g.layer("layer").unwrap().edge(1, 2).is_some()) + } + + #[test] + fn test_edge_layer_intersect_layer() { + let g = Graph::new(); + + g.add_edge(1, 1, 2, NO_PROPS, Some("layer1")) + .expect("add edge"); + g.add_edge(1, 1, 3, NO_PROPS, Some("layer3")) + .expect("add edge"); + g.add_edge(1, 1, 4, NO_PROPS, None).expect("add edge"); + + let g_layers = g.layer(vec!["layer1", "layer3"]).expect("layer"); + + assert!(g_layers.edge(1, 2).unwrap().layer("layer1").is_some()); + assert!(g_layers.edge(1, 3).unwrap().layer("layer3").is_some()); + assert!(g_layers.edge(1, 2).is_some()); + assert!(g_layers.edge(1, 3).is_some()); + + assert!(g_layers.edge(1, 4).is_none()); + + let one = g_layers.vertex(1).expect("vertex"); + let ns = one.neighbours().iter().map(|v| v.id()).collect::>(); + assert_eq!(ns, vec![2, 3]); + + let g_layers2 = 
g_layers.layer(vec!["layer1"]).expect("layer"); + + assert!(g_layers2.edge(1, 2).unwrap().layer("layer1").is_some()); + assert!(g_layers2.edge(1, 2).is_some()); + + assert!(g_layers2.edge(1, 3).is_none()); + + assert!(g_layers2.edge(1, 4).is_none()); + + let one = g_layers2.vertex(1).expect("vertex"); + let ns = one.neighbours().iter().map(|v| v.id()).collect::>(); + assert_eq!(ns, vec![2]); + } + + #[test] + fn simple_triangle() { + let g = Graph::new(); + + let vs = vec![(1, 1, 2), (2, 1, 3), (3, 2, 1), (4, 3, 2)]; + + for (t, src, dst) in &vs { + g.add_edge(*t, *src, *dst, NO_PROPS, None).unwrap(); + } + + let windowed_graph = g.window(0, 5); + let one = windowed_graph.vertex(1).expect("vertex"); + let ns_win = one.neighbours().id().collect::>(); + + let one = g.vertex(1).expect("vertex"); + let ns = one.neighbours().id().collect::>(); + assert_eq!(ns, vec![2, 3]); + assert_eq!(ns_win, ns); + } + + #[test] + fn test_layer_explode() { + let g = Graph::new(); + g.add_edge(0, 1, 2, NO_PROPS, Some("layer1")).unwrap(); + g.add_edge(1, 1, 2, NO_PROPS, Some("layer2")).unwrap(); + g.add_edge(2, 1, 2, NO_PROPS, Some("layer1")).unwrap(); + g.add_edge(3, 1, 2, NO_PROPS, None).unwrap(); + + let e = g.edge(1, 2).expect("edge"); + + let layer_exploded = e + .explode_layers() + .filter_map(|e| { + e.edge + .layer() + .copied() + .map(|layer| (e.src().id(), e.dst().id(), layer)) + }) + .collect::>(); + + assert_eq!(layer_exploded, vec![(1, 2, 0), (1, 2, 1), (1, 2, 2),]); + } + + #[test] + fn test_layer_explode_window() { + let g = Graph::new(); + g.add_edge(0, 1, 2, NO_PROPS, Some("layer1")).unwrap(); + g.add_edge(1, 1, 2, NO_PROPS, Some("layer2")).unwrap(); + g.add_edge(2, 1, 2, NO_PROPS, Some("layer1")).unwrap(); + g.add_edge(3, 1, 2, NO_PROPS, None).unwrap(); + + let g = g.window(0, 3); + let e = g.edge(1, 2).expect("edge"); + + let layer_exploded = e + .explode_layers() + .filter_map(|e| { + e.edge + .layer() + .copied() + .map(|layer| (e.src().id(), e.dst().id(), layer)) + 
}) + .collect::>(); + + assert_eq!(layer_exploded, vec![(1, 2, 1), (1, 2, 2),]); + } + + #[test] + fn test_layer_explode_stacking() { + let g = Graph::new(); + g.add_edge(0, 1, 2, NO_PROPS, Some("layer1")).unwrap(); + g.add_edge(1, 1, 2, NO_PROPS, Some("layer2")).unwrap(); + g.add_edge(2, 1, 2, NO_PROPS, Some("layer1")).unwrap(); + g.add_edge(3, 1, 2, NO_PROPS, None).unwrap(); + + let e = g.edge(1, 2).expect("edge"); + + let layer_exploded = e + .explode_layers() + .flat_map(|e| { + e.explode().filter_map(|e| { + e.edge + .layer() + .zip(e.time()) + .map(|(layer, t)| (t, e.src().id(), e.dst().id(), *layer)) + }) + }) + .collect::>(); + + assert_eq!( + layer_exploded, + vec![(3, 1, 2, 0), (0, 1, 2, 1), (2, 1, 2, 1), (1, 1, 2, 2),] + ); + } + + #[test] + fn test_layer_explode_stacking_window() { + let g = Graph::new(); + g.add_edge(0, 1, 2, NO_PROPS, Some("layer1")).unwrap(); + g.add_edge(1, 1, 2, NO_PROPS, Some("layer2")).unwrap(); + g.add_edge(2, 1, 2, NO_PROPS, Some("layer1")).unwrap(); + g.add_edge(3, 1, 2, NO_PROPS, None).unwrap(); + + let g = g.window(0, 3); + let e = g.edge(1, 2).expect("edge"); + + let layer_exploded = e + .explode_layers() + .flat_map(|e| { + e.explode().filter_map(|e| { + e.edge + .layer() + .zip(e.time()) + .map(|(layer, t)| (t, e.src().id(), e.dst().id(), *layer)) + }) + }) + .collect::>(); + + assert_eq!( + layer_exploded, + vec![(0, 1, 2, 1), (2, 1, 2, 1), (1, 1, 2, 2),] + ); + } + + #[test] + fn test_multiple_layers_fundamentals() { + let g = Graph::new(); + + g.add_edge(1, 1, 2, [("tx_sent", 10u64)], "btc".into()) + .expect("failed"); + g.add_edge(1, 1, 2, [("tx_sent", 20u64)], "eth".into()) + .expect("failed"); + g.add_edge(1, 1, 2, [("tx_sent", 70u64)], "tether".into()) + .expect("failed"); + + let e = g.edge(1, 2).expect("failed to get edge"); + let sum: u64 = e + .properties() + .temporal() + .get("tx_sent") + .unwrap() + .iter() + .filter_map(|(_, prop)| prop.into_u64()) + .sum(); + + assert_eq!(sum, 100); + + let lg = 
g.layer(vec!["eth", "btc"]).expect("failed to layer graph"); + + let e = lg.edge(1, 2).expect("failed to get edge"); + + let sum_eth_btc: u64 = e + .properties() + .temporal() + .get("tx_sent") + .unwrap() + .iter() + .filter_map(|(_, prop)| prop.into_u64()) + .sum(); + + assert_eq!(sum_eth_btc, 30); + + assert_eq!(lg.count_edges(), 1); + + let e = g.edge(1, 2).expect("failed to get edge"); + + let e_btc = e.layer("btc").expect("failed to get btc layer"); + let e_eth = e.layer("eth").expect("failed to get eth layer"); + + let edge_btc_sum = e_btc + .properties() + .temporal() + .get("tx_sent") + .unwrap() + .iter() + .filter_map(|(_, prop)| prop.into_u64()) + .sum::(); + + let edge_eth_sum = e_eth + .properties() + .temporal() + .get("tx_sent") + .unwrap() + .iter() + .filter_map(|(_, prop)| prop.into_u64()) + .sum::(); + + assert!(edge_btc_sum < edge_eth_sum); + + let e_eth = e_eth + .layer(vec!["eth", "btc"]) + .expect("failed to get eth,btc layers"); + + let eth_sum = e_eth + .properties() + .temporal() + .get("tx_sent") + .unwrap() + .iter() + .filter_map(|(_, prop)| prop.into_u64()) + .sum::(); + + // layer does not have a way to reset yet! 
+ assert_eq!(eth_sum, 20); + } + + #[test] + fn test_unique_layers() { + let g = Graph::new(); + g.add_edge(0, 1, 2, NO_PROPS, Some("layer1")).unwrap(); + g.add_edge(0, 1, 2, NO_PROPS, Some("layer2")).unwrap(); + assert_eq!( + g.layer("layer2").unwrap().unique_layers().collect_vec(), + vec!["layer2"] + ) + } + + #[quickcheck] + fn vertex_from_id_is_consistent(vertices: Vec) -> bool { + let g = Graph::new(); + for v in vertices.iter() { + g.add_vertex(0, *v, NO_PROPS).unwrap(); + } + g.vertices() + .name() + .map(|name| g.vertex(name)) + .all(|v| v.is_some()) + } + + #[quickcheck] + fn exploded_edge_times_is_consistent(edges: Vec<(u64, u64, Vec)>, offset: i64) -> bool { + check_exploded_edge_times_is_consistent(edges, offset) + } + + #[test] + fn exploded_edge_times_is_consistent_1() { + let edges = vec![(0, 0, vec![0, 1])]; + assert!(check_exploded_edge_times_is_consistent(edges, 0)); + } + + fn check_exploded_edge_times_is_consistent( + edges: Vec<(u64, u64, Vec)>, + offset: i64, + ) -> bool { + let mut correct = true; + let mut check = |condition: bool, message: String| { + if !condition { + println!("Failed: {}", message); + } + correct = correct && condition; + }; + // checks that exploded edges are preserved with correct timestamps + let mut edges: Vec<(u64, u64, Vec)> = + edges.into_iter().filter(|e| !e.2.is_empty()).collect(); + // discard edges without timestamps + for e in edges.iter_mut() { + e.2.sort(); + // FIXME: Should not have to do this, see issue https://github.com/Pometry/Raphtory/issues/973 + e.2.dedup(); // add each timestamp only once (multi-edge per timestamp currently not implemented) + } + edges.sort(); + edges.dedup_by_key(|(src, dst, _)| (*src, *dst)); + + let g = Graph::new(); + for (src, dst, times) in edges.iter() { + for t in times.iter() { + g.add_edge(*t, *src, *dst, NO_PROPS, None).unwrap(); + } + } + + let mut actual_edges: Vec<(u64, u64, Vec)> = g + .edges() + .map(|e| { + ( + e.src().id(), + e.dst().id(), + e.explode() + 
.map(|ee| { + check( + ee.earliest_time() == ee.latest_time(), + format!("times mismatched for {:?}", ee), + ); // times are the same for exploded edge + let t = ee.earliest_time().unwrap(); + check( + ee.active(t), + format!("exploded edge {:?} inactive at {}", ee, t), + ); + if t < i64::MAX { + // window is broken at MAX! + check(e.active(t), format!("edge {:?} inactive at {}", e, t)); + } + let t_test = t.saturating_add(offset); + if t_test != t && t_test < i64::MAX && t_test > i64::MIN { + check( + !ee.active(t_test), + format!("exploded edge {:?} active at {}", ee, t_test), + ); + } + t + }) + .collect(), + ) + }) + .collect(); + + for e in actual_edges.iter_mut() { + e.2.sort(); + } + actual_edges.sort(); + check( + actual_edges == edges, + format!( + "actual edges didn't match input actual: {:?}, expected: {:?}", + actual_edges, edges + ), + ); + correct + } + + // non overlaping time intervals + #[derive(Clone, Debug)] + struct Intervals(Vec<(i64, i64)>); + + impl Arbitrary for Intervals { + fn arbitrary(g: &mut quickcheck::Gen) -> Self { + let mut some_nums = Vec::::arbitrary(g); + some_nums.sort(); + let intervals = some_nums + .into_iter() + .tuple_windows() + .filter(|(a, b)| a != b) + .collect_vec(); + Intervals(intervals) + } + } +} diff --git a/raphtory/src/db/graph/mod.rs b/raphtory/src/db/graph/mod.rs new file mode 100644 index 0000000000..0c529d4c55 --- /dev/null +++ b/raphtory/src/db/graph/mod.rs @@ -0,0 +1,6 @@ +pub mod edge; +pub mod graph; +pub mod path; +pub mod vertex; +pub mod vertices; +pub mod views; diff --git a/raphtory/src/db/path.rs b/raphtory/src/db/graph/path.rs similarity index 64% rename from raphtory/src/db/path.rs rename to raphtory/src/db/graph/path.rs index 8953c2f0d0..5fcb4e80e3 100644 --- a/raphtory/src/db/path.rs +++ b/raphtory/src/db/graph/path.rs @@ -1,16 +1,23 @@ -use crate::core::time::IntoTime; -use crate::core::vertex_ref::{LocalVertexRef, VertexRef}; -use crate::core::{Direction, Prop}; -use 
crate::db::edge::EdgeView; -use crate::db::graph_layer::LayeredGraph; -use crate::db::graph_window::WindowedGraph; -use crate::db::vertex::VertexView; -use crate::db::view_api::layer::LayerOps; -use crate::db::view_api::BoxedIter; -use crate::db::view_api::*; -use std::collections::HashMap; -use std::iter; -use std::sync::Arc; +use crate::{ + core::{ + entities::{vertices::vertex_ref::VertexRef, VID}, + utils::time::IntoTime, + Direction, + }, + db::{ + api::{ + properties::Properties, + view::{internal::extend_filter, BoxedIter, Layer, LayerOps}, + }, + graph::{ + edge::EdgeView, + vertex::VertexView, + views::{layer_graph::LayeredGraph, window_graph::WindowedGraph}, + }, + }, + prelude::*, +}; +use std::{iter, sync::Arc}; #[derive(Copy, Clone)] pub enum Operations { @@ -28,25 +35,27 @@ impl Operations { fn op( self, graph: G, - iter: Box + Send>, - ) -> Box + Send> { + iter: Box + Send>, + ) -> Box + Send> { + let layer_ids = graph.layer_ids(); + let edge_filter = graph.edge_filter().cloned(); match self { Operations::Neighbours { dir } => Box::new(iter.flat_map(move |v| { - graph.neighbours(graph.localise_vertex_unchecked(v), dir, None) + graph.neighbours(v, dir, layer_ids.clone(), edge_filter.as_ref()) })), Operations::NeighboursWindow { dir, t_start, t_end, - } => Box::new(iter.flat_map(move |v| { - graph.neighbours_window( - graph.localise_vertex_unchecked(v), - t_start, - t_end, - dir, - None, - ) - })), + } => { + let graph1 = graph.clone(); + let filter = Some(extend_filter(edge_filter, move |e, l| { + graph1.include_edge_window(e, t_start..t_end, l) + })); + Box::new(iter.flat_map(move |v| { + graph.neighbours(v, dir, layer_ids.clone(), filter.as_ref()) + })) + } } } } @@ -58,7 +67,7 @@ pub struct PathFromGraph { } impl PathFromGraph { - pub(crate) fn new(graph: G, operation: Operations) -> PathFromGraph { + pub fn new(graph: G, operation: Operations) -> PathFromGraph { PathFromGraph { graph, operations: Arc::new(vec![operation]), @@ -68,11 +77,14 @@ impl 
PathFromGraph { pub fn iter(&self) -> Box> + Send> { let g = self.graph.clone(); let ops = self.operations.clone(); - Box::new(g.vertex_refs().map(move |v| PathFromVertex { - graph: g.clone(), - vertex: v, - operations: ops.clone(), - })) + Box::new( + g.vertex_refs(g.layer_ids(), g.edge_filter()) + .map(move |v| PathFromVertex { + graph: g.clone(), + vertex: v, + operations: ops.clone(), + }), + ) } } @@ -98,24 +110,6 @@ impl VertexViewOps for PathFromGraph { Box::new(self.iter().map(|it| it.latest_time())) } - fn property( - &self, - name: String, - include_static: bool, - ) -> Box> + Send>> + Send> { - Box::new( - self.iter() - .map(move |it| it.property(name.clone(), include_static.clone())), - ) - } - - fn property_history( - &self, - name: String, - ) -> Box> + Send>> + Send> { - Box::new(self.iter().map(move |it| it.property_history(name.clone()))) - } - fn history( &self, ) -> Box> + Send>> + Send> { @@ -124,54 +118,9 @@ impl VertexViewOps for PathFromGraph { fn properties( &self, - include_static: bool, - ) -> Box> + Send>> + Send> + ) -> Box>> + Send>> + Send> { - Box::new(self.iter().map(move |it| it.properties(include_static))) - } - - fn property_histories( - &self, - ) -> Box< - dyn Iterator>> + Send>> - + Send, - > { - Box::new(self.iter().map(|it| it.property_histories())) - } - - fn property_names( - &self, - include_static: bool, - ) -> Box> + Send>> + Send> { - Box::new(self.iter().map(move |it| it.property_names(include_static))) - } - - fn has_property( - &self, - name: String, - include_static: bool, - ) -> Box + Send>> + Send> { - Box::new( - self.iter() - .map(move |it| it.has_property(name.clone(), include_static)), - ) - } - - fn has_static_property( - &self, - name: String, - ) -> Box + Send>> + Send> { - Box::new( - self.iter() - .map(move |it| it.has_static_property(name.clone())), - ) - } - - fn static_property( - &self, - name: String, - ) -> Box> + Send>> + Send> { - Box::new(self.iter().map(move |it| 
it.static_property(name.clone()))) + Box::new(self.iter().map(move |it| it.properties())) } fn degree(&self) -> Box + Send>> + Send> { @@ -264,7 +213,7 @@ impl LayerOps for PathFromGraph { } } - fn layer(&self, name: &str) -> Option { + fn layer>(&self, name: L) -> Option { Some(PathFromGraph { graph: self.graph.layer(name)?, operations: self.operations.clone(), @@ -275,15 +224,13 @@ impl LayerOps for PathFromGraph { #[derive(Clone)] pub struct PathFromVertex { pub graph: G, - pub vertex: LocalVertexRef, + pub vertex: VID, pub operations: Arc>, } impl PathFromVertex { - - pub fn iter_refs(&self) -> Box + Send> { - let init: Box + Send> = - Box::new(iter::once(VertexRef::Local(self.vertex))); + pub fn iter_refs(&self) -> Box + Send> { + let init: Box + Send> = Box::new(iter::once(self.vertex)); let g = self.graph.clone(); let ops = self.operations.clone(); let iter = ops @@ -294,17 +241,18 @@ impl PathFromVertex { pub fn iter(&self) -> Box> + Send> { let g = self.graph.clone(); - let iter = self.iter_refs() - .map(move |v| VertexView::new(g.clone(), v)); + let iter = self + .iter_refs() + .map(move |v| VertexView::new_internal(g.clone(), v)); Box::new(iter) } - pub(crate) fn new>( + pub fn new>( graph: G, vertex: V, operation: Operations, ) -> PathFromVertex { - let v = graph.localise_vertex_unchecked(vertex.into()); + let v = graph.internalise_vertex_unchecked(vertex.into()); PathFromVertex { graph, vertex: v, @@ -312,9 +260,13 @@ impl PathFromVertex { } } - pub(crate) fn neighbours_window(&self, dir:Direction, t_start: i64, t_end:i64) -> Self { + pub fn neighbours_window(&self, dir: Direction, t_start: i64, t_end: i64) -> Self { let mut new_ops = (*self.operations).clone(); - new_ops.push(Operations::NeighboursWindow { dir, t_start, t_end }); + new_ops.push(Operations::NeighboursWindow { + dir, + t_start, + t_end, + }); Self { graph: self.graph.clone(), vertex: self.vertex, @@ -345,40 +297,12 @@ impl VertexViewOps for PathFromVertex { self.iter().latest_time() } - 
fn property(&self, name: String, include_static: bool) -> Self::ValueType> { - self.iter().property(name, include_static) - } - - fn property_history(&self, name: String) -> Self::ValueType> { - self.iter().property_history(name) - } - fn history(&self) -> Self::ValueType> { self.iter().history() } - fn properties(&self, include_static: bool) -> Self::ValueType> { - self.iter().properties(include_static) - } - - fn property_histories(&self) -> Self::ValueType>> { - self.iter().property_histories() - } - - fn property_names(&self, include_static: bool) -> Self::ValueType> { - self.iter().property_names(include_static) - } - - fn has_property(&self, name: String, include_static: bool) -> Self::ValueType { - self.iter().has_property(name, include_static) - } - - fn has_static_property(&self, name: String) -> Self::ValueType { - self.iter().has_static_property(name) - } - - fn static_property(&self, name: String) -> Self::ValueType> { - self.iter().static_property(name) + fn properties(&self) -> Self::ValueType>> { + self.iter().properties() } fn degree(&self) -> Self::ValueType { @@ -416,7 +340,6 @@ impl VertexViewOps for PathFromVertex { } } - fn in_neighbours(&self) -> Self { let mut new_ops = (*self.operations).clone(); let dir = Direction::IN; @@ -471,7 +394,7 @@ impl LayerOps for PathFromVertex { } } - fn layer(&self, name: &str) -> Option { + fn layer>(&self, name: L) -> Option { Some(PathFromVertex { graph: self.graph.layer(name)?, vertex: self.vertex, diff --git a/raphtory/src/db/graph/vertex.rs b/raphtory/src/db/graph/vertex.rs new file mode 100644 index 0000000000..25c8177d53 --- /dev/null +++ b/raphtory/src/db/graph/vertex.rs @@ -0,0 +1,567 @@ +//! Defines the `Vertex` struct, which represents a vertex in the graph. 
+ +use crate::{ + core::{ + entities::{vertices::vertex_ref::VertexRef, VID}, + storage::timeindex::TimeIndexEntry, + utils::{errors::GraphError, time::IntoTime}, + ArcStr, Direction, + }, + db::{ + api::{ + mutation::{ + internal::{InternalAdditionOps, InternalPropertyAdditionOps}, + CollectProperties, TryIntoInputTime, + }, + properties::{ + internal::{ConstPropertiesOps, TemporalPropertiesOps, TemporalPropertyViewOps}, + Properties, + }, + view::{internal::Static, BoxedIter, Layer, LayerOps}, + }, + graph::{ + edge::{EdgeList, EdgeView}, + path::{Operations, PathFromVertex}, + views::{layer_graph::LayeredGraph, window_graph::WindowedGraph}, + }, + }, + prelude::*, +}; + +#[derive(Debug, Clone)] +pub struct VertexView { + pub graph: G, + pub vertex: VID, +} + +impl PartialEq> for VertexView { + fn eq(&self, other: &VertexView) -> bool { + self.id() == other.id() + } +} + +impl From> for VertexRef { + fn from(value: VertexView) -> Self { + VertexRef::Internal(value.vertex) + } +} + +impl From<&VertexView> for VertexRef { + fn from(value: &VertexView) -> Self { + VertexRef::Internal(value.vertex) + } +} + +impl VertexView { + /// Creates a new `VertexView` wrapping an internal vertex reference and a graph, internalising any global vertex ids. 
+ pub fn new(graph: G, vertex: VertexRef) -> VertexView { + match vertex { + VertexRef::Internal(local) => Self::new_internal(graph, local), + _ => { + let v = graph.internalise_vertex_unchecked(vertex); + VertexView { graph, vertex: v } + } + } + } + + /// Creates a new `VertexView` wrapping an internal vertex reference and a graph + pub fn new_internal(graph: G, vertex: VID) -> VertexView { + VertexView { graph, vertex } + } +} + +impl TemporalPropertiesOps for VertexView { + fn get_temporal_prop_id(&self, name: &str) -> Option { + self.graph + .vertex_meta() + .temporal_prop_meta() + .get_id(name) + .filter(|id| self.graph.has_temporal_vertex_prop(self.vertex, *id)) + } + + fn get_temporal_prop_name(&self, id: usize) -> ArcStr { + self.graph.vertex_meta().temporal_prop_meta().get_name(id) + } + + fn temporal_prop_ids(&self) -> Box + '_> { + Box::new( + self.graph + .temporal_vertex_prop_ids(self.vertex) + .filter(|id| self.graph.has_temporal_vertex_prop(self.vertex, *id)), + ) + } +} + +impl TemporalPropertyViewOps for VertexView { + fn temporal_value(&self, id: usize) -> Option { + self.graph + .temporal_vertex_prop_vec(self.vertex, id) + .last() + .map(|(_, v)| v.to_owned()) + } + + fn temporal_history(&self, id: usize) -> Vec { + self.graph + .temporal_vertex_prop_vec(self.vertex, id) + .into_iter() + .map(|(t, _)| t) + .collect() + } + + fn temporal_values(&self, id: usize) -> Vec { + self.graph + .temporal_vertex_prop_vec(self.vertex, id) + .into_iter() + .map(|(_, v)| v) + .collect() + } + + fn temporal_value_at(&self, id: usize, t: i64) -> Option { + let history = self.temporal_history(id); + match history.binary_search(&t) { + Ok(index) => Some(self.temporal_values(id)[index].clone()), + Err(index) => (index > 0).then(|| self.temporal_values(id)[index - 1].clone()), + } + } +} + +impl ConstPropertiesOps for VertexView { + fn get_const_prop_id(&self, name: &str) -> Option { + self.graph.vertex_meta().const_prop_meta().get_id(name) + } + + fn 
get_const_prop_name(&self, id: usize) -> ArcStr { + self.graph.vertex_meta().const_prop_meta().get_name(id) + } + + fn const_prop_ids(&self) -> Box + '_> { + self.graph.constant_vertex_prop_ids(self.vertex) + } + + fn get_const_prop(&self, id: usize) -> Option { + self.graph.constant_vertex_prop(self.vertex, id) + } +} + +impl Static for VertexView {} + +/// View of a Vertex in a Graph +impl VertexViewOps for VertexView { + type Graph = G; + type ValueType = T; + type PathType<'a> = PathFromVertex where Self: 'a; + type EList = BoxedIter>; + + fn id(&self) -> u64 { + self.graph.vertex_id(self.vertex) + } + + fn name(&self) -> String { + self.graph.vertex_name(self.vertex) + } + + fn earliest_time(&self) -> Option { + self.graph.vertex_earliest_time(self.vertex) + } + + fn latest_time(&self) -> Option { + self.graph.vertex_latest_time(self.vertex) + } + + fn history(&self) -> Vec { + self.graph.vertex_history(self.vertex) + } + + fn properties(&self) -> Properties { + Properties::new(self.clone()) + } + + fn degree(&self) -> usize { + let dir = Direction::BOTH; + self.graph.degree( + self.vertex, + dir, + &self.graph.layer_ids(), + self.graph.edge_filter(), + ) + } + + fn in_degree(&self) -> usize { + let dir = Direction::IN; + self.graph.degree( + self.vertex, + dir, + &self.graph.layer_ids(), + self.graph.edge_filter(), + ) + } + + fn out_degree(&self) -> usize { + let dir = Direction::OUT; + self.graph.degree( + self.vertex, + dir, + &self.graph.layer_ids(), + self.graph.edge_filter(), + ) + } + + fn edges(&self) -> EdgeList { + let g = self.graph.clone(); + let dir = Direction::BOTH; + Box::new( + g.vertex_edges( + self.vertex, + dir, + self.graph.layer_ids(), + self.graph.edge_filter(), + ) + .map(move |e| EdgeView::new(g.clone(), e)), + ) + } + + fn in_edges(&self) -> EdgeList { + let g = self.graph.clone(); + let dir = Direction::IN; + Box::new( + g.vertex_edges( + self.vertex, + dir, + self.graph.layer_ids(), + self.graph.edge_filter(), + ) + .map(move |e| 
EdgeView::new(g.clone(), e)), + ) + } + + fn out_edges(&self) -> EdgeList { + let g = self.graph.clone(); + let dir = Direction::OUT; + Box::new( + g.vertex_edges( + self.vertex, + dir, + self.graph.layer_ids(), + self.graph.edge_filter(), + ) + .map(move |e| EdgeView::new(g.clone(), e)), + ) + } + + fn neighbours(&self) -> PathFromVertex { + let g = self.graph.clone(); + let dir = Direction::BOTH; + PathFromVertex::new(g, self, Operations::Neighbours { dir }) + } + + fn in_neighbours(&self) -> PathFromVertex { + let g = self.graph.clone(); + let dir = Direction::IN; + PathFromVertex::new(g, self, Operations::Neighbours { dir }) + } + + fn out_neighbours(&self) -> PathFromVertex { + let g = self.graph.clone(); + let dir = Direction::OUT; + PathFromVertex::new(g, self, Operations::Neighbours { dir }) + } +} + +impl TimeOps for VertexView { + type WindowedViewType = VertexView>; + + fn start(&self) -> Option { + self.graph.start() + } + + fn end(&self) -> Option { + self.graph.end() + } + + fn window(&self, t_start: T, t_end: T) -> Self::WindowedViewType { + VertexView { + graph: self.graph.window(t_start, t_end), + vertex: self.vertex, + } + } +} + +impl LayerOps for VertexView { + type LayeredViewType = VertexView>; + + fn default_layer(&self) -> Self::LayeredViewType { + VertexView { + graph: self.graph.default_layer(), + vertex: self.vertex, + } + } + + fn layer>(&self, name: L) -> Option { + Some(VertexView { + graph: self.graph.layer(name)?, + vertex: self.vertex, + }) + } +} + +impl VertexView { + pub fn add_constant_properties( + &self, + props: C, + ) -> Result<(), GraphError> { + let properties: Vec<(usize, Prop)> = props.collect_properties( + |name, dtype| self.graph.resolve_vertex_property(name, dtype, true), + |prop| self.graph.process_prop_value(prop), + )?; + self.graph + .internal_add_constant_vertex_properties(self.vertex, properties) + } + + pub fn add_updates( + &self, + time: T, + props: C, + ) -> Result<(), GraphError> { + let t = 
TimeIndexEntry::from_input(&self.graph, time)?; + let properties: Vec<(usize, Prop)> = props.collect_properties( + |name, dtype| self.graph.resolve_vertex_property(name, dtype, false), + |prop| self.graph.process_prop_value(prop), + )?; + self.graph.internal_add_vertex(t, self.vertex, properties) + } +} + +/// Implementation of the VertexListOps trait for an iterator of VertexView objects. +/// +impl VertexListOps for Box> + Send> { + type Graph = G; + type Vertex = VertexView; + type IterType = Box + Send>; + type EList = Box> + Send>; + type ValueType = T; + + fn earliest_time(self) -> BoxedIter> { + Box::new(self.map(|v| v.start())) + } + + fn latest_time(self) -> BoxedIter> { + Box::new(self.map(|v| v.end().map(|t| t - 1))) + } + + fn window(self, t_start: i64, t_end: i64) -> BoxedIter>> { + Box::new(self.map(move |v| v.window(t_start, t_end))) + } + + fn at(self, end: i64) -> Self::IterType<::WindowedViewType> { + Box::new(self.map(move |v| v.at(end))) + } + + fn id(self) -> BoxedIter { + Box::new(self.map(|v| v.id())) + } + + fn name(self) -> BoxedIter { + Box::new(self.map(|v| v.name())) + } + + fn properties(self) -> BoxedIter>> { + Box::new(self.map(move |v| v.properties())) + } + + fn history(self) -> BoxedIter> { + Box::new(self.map(|v| v.history())) + } + + fn degree(self) -> BoxedIter { + Box::new(self.map(|v| v.degree())) + } + + fn in_degree(self) -> BoxedIter { + Box::new(self.map(|v| v.in_degree())) + } + + fn out_degree(self) -> BoxedIter { + Box::new(self.map(|v| v.out_degree())) + } + + fn edges(self) -> Self::EList { + Box::new(self.flat_map(|v| v.edges())) + } + + fn in_edges(self) -> Self::EList { + Box::new(self.flat_map(|v| v.in_edges())) + } + + fn out_edges(self) -> Self::EList { + Box::new(self.flat_map(|v| v.out_edges())) + } + + fn neighbours(self) -> Self { + Box::new(self.flat_map(|v| v.neighbours())) + } + + fn in_neighbours(self) -> Self { + Box::new(self.flat_map(|v| v.in_neighbours())) + } + + fn out_neighbours(self) -> Self { + 
Box::new(self.flat_map(|v| v.out_neighbours())) + } +} + +impl VertexListOps for BoxedIter>> { + type Graph = G; + type Vertex = VertexView; + type IterType = BoxedIter>; + type EList = BoxedIter>>; + type ValueType = BoxedIter; + + fn earliest_time(self) -> BoxedIter>> { + Box::new(self.map(|it| it.earliest_time())) + } + + fn latest_time(self) -> BoxedIter>> { + Box::new(self.map(|it| it.latest_time())) + } + + fn window( + self, + t_start: i64, + t_end: i64, + ) -> BoxedIter>>> { + Box::new(self.map(move |it| it.window(t_start, t_end))) + } + + fn at(self, end: i64) -> Self::IterType<::WindowedViewType> { + Box::new(self.map(move |v| v.at(end))) + } + + fn id(self) -> BoxedIter> { + Box::new(self.map(|it| it.id())) + } + + fn name(self) -> BoxedIter> { + Box::new(self.map(|it| it.name())) + } + + fn properties(self) -> BoxedIter>>> { + Box::new(self.map(move |it| it.properties())) + } + + fn history(self) -> BoxedIter>> { + Box::new(self.map(move |it| it.history())) + } + + fn degree(self) -> BoxedIter> { + Box::new(self.map(|it| it.degree())) + } + + fn in_degree(self) -> BoxedIter> { + Box::new(self.map(|it| it.in_degree())) + } + + fn out_degree(self) -> BoxedIter> { + Box::new(self.map(|it| it.out_degree())) + } + + fn edges(self) -> Self::EList { + Box::new(self.map(|it| it.edges())) + } + + fn in_edges(self) -> Self::EList { + Box::new(self.map(|it| it.in_edges())) + } + + fn out_edges(self) -> Self::EList { + Box::new(self.map(|it| it.out_edges())) + } + + fn neighbours(self) -> Self { + Box::new(self.map(|it| it.neighbours())) + } + + fn in_neighbours(self) -> Self { + Box::new(self.map(|it| it.in_neighbours())) + } + + fn out_neighbours(self) -> Self { + Box::new(self.map(|it| it.out_neighbours())) + } +} + +#[cfg(test)] +mod vertex_test { + use crate::prelude::*; + use std::collections::HashMap; + + #[test] + fn test_earliest_time() { + let g = Graph::new(); + g.add_vertex(0, 1, NO_PROPS).unwrap(); + g.add_vertex(1, 1, NO_PROPS).unwrap(); + 
g.add_vertex(2, 1, NO_PROPS).unwrap(); + let mut view = g.at(1); + assert_eq!(view.vertex(1).expect("v").earliest_time().unwrap(), 0); + assert_eq!(view.vertex(1).expect("v").latest_time().unwrap(), 1); + + view = g.at(3); + assert_eq!(view.vertex(1).expect("v").earliest_time().unwrap(), 0); + assert_eq!(view.vertex(1).expect("v").latest_time().unwrap(), 2); + } + + #[test] + fn test_properties() { + let g = Graph::new(); + let props = [("test", "test")]; + g.add_vertex(0, 1, NO_PROPS).unwrap(); + g.add_vertex(2, 1, props).unwrap(); + + let v1 = g.vertex(1).unwrap(); + let v1_w = g.window(0, 1).vertex(1).unwrap(); + assert_eq!( + v1.properties().as_map(), + props + .into_iter() + .map(|(k, v)| (k.into(), v.into_prop())) + .collect() + ); + assert_eq!(v1_w.properties().as_map(), HashMap::default()) + } + + #[test] + fn test_property_additions() { + let g = Graph::new(); + let props = [("test", "test")]; + let v1 = g.add_vertex(0, 1, NO_PROPS).unwrap(); + v1.add_updates(2, props).unwrap(); + let v1_w = v1.window(0, 1); + assert_eq!( + v1.properties().as_map(), + props + .into_iter() + .map(|(k, v)| (k.into(), v.into_prop())) + .collect() + ); + assert_eq!(v1_w.properties().as_map(), HashMap::default()) + } + + #[test] + fn test_constant_property_additions() { + let g = Graph::new(); + let v1 = g.add_vertex(0, 1, NO_PROPS).unwrap(); + v1.add_constant_properties([("test", "test")]).unwrap(); + assert_eq!(v1.properties().get("test"), Some("test".into())) + } + + #[test] + fn test_string_deduplication() { + let g = Graph::new(); + let v1 = g + .add_vertex(0, 1, [("test1", "test"), ("test2", "test")]) + .unwrap(); + let s1 = v1.properties().get("test1").unwrap_str(); + let s2 = v1.properties().get("test2").unwrap_str(); + + assert_eq!(s1.as_ptr(), s2.as_ptr()) + } +} diff --git a/raphtory/src/db/vertices.rs b/raphtory/src/db/graph/vertices.rs similarity index 53% rename from raphtory/src/db/vertices.rs rename to raphtory/src/db/graph/vertices.rs index 
95eea7201c..b44646565d 100644 --- a/raphtory/src/db/vertices.rs +++ b/raphtory/src/db/graph/vertices.rs @@ -1,15 +1,19 @@ -use crate::core::time::IntoTime; -use crate::core::vertex_ref::VertexRef; -use crate::core::{Direction, Prop}; -use crate::db::edge::EdgeView; -use crate::db::graph_layer::LayeredGraph; -use crate::db::graph_window::WindowedGraph; -use crate::db::path::{Operations, PathFromGraph}; -use crate::db::vertex::VertexView; -use crate::db::view_api::layer::LayerOps; -use crate::db::view_api::BoxedIter; -use crate::db::view_api::*; -use std::collections::HashMap; +use crate::{ + core::{entities::vertices::vertex_ref::VertexRef, utils::time::IntoTime, Direction}, + db::{ + api::{ + properties::Properties, + view::{BoxedIter, Layer, LayerOps}, + }, + graph::{ + edge::EdgeView, + path::{Operations, PathFromGraph}, + vertex::VertexView, + views::{layer_graph::LayeredGraph, window_graph::WindowedGraph}, + }, + }, + prelude::*, +}; #[derive(Clone)] pub struct Vertices { @@ -24,15 +28,17 @@ impl Vertices { pub fn iter(&self) -> Box> + Send> { let g = self.graph.clone(); Box::new( - g.vertex_refs() - .map(move |v| VertexView::new_local(g.clone(), v)), + g.vertex_refs(g.layer_ids(), g.edge_filter()) + .map(move |v| VertexView::new_internal(g.clone(), v)), ) } + /// Returns the number of vertices in the graph. pub fn len(&self) -> usize { - self.graph.num_vertices() + self.graph.count_vertices() } + /// Returns true if the graph contains no vertices. 
pub fn is_empty(&self) -> bool { self.graph.is_empty() } @@ -48,92 +54,115 @@ impl VertexViewOps for Vertices { type PathType<'a> = PathFromGraph; type EList = BoxedIter>>; + /// Returns an iterator over the vertices' id fn id(&self) -> Self::ValueType { self.iter().id() } + /// Returns an iterator over the vertices' name fn name(&self) -> Self::ValueType { self.iter().name() } + /// Returns an iterator over the vertices' earliest time fn earliest_time(&self) -> Self::ValueType> { self.iter().earliest_time() } + /// Returns an iterator over the vertices' latest time fn latest_time(&self) -> Self::ValueType> { self.iter().latest_time() } - fn property(&self, name: String, include_static: bool) -> Self::ValueType> { - self.iter().property(name, include_static) - } - - fn property_history(&self, name: String) -> Self::ValueType> { - self.iter().property_history(name) - } - + /// Returns an iterator over the vertices' histories fn history(&self) -> Self::ValueType> { self.iter().history() } - fn properties(&self, include_static: bool) -> Self::ValueType> { - self.iter().properties(include_static) - } - - fn property_histories(&self) -> Self::ValueType>> { - self.iter().property_histories() - } - - fn property_names(&self, include_static: bool) -> Self::ValueType> { - self.iter().property_names(include_static) - } - - fn has_property(&self, name: String, include_static: bool) -> Self::ValueType { - self.iter().has_property(name, include_static) - } - - fn has_static_property(&self, name: String) -> Self::ValueType { - self.iter().has_static_property(name) - } - - fn static_property(&self, name: String) -> Self::ValueType> { - self.iter().static_property(name) + /// Returns an iterator over the vertices' properties + fn properties(&self) -> Self::ValueType>> { + self.iter().properties() } + /// Returns the number of edges of the vertices + /// + /// # Returns + /// + /// An iterator of the number of edges of the vertices fn degree(&self) -> Self::ValueType { 
self.iter().degree() } + /// Returns the number of in edges of the vertices + /// + /// # Returns + /// + /// An iterator of the number of in edges of the vertices fn in_degree(&self) -> Self::ValueType { self.iter().in_degree() } + /// Returns the number of out edges of the vertices + /// + /// # Returns + /// + /// An iterator of the number of out edges of the vertices fn out_degree(&self) -> Self::ValueType { self.iter().out_degree() } + /// Returns the edges of the vertices + /// + /// # Returns + /// + /// An iterator of edges of the vertices fn edges(&self) -> Self::EList { Box::new(self.iter().map(|v| v.edges())) } + /// Returns the in edges of the vertices + /// + /// # Returns + /// + /// An iterator of in edges of the vertices fn in_edges(&self) -> Self::EList { Box::new(self.iter().map(|v| v.in_edges())) } + /// Returns the out edges of the vertices + /// + /// # Returns + /// + /// An iterator of out edges of the vertices fn out_edges(&self) -> Self::EList { Box::new(self.iter().map(|v| v.out_edges())) } + /// Get the neighbours of the vertices + /// + /// # Returns + /// + /// An iterator of the neighbours of the vertices fn neighbours(&self) -> PathFromGraph { let dir = Direction::BOTH; PathFromGraph::new(self.graph.clone(), Operations::Neighbours { dir }) } + /// Get the in neighbours of the vertices + /// + /// # Returns + /// + /// An iterator of the in neighbours of the vertices fn in_neighbours(&self) -> PathFromGraph { let dir = Direction::IN; PathFromGraph::new(self.graph.clone(), Operations::Neighbours { dir }) } + /// Get the out neighbours of the vertices + /// + /// # Returns + /// + /// An iterator of the out neighbours of the vertices fn out_neighbours(&self) -> PathFromGraph { let dir = Direction::OUT; PathFromGraph::new(self.graph.clone(), Operations::Neighbours { dir }) @@ -161,13 +190,27 @@ impl TimeOps for Vertices { impl LayerOps for Vertices { type LayeredViewType = Vertices>; + /// Create a view including all the vertices in the 
default layer + /// + /// # Returns + /// + /// A view including all the vertices in the default layer fn default_layer(&self) -> Self::LayeredViewType { Vertices { graph: self.graph.default_layer(), } } - fn layer(&self, name: &str) -> Option { + /// Create a view including all the vertices in the given layer + /// + /// # Arguments + /// + /// * `name` - The name of the layer + /// + /// # Returns + /// + /// A view including all the vertices in the given layer + fn layer>(&self, name: L) -> Option { Some(Vertices { graph: self.graph.layer(name)?, }) diff --git a/raphtory/src/db/graph/views/deletion_graph.rs b/raphtory/src/db/graph/views/deletion_graph.rs new file mode 100644 index 0000000000..c6126ecb36 --- /dev/null +++ b/raphtory/src/db/graph/views/deletion_graph.rs @@ -0,0 +1,673 @@ +use crate::{ + core::{ + entities::{ + edges::{edge_ref::EdgeRef, edge_store::EdgeStore}, + vertices::vertex_store::VertexStore, + LayerIds, VID, + }, + storage::timeindex::{AsTime, TimeIndexOps}, + utils::errors::GraphError, + Direction, Prop, + }, + db::{ + api::{ + mutation::internal::InheritMutationOps, + properties::internal::InheritPropertiesOps, + view::{internal::*, BoxedIter}, + }, + graph::graph::{graph_equal, InternalGraph}, + }, + prelude::*, +}; +use serde::{Deserialize, Serialize}; +use std::{ + cmp::min, + fmt::{Display, Formatter}, + iter, + ops::Range, + path::Path, + sync::Arc, +}; + +/// A graph view where an edge remains active from the time it is added until it is explicitly marked as deleted. +/// +/// Note that the graph will give you access to all edges that were added at any point in time, even those that are marked as deleted. +/// The deletion only has an effect on the exploded edge view that are returned. An edge is included in a windowed view of the graph if +/// it is considered active at any point in the window. 
+#[derive(Clone, Debug, Serialize, Deserialize)] +pub struct GraphWithDeletions { + graph: Arc, +} + +impl From for GraphWithDeletions { + fn from(value: InternalGraph) -> Self { + Self { + graph: Arc::new(value), + } + } +} + +impl IntoDynamic for GraphWithDeletions { + fn into_dynamic(self) -> DynamicGraph { + DynamicGraph::new(self) + } +} + +impl Display for GraphWithDeletions { + fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result { + Display::fmt(&self.graph, f) + } +} + +impl GraphWithDeletions { + fn edge_alive_at(&self, e: &EdgeStore, t: i64, layer_ids: &LayerIds) -> bool { + // FIXME: assumes additions are before deletions if at the same timestamp (need to have strict ordering/secondary index) + let ( + first_addition, + first_deletion, + last_addition_before_start, + last_deletion_before_start, + ) = match layer_ids { + LayerIds::None => return false, + LayerIds::All => ( + e.additions().iter().flat_map(|v| v.first_t()).min(), + e.deletions().iter().flat_map(|v| v.first_t()).min(), + e.additions() + .iter() + .flat_map(|v| v.range(i64::MIN..t.saturating_add(1)).last_t()) + .max(), + e.deletions() + .iter() + .flat_map(|v| v.range(i64::MIN..t).last_t()) + .max(), + ), + LayerIds::One(l_id) => ( + e.additions().get(*l_id).and_then(|v| v.first_t()), + e.deletions().get(*l_id).and_then(|v| v.first_t()), + e.additions() + .get(*l_id) + .and_then(|v| v.range(i64::MIN..t.saturating_add(1)).last_t()), + e.deletions() + .get(*l_id) + .and_then(|v| v.range(i64::MIN..t).last_t()), + ), + LayerIds::Multiple(ids) => ( + ids.iter() + .flat_map(|l_id| e.additions().get(*l_id).and_then(|v| v.first_t())) + .min(), + ids.iter() + .flat_map(|l_id| e.deletions().get(*l_id).and_then(|v| v.first_t())) + .min(), + ids.iter() + .flat_map(|l_id| { + e.additions() + .get(*l_id) + .and_then(|v| v.range(i64::MIN..t.saturating_add(1)).last_t()) + }) + .max(), + ids.iter() + .flat_map(|l_id| { + e.deletions() + .get(*l_id) + .and_then(|v| v.range(i64::MIN..t).last_t()) + }) + 
.max(), + ), + }; + + // None is less than any value (see test below) + (first_deletion < first_addition && first_deletion.filter(|v| *v >= t).is_some()) + || last_addition_before_start > last_deletion_before_start + } + + fn vertex_alive_at( + &self, + v: &VertexStore, + t: i64, + layers: &LayerIds, + edge_filter: Option<&EdgeFilter>, + ) -> bool { + let edges = self.graph.inner().storage.edges.read_lock(); + v.edge_tuples(layers, Direction::BOTH) + .map(|eref| edges.get(eref.pid().into())) + .filter(|e| { + edge_filter.map(|f| f(e, layers)).unwrap_or(true) + && self.edge_alive_at(e, t, layers) + }) + .next() + .is_some() + } + + pub fn new() -> Self { + Self { + graph: Arc::new(InternalGraph::default()), + } + } + + /// Save a graph to a directory + /// + /// # Arguments + /// + /// * `path` - The path to the directory + /// + /// # Returns + /// + /// A raphtory graph + /// + /// # Example + /// + /// ```no_run + /// use std::fs::File; + /// use raphtory::prelude::*; + /// let g = Graph::new(); + /// g.add_vertex(1, 1, NO_PROPS).unwrap(); + /// g.save_to_file("path_str").expect("failed to save file"); + /// ``` + pub fn save_to_file>(&self, path: P) -> Result<(), GraphError> { + MaterializedGraph::from(self.clone()).save_to_file(path) + } + + /// Load a graph from a directory + /// + /// # Arguments + /// + /// * `path` - The path to the directory + /// + /// # Returns + /// + /// A raphtory graph + /// + /// # Example + /// + /// ```no_run + /// use raphtory::prelude::*; + /// let g = Graph::load_from_file("path/to/graph"); + /// ``` + pub fn load_from_file>(path: P) -> Result { + let g = MaterializedGraph::load_from_file(path)?; + g.into_persistent().ok_or(GraphError::GraphLoadError) + } +} + +impl PartialEq for GraphWithDeletions { + fn eq(&self, other: &G) -> bool { + graph_equal(self, other) + } +} + +impl Base for GraphWithDeletions { + type Base = InternalGraph; + #[inline(always)] + fn base(&self) -> &Self::Base { + &self.graph + } +} + +impl 
InternalMaterialize for GraphWithDeletions { + fn new_base_graph(&self, graph: InternalGraph) -> MaterializedGraph { + MaterializedGraph::PersistentGraph(GraphWithDeletions { + graph: Arc::new(graph), + }) + } + + fn include_deletions(&self) -> bool { + true + } +} + +impl InheritMutationOps for GraphWithDeletions {} + +impl InheritCoreOps for GraphWithDeletions {} + +impl InheritCoreDeletionOps for GraphWithDeletions {} + +impl InheritGraphOps for GraphWithDeletions {} + +impl InheritPropertiesOps for GraphWithDeletions {} + +impl InheritLayerOps for GraphWithDeletions {} + +impl InheritEdgeFilterOps for GraphWithDeletions {} + +impl TimeSemantics for GraphWithDeletions { + fn vertex_earliest_time(&self, v: VID) -> Option { + self.graph.vertex_earliest_time(v) + } + + fn view_start(&self) -> Option { + self.graph.view_start() + } + + fn view_end(&self) -> Option { + self.graph.view_end() + } + + fn earliest_time_global(&self) -> Option { + self.graph.earliest_time_global() + } + + fn latest_time_global(&self) -> Option { + self.graph.latest_time_global() + } + + fn earliest_time_window(&self, t_start: i64, t_end: i64) -> Option { + self.graph.earliest_time_window(t_start, t_end) + } + + fn latest_time_window(&self, t_start: i64, t_end: i64) -> Option { + self.graph.latest_time_window(t_start, t_end) + } + + fn include_vertex_window( + &self, + v: VID, + w: Range, + layer_ids: &LayerIds, + edge_filter: Option<&EdgeFilter>, + ) -> bool { + let v = self.graph.inner().storage.get_node(v); + v.active(w.clone()) || self.vertex_alive_at(&v, w.start, layer_ids, edge_filter) + } + + fn include_edge_window(&self, e: &EdgeStore, w: Range, layer_ids: &LayerIds) -> bool { + // includes edge if it is alive at the start of the window or added during the window + e.active(layer_ids, w.clone()) || self.edge_alive_at(e, w.start, layer_ids) + } + + fn vertex_history(&self, v: VID) -> Vec { + self.graph.vertex_history(v) + } + + fn vertex_history_window(&self, v: VID, w: Range) -> 
Vec { + self.graph.vertex_history_window(v, w) + } + + fn edge_exploded(&self, e: EdgeRef, layer_ids: LayerIds) -> BoxedIter { + //Fixme: Need support for duration on exploded edges + if self.edge_alive_at(&self.core_edge(e.pid()), i64::MIN, &layer_ids) { + Box::new( + iter::once(e.at(i64::MIN.into())).chain(self.graph.edge_window_exploded( + e, + (i64::MIN + 1)..i64::MAX, + layer_ids, + )), + ) + } else { + self.graph.edge_exploded(e, layer_ids) + } + } + + fn edge_layers(&self, e: EdgeRef, layer_ids: LayerIds) -> BoxedIter { + self.graph.edge_layers(e, layer_ids) + } + + fn edge_window_exploded( + &self, + e: EdgeRef, + w: Range, + layer_ids: LayerIds, + ) -> BoxedIter { + // FIXME: Need better iterators on LockedView that capture the guard + let entry = self.core_edge(e.pid()); + if self.edge_alive_at(&entry, w.start, &layer_ids) { + Box::new( + iter::once(e.at(w.start.into())).chain(self.graph.edge_window_exploded( + e, + w.start.saturating_add(1)..w.end, + layer_ids, + )), + ) + } else { + self.graph.edge_window_exploded(e, w, layer_ids) + } + } + + fn edge_window_layers( + &self, + e: EdgeRef, + w: Range, + layer_ids: LayerIds, + ) -> BoxedIter { + let g = self.clone(); + Box::new( + self.graph + .edge_layers(e, layer_ids.clone()) + .filter(move |&e| { + let entry = g.core_edge(e.pid()); + g.include_edge_window( + &entry, + w.clone(), + &layer_ids.clone().constrain_from_edge(e), + ) + }), + ) + } + + fn edge_earliest_time(&self, e: EdgeRef, layer_ids: LayerIds) -> Option { + e.time().map(|ti| *ti.t()).or_else(|| { + let entry = self.core_edge(e.pid()); + if self.edge_alive_at(&entry, i64::MIN, &layer_ids.clone()) { + Some(i64::MIN) + } else { + self.edge_additions(e, layer_ids).first().map(|ti| *ti.t()) + } + }) + } + + fn edge_earliest_time_window( + &self, + e: EdgeRef, + w: Range, + layer_ids: LayerIds, + ) -> Option { + let entry = self.core_edge(e.pid()); + if self.edge_alive_at(&entry, w.start, &layer_ids) { + Some(w.start) + } else { + 
self.edge_additions(e, layer_ids).range(w).first_t() + } + } + + fn edge_latest_time(&self, e: EdgeRef, layer_ids: LayerIds) -> Option { + match e.time().map(|ti| *ti.t()) { + Some(t) => Some(min( + self.edge_additions(e, layer_ids.clone()) + .range(t.saturating_add(1)..i64::MAX) + .first_t() + .unwrap_or(i64::MAX), + self.edge_deletions(e, layer_ids) + .range(t.saturating_add(1)..i64::MAX) + .first_t() + .unwrap_or(i64::MAX), + )), + None => { + let entry = self.core_edge(e.pid()); + if self.edge_alive_at(&entry, i64::MAX, &layer_ids) { + Some(i64::MAX) + } else { + self.edge_deletions(e, layer_ids).last_t() + } + } + } + } + + fn edge_latest_time_window( + &self, + e: EdgeRef, + w: Range, + layer_ids: LayerIds, + ) -> Option { + match e.time().map(|ti| *ti.t()) { + Some(t) => Some(min( + self.edge_additions(e, layer_ids.clone()) + .range(t.saturating_add(1)..w.end) + .first_t() + .unwrap_or(w.end - 1), + self.edge_deletions(e, layer_ids) + .range(t.saturating_add(1)..w.end) + .first_t() + .unwrap_or(w.end - 1), + )), + None => { + let entry = self.core_edge(e.pid()); + if self.edge_alive_at(&entry, w.end - 1, &layer_ids) { + Some(w.end - 1) + } else { + self.edge_deletions(e, layer_ids).range(w).last_t() + } + } + } + } + + fn edge_deletion_history(&self, e: EdgeRef, layer_ids: LayerIds) -> Vec { + self.edge_deletions(e, layer_ids) + .iter_t() + .copied() + .collect() + } + + fn edge_deletion_history_window( + &self, + e: EdgeRef, + w: Range, + layer_ids: LayerIds, + ) -> Vec { + self.edge_deletions(e, layer_ids) + .range(w) + .iter_t() + .copied() + .collect() + } + + #[inline] + fn has_temporal_prop(&self, prop_id: usize) -> bool { + self.graph.has_temporal_prop(prop_id) + } + + fn temporal_prop_vec(&self, prop_id: usize) -> Vec<(i64, Prop)> { + self.graph.temporal_prop_vec(prop_id) + } + + #[inline] + fn has_temporal_prop_window(&self, prop_id: usize, w: Range) -> bool { + self.graph.has_temporal_prop_window(prop_id, w) + } + + fn temporal_prop_vec_window( + 
&self, + prop_id: usize, + t_start: i64, + t_end: i64, + ) -> Vec<(i64, Prop)> { + self.graph.temporal_prop_vec_window(prop_id, t_start, t_end) + } + + #[inline] + fn has_temporal_vertex_prop(&self, v: VID, prop_id: usize) -> bool { + self.graph.has_temporal_vertex_prop(v, prop_id) + } + + fn temporal_vertex_prop_vec(&self, v: VID, prop_id: usize) -> Vec<(i64, Prop)> { + self.graph.temporal_vertex_prop_vec(v, prop_id) + } + + fn has_temporal_vertex_prop_window(&self, v: VID, prop_id: usize, w: Range) -> bool { + self.graph.has_temporal_vertex_prop_window(v, prop_id, w) + } + + fn temporal_vertex_prop_vec_window( + &self, + v: VID, + prop_id: usize, + t_start: i64, + t_end: i64, + ) -> Vec<(i64, Prop)> { + self.graph + .temporal_vertex_prop_vec_window(v, prop_id, t_start, t_end) + } + + fn has_temporal_edge_prop_window( + &self, + e: EdgeRef, + prop_id: usize, + w: Range, + layer_ids: LayerIds, + ) -> bool { + let entry = self.core_edge(e.pid()); + + if entry.has_temporal_prop(&layer_ids, prop_id) { + let search_start = entry + .last_deletion_before(&layer_ids, w.start) + .unwrap_or(i64::MIN); // if property was added at any point since the last deletion, it is still there + match layer_ids { + LayerIds::None => false, + LayerIds::All => entry.layer_ids_iter().any(|id| { + entry + .temporal_prop_layer(id, prop_id) + .filter(|prop| prop.iter_window(search_start..w.end).next().is_some()) + .is_some() + }), + LayerIds::One(id) => entry + .temporal_prop_layer(id, prop_id) + .filter(|prop| prop.iter_window(search_start..w.end).next().is_some()) + .is_some(), + LayerIds::Multiple(ids) => ids.iter().any(|&id| { + entry + .temporal_prop_layer(id, prop_id) + .filter(|prop| prop.iter_window(search_start..w.end).next().is_some()) + .is_some() + }), + } + } else { + false + } + } + + fn temporal_edge_prop_vec_window( + &self, + e: EdgeRef, + prop_id: usize, + t_start: i64, + t_end: i64, + layer_ids: LayerIds, + ) -> Vec<(i64, Prop)> { + let prop = self.temporal_edge_prop(e, 
prop_id, layer_ids.clone()); + match prop { + Some(p) => { + let entry = self.core_edge(e.pid()); + if self.edge_alive_at(&entry, t_start, &layer_ids) { + p.last_before(t_start.saturating_add(1)) + .into_iter() + .map(|(_, v)| (t_start, v)) + .chain(p.iter_window(t_start.saturating_add(1)..t_end)) + .collect() + } else { + p.iter_window(t_start..t_end).collect() + } + } + None => Default::default(), + } + } + + fn has_temporal_edge_prop(&self, e: EdgeRef, prop_id: usize, layer_ids: LayerIds) -> bool { + self.graph.has_temporal_edge_prop(e, prop_id, layer_ids) + } + + fn temporal_edge_prop_vec( + &self, + e: EdgeRef, + prop_id: usize, + layer_ids: LayerIds, + ) -> Vec<(i64, Prop)> { + self.graph.temporal_edge_prop_vec(e, prop_id, layer_ids) + } +} + +#[cfg(test)] +mod test_deletions { + use crate::{db::graph::views::deletion_graph::GraphWithDeletions, prelude::*}; + use itertools::Itertools; + + #[test] + fn test_edge_deletions() { + let g = GraphWithDeletions::new(); + + g.add_edge(0, 0, 1, [("added", Prop::I64(0))], None) + .unwrap(); + g.delete_edge(10, 0, 1, None).unwrap(); + + assert_eq!(g.edges().id().collect::>(), vec![(0, 1)]); + + assert_eq!( + g.window(1, 2).edges().id().collect::>(), + vec![(0, 1)] + ); + + assert_eq!(g.window(1, 2).count_edges(), 1); + + assert!(g.window(11, 12).is_empty()); + + assert_eq!( + g.window(1, 2) + .edge(0, 1) + .unwrap() + .properties() + .get("added") + .unwrap_i64(), + 0 + ); + + assert!(g.window(11, 12).edge(0, 1).is_none()); + + assert_eq!( + g.window(1, 2) + .edge(0, 1) + .unwrap() + .properties() + .temporal() + .get("added") + .unwrap() + .iter() + .collect_vec(), + vec![(1, Prop::I64(0))] + ); + + assert_eq!(g.window(1, 2).vertex(0).unwrap().out_degree(), 1) + } + + #[test] + fn test_materialize_only_deletion() { + let g = GraphWithDeletions::new(); + g.delete_edge(1, 1, 2, None).unwrap(); + + assert_eq!(g.materialize().unwrap().into_persistent().unwrap(), g); + } + + #[test] + fn test_materialize_window() { + let g = 
GraphWithDeletions::new(); + g.add_edge(0, 1, 2, NO_PROPS, None).unwrap(); + g.delete_edge(10, 1, 2, None).unwrap(); + + let gm = g + .window(3, 5) + .materialize() + .unwrap() + .into_persistent() + .unwrap(); + assert_eq!(gm, g.window(3, 5)) + } + + #[test] + fn test_exploded_latest_time() { + let g = GraphWithDeletions::new(); + let e = g.add_edge(0, 1, 2, NO_PROPS, None).unwrap(); + g.delete_edge(10, 1, 2, None).unwrap(); + assert_eq!(e.latest_time(), Some(10)); + assert_eq!(e.explode().latest_time().collect_vec(), vec![Some(10)]); + } + + #[test] + fn test_edge_properties() { + let g = GraphWithDeletions::new(); + let e = g.add_edge(0, 1, 2, [("test", "test")], None).unwrap(); + assert_eq!(e.properties().get("test").unwrap_str(), "test"); + e.delete(10, None).unwrap(); + assert_eq!(e.properties().get("test").unwrap_str(), "test"); + e.add_updates(11, [("test", "test11")], None).unwrap(); + assert_eq!( + e.window(10, 12).properties().get("test").unwrap_str(), + "test11" + ); + assert_eq!( + e.window(5, 12) + .properties() + .temporal() + .get("test") + .unwrap() + .iter() + .collect_vec(), + vec![(5, Prop::str("test")), (11i64, Prop::str("test11"))], + ); + } +} diff --git a/raphtory/src/db/graph/views/layer_graph.rs b/raphtory/src/db/graph/views/layer_graph.rs new file mode 100644 index 0000000000..8b01b0c94c --- /dev/null +++ b/raphtory/src/db/graph/views/layer_graph.rs @@ -0,0 +1,182 @@ +use crate::{ + core::entities::{edges::edge_store::EdgeStore, LayerIds}, + db::api::{ + properties::internal::InheritPropertiesOps, + view::{ + internal::{ + Base, EdgeFilter, EdgeFilterOps, Immutable, InheritCoreOps, InheritGraphOps, + InheritMaterialize, InheritTimeSemantics, InternalLayerOps, + }, + Layer, + }, + }, + prelude::GraphViewOps, +}; +use itertools::Itertools; +use std::{ + fmt::{Debug, Formatter}, + sync::Arc, +}; + +#[derive(Clone)] +pub struct LayeredGraph { + /// The underlying `Graph` object. + pub graph: G, + /// The layer this graphs points to. 
+ pub layers: LayerIds, + + edge_filter: EdgeFilter, +} + +impl Immutable for LayeredGraph {} + +impl Debug for LayeredGraph { + fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result { + f.debug_struct("LayeredGraph") + .field("graph", &self.graph) + .field("layers", &self.layers) + .finish() + } +} + +impl Base for LayeredGraph { + type Base = G; + #[inline(always)] + fn base(&self) -> &Self::Base { + &self.graph + } +} + +impl InheritTimeSemantics for LayeredGraph {} + +impl InheritCoreOps for LayeredGraph {} + +impl InheritMaterialize for LayeredGraph {} + +impl InheritPropertiesOps for LayeredGraph {} + +impl InheritGraphOps for LayeredGraph {} + +impl EdgeFilterOps for LayeredGraph { + #[inline] + fn edge_filter(&self) -> Option<&EdgeFilter> { + Some(&self.edge_filter) + } +} + +impl LayeredGraph { + pub fn new(graph: G, layers: LayerIds) -> Self { + let edge_filter: EdgeFilter = match graph.edge_filter().cloned() { + None => Arc::new(|e, l| e.has_layer(l)), + Some(f) => Arc::new(move |e, l| e.has_layer(l) && f(e, l)), + }; + Self { + graph, + layers, + edge_filter, + } + } + + /// Get the intersection between the previously requested layers and the layers of + /// this view + fn constrain(&self, layers: LayerIds) -> LayerIds { + match layers { + LayerIds::None => LayerIds::None, + LayerIds::All => self.layers.clone(), + _ => match &self.layers { + LayerIds::All => layers, + LayerIds::One(id) => match layers.find(*id) { + Some(layer) => LayerIds::One(layer), + None => LayerIds::None, + }, + LayerIds::Multiple(ids) => { + // intersect the layers + let new_layers = ids.iter().filter_map(|id| layers.find(*id)).collect_vec(); + match new_layers.len() { + 0 => LayerIds::None, + 1 => LayerIds::One(new_layers[0]), + _ => LayerIds::Multiple(new_layers.into()), + } + } + LayerIds::None => LayerIds::None, + }, + } + } +} + +impl InternalLayerOps for LayeredGraph { + fn layer_ids(&self) -> LayerIds { + self.layers.clone() + } + + fn layer_ids_from_names(&self, key: 
Layer) -> LayerIds { + self.constrain(self.graph.layer_ids_from_names(key)) + } + + fn edge_layer_ids(&self, e: &EdgeStore) -> LayerIds { + let layer_ids = self.graph.edge_layer_ids(e); + self.constrain(layer_ids) + } +} + +#[cfg(test)] +mod test_layers { + use crate::prelude::*; + use itertools::Itertools; + #[test] + fn test_layer_vertex() { + let g = Graph::new(); + + g.add_edge(0, 1, 2, NO_PROPS, Some("layer1")).unwrap(); + g.add_edge(0, 2, 3, NO_PROPS, Some("layer2")).unwrap(); + g.add_edge(3, 2, 4, NO_PROPS, Some("layer1")).unwrap(); + let neighbours = g + .layer(vec!["layer1", "layer2"]) + .unwrap() + .vertex(1) + .unwrap() + .neighbours() + .into_iter() + .collect_vec(); + assert_eq!( + neighbours[0] + .layer("layer2") + .unwrap() + .edges() + .id() + .collect_vec(), + vec![(2, 3)] + ); + assert_eq!( + g.layer("layer2") + .unwrap() + .vertex(neighbours[0].name()) + .unwrap() + .edges() + .id() + .collect_vec(), + vec![(2, 3)] + ); + let mut edges = g + .layer("layer1") + .unwrap() + .vertex(neighbours[0].name()) + .unwrap() + .edges() + .id() + .collect_vec(); + edges.sort(); + assert_eq!(edges, vec![(1, 2), (2, 4)]); + let mut edges = g.layer("layer1").unwrap().edges().id().collect_vec(); + edges.sort(); + assert_eq!(edges, vec![(1, 2), (2, 4)]); + let mut edges = g + .layer(vec!["layer1", "layer2"]) + .unwrap() + .edges() + .id() + .collect_vec(); + edges.sort(); + assert_eq!(edges, vec![(1, 2), (2, 3), (2, 4)]); + } +} diff --git a/raphtory/src/db/graph/views/mod.rs b/raphtory/src/db/graph/views/mod.rs new file mode 100644 index 0000000000..099efc6951 --- /dev/null +++ b/raphtory/src/db/graph/views/mod.rs @@ -0,0 +1,4 @@ +pub mod deletion_graph; +pub mod layer_graph; +pub mod vertex_subgraph; +pub mod window_graph; diff --git a/raphtory/src/db/graph/views/vertex_subgraph.rs b/raphtory/src/db/graph/views/vertex_subgraph.rs new file mode 100644 index 0000000000..3569646148 --- /dev/null +++ b/raphtory/src/db/graph/views/vertex_subgraph.rs @@ -0,0 +1,252 @@ 
+use crate::{ + core::{ + entities::{edges::edge_ref::EdgeRef, vertices::vertex_ref::VertexRef, LayerIds, EID, VID}, + Direction, + }, + db::api::{ + properties::internal::InheritPropertiesOps, + view::internal::{ + Base, EdgeFilter, EdgeFilterOps, GraphOps, Immutable, InheritCoreOps, InheritLayerOps, + InheritMaterialize, InheritTimeSemantics, + }, + }, + prelude::GraphViewOps, +}; +use itertools::Itertools; +use rayon::prelude::*; +use rustc_hash::FxHashSet; +use std::{ + fmt::{Debug, Formatter}, + sync::Arc, +}; + +#[derive(Clone)] +pub struct VertexSubgraph { + graph: G, + vertices: Arc>, + edge_filter: EdgeFilter, +} + +impl Debug for VertexSubgraph { + fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result { + f.debug_struct("VertexSubgraph") + .field("graph", &self.graph) + .field("vertices", &self.vertices) + .finish() + } +} + +impl Base for VertexSubgraph { + type Base = G; + #[inline(always)] + fn base(&self) -> &Self::Base { + &self.graph + } +} + +impl Immutable for VertexSubgraph {} + +impl InheritCoreOps for VertexSubgraph {} +impl InheritTimeSemantics for VertexSubgraph {} +impl InheritPropertiesOps for VertexSubgraph {} +impl InheritMaterialize for VertexSubgraph {} +impl InheritLayerOps for VertexSubgraph {} + +impl VertexSubgraph { + pub fn new(graph: G, vertices: FxHashSet) -> Self { + let vertices = Arc::new(vertices); + let vertices_cloned = vertices.clone(); + let edge_filter: EdgeFilter = match graph.edge_filter().cloned() { + Some(f) => Arc::new(move |e, l| { + vertices_cloned.contains(&e.src()) && vertices_cloned.contains(&e.dst()) && f(e, l) + }), + None => Arc::new(move |e, _l| { + vertices_cloned.contains(&e.src()) && vertices_cloned.contains(&e.dst()) + }), + }; + Self { + graph, + vertices, + edge_filter, + } + } +} + +impl EdgeFilterOps for VertexSubgraph { + #[inline] + fn edge_filter(&self) -> Option<&EdgeFilter> { + Some(&self.edge_filter) + } +} + +impl GraphOps for VertexSubgraph { + fn internal_vertex_ref( + &self, + v: 
VertexRef, + layer_ids: &LayerIds, + filter: Option<&EdgeFilter>, + ) -> Option { + self.graph + .internal_vertex_ref(v, layer_ids, filter) + .filter(|v| self.vertices.contains(v)) + } + + fn find_edge_id( + &self, + e_id: EID, + layer_ids: &LayerIds, + filter: Option<&EdgeFilter>, + ) -> Option { + self.graph + .find_edge_id(e_id, layer_ids, filter) + .filter(|e| self.vertices.contains(&e.src()) && self.vertices.contains(&e.dst())) + } + + fn vertices_len(&self, _layer_ids: LayerIds, _filter: Option<&EdgeFilter>) -> usize { + self.vertices.len() + } + + fn edges_len(&self, layer: LayerIds, filter: Option<&EdgeFilter>) -> usize { + self.vertices + .par_iter() + .map(|v| self.degree(*v, Direction::OUT, &layer, filter)) + .sum() + } + + fn has_edge_ref( + &self, + src: VID, + dst: VID, + layer: &LayerIds, + filter: Option<&EdgeFilter>, + ) -> bool { + self.graph.has_edge_ref(src, dst, layer, filter) + } + + fn has_vertex_ref( + &self, + v: VertexRef, + layer_ids: &LayerIds, + edge_filter: Option<&EdgeFilter>, + ) -> bool { + self.internal_vertex_ref(v, layer_ids, edge_filter) + .is_some() + } + + fn degree(&self, v: VID, d: Direction, layer: &LayerIds, filter: Option<&EdgeFilter>) -> usize { + self.graph.degree(v, d, layer, filter) + } + + fn vertex_ref(&self, v: u64, layers: &LayerIds, filter: Option<&EdgeFilter>) -> Option { + self.internal_vertex_ref(v.into(), layers, filter) + } + + fn vertex_refs( + &self, + _layers: LayerIds, + _filter: Option<&EdgeFilter>, + ) -> Box + Send> { + // this sucks but seems to be the only way currently (see also http://smallcultfollowing.com/babysteps/blog/2018/09/02/rust-pattern-iterating-an-over-a-rc-vec-t/) + let verts = Vec::from_iter(self.vertices.iter().copied()); + Box::new(verts.into_iter()) + } + + fn edge_ref( + &self, + src: VID, + dst: VID, + layer: &LayerIds, + filter: Option<&EdgeFilter>, + ) -> Option { + self.graph.edge_ref(src, dst, layer, filter) + } + + fn edge_refs( + &self, + layer: LayerIds, + filter: 
Option<&EdgeFilter>, + ) -> Box + Send> { + let g1 = self.clone(); + let vertices = self.vertices.clone().iter().copied().collect_vec(); + let filter = filter.cloned(); + Box::new( + vertices.into_iter().flat_map(move |v| { + g1.vertex_edges(v, Direction::OUT, layer.clone(), filter.as_ref()) + }), + ) + } + + fn vertex_edges( + &self, + v: VID, + d: Direction, + layer: LayerIds, + filter: Option<&EdgeFilter>, + ) -> Box + Send> { + self.graph.vertex_edges(v, d, layer, filter) + } + + fn neighbours( + &self, + v: VID, + d: Direction, + layers: LayerIds, + filter: Option<&EdgeFilter>, + ) -> Box + Send> { + self.graph.neighbours(v, d, layers, filter) + } +} + +#[cfg(test)] +mod subgraph_tests { + use crate::{algorithms::triangle_count::triangle_count, prelude::*}; + + #[test] + fn test_materialize_no_edges() { + let g = Graph::new(); + + g.add_vertex(1, 1, NO_PROPS).unwrap(); + g.add_vertex(2, 2, NO_PROPS).unwrap(); + let sg = g.subgraph([1, 2]); + + let actual = sg.materialize().unwrap().into_events().unwrap(); + assert_eq!(actual, sg); + } + + #[test] + fn test_remove_degree1_triangle_count() { + let graph = Graph::new(); + let edges = vec![ + (1, 2, 1), + (1, 3, 2), + (1, 4, 3), + (3, 1, 4), + (3, 4, 5), + (3, 5, 6), + (4, 5, 7), + (5, 6, 8), + (5, 8, 9), + (7, 5, 10), + (8, 5, 11), + (1, 9, 12), + (9, 1, 13), + (6, 3, 14), + (4, 8, 15), + (8, 3, 16), + (5, 10, 17), + (10, 5, 18), + (10, 8, 19), + (1, 11, 20), + (11, 1, 21), + (9, 11, 22), + (11, 9, 23), + ]; + for (src, dst, ts) in edges { + graph.add_edge(ts, src, dst, NO_PROPS, None).unwrap(); + } + let subgraph = graph.subgraph(graph.vertices().into_iter().filter(|v| v.degree() > 1)); + let ts = triangle_count(&subgraph, None); + let tg = triangle_count(&graph, None); + assert_eq!(ts, tg) + } +} diff --git a/raphtory/src/db/graph/views/window_graph.rs b/raphtory/src/db/graph/views/window_graph.rs new file mode 100644 index 0000000000..d5da752c58 --- /dev/null +++ b/raphtory/src/db/graph/views/window_graph.rs 
@@ -0,0 +1,1127 @@ +//! A windowed view is the subset of a graph that falls within a specific time window. +//! For example, if you wanted to run an algorithm each month over a graph, a graph window +//! would allow you to split the graph into 30-day chunks to do so. +//! +//! This module also defines the `GraphWindow` trait, which represents a window of time over +//! which a graph can be queried. +//! +//! `GraphWindowSet` implements the `Iterator` trait, producing `WindowedGraph` views +//! for each perspective within it. +//! +//! # Types +//! +//! * `GraphWindowSet` - A struct that allows iterating over a `Graph` broken down into multiple +//! windowed views. It contains a `Graph` and an iterator of `Perspective`. +//! +//! * `WindowedGraph` - A struct that represents a windowed view of a `Graph`. +//! It contains a `Graph`, an inclusive start time (`t_start`) and an exclusive end time (`t_end`). +//! +//! # Traits +//! +//! * `GraphOps` - A trait that provides operations to a `WindowedGraph` +//! used internally by the `GraphWindowSet`. +//! +//! # Examples +//! +//! ```rust +//! +//! use raphtory::prelude::*; +//! use raphtory::db::api::view::*; +//! +//! let graph = Graph::new(); +//! graph.add_edge(0, 1, 2, NO_PROPS, None).unwrap(); +//! graph.add_edge(1, 1, 3, NO_PROPS, None).unwrap(); +//! graph.add_edge(2, 2, 3, NO_PROPS, None).unwrap(); +//! +//! let wg = graph.window(0, 1); +//! assert_eq!(wg.edge(1, 2).unwrap().src().id(), 1); +//! 
``` + +use crate::{ + core::{ + entities::{ + edges::{edge_ref::EdgeRef, edge_store::EdgeStore}, + vertices::vertex_ref::VertexRef, + LayerIds, EID, VID, + }, + utils::time::IntoTime, + ArcStr, Direction, Prop, + }, + db::api::{ + properties::internal::{ + InheritStaticPropertiesOps, TemporalPropertiesOps, TemporalPropertyViewOps, + }, + view::{ + internal::{ + Base, DynamicGraph, EdgeFilter, EdgeFilterOps, GraphOps, Immutable, InheritCoreOps, + InheritLayerOps, InheritMaterialize, IntoDynamic, TimeSemantics, + }, + BoxedIter, + }, + }, + prelude::{GraphViewOps, TimeOps}, + search::IndexedGraph, +}; +use std::{ + cmp::{max, min}, + fmt::{Debug, Formatter}, + ops::Range, + sync::Arc, +}; + +/// A struct that represents a windowed view of a `Graph`. +#[derive(Clone)] +pub struct WindowedGraph { + /// The underlying `Graph` object. + pub graph: G, + /// The inclusive start time of the window. + pub t_start: i64, + /// The exclusive end time of the window. + pub t_end: i64, + filter: EdgeFilter, +} + +impl Debug for WindowedGraph { + fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result { + write!( + f, + "WindowedGraph({:?}, {}..{})", + self.graph, self.t_start, self.t_end + ) + } +} + +impl WindowedGraph> { + pub fn into_dynamic_indexed(self) -> IndexedGraph { + IndexedGraph { + graph: self + .graph + .graph + .window(self.t_start, self.t_end) + .into_dynamic(), + vertex_index: self.graph.vertex_index, + edge_index: self.graph.edge_index, + reader: self.graph.reader, + edge_reader: self.graph.edge_reader, + } + } +} + +impl Base for WindowedGraph { + type Base = G; + #[inline(always)] + fn base(&self) -> &Self::Base { + &self.graph + } +} + +impl Immutable for WindowedGraph {} +impl InheritCoreOps for WindowedGraph {} + +impl InheritMaterialize for WindowedGraph {} + +impl InheritStaticPropertiesOps for WindowedGraph {} + +impl InheritLayerOps for WindowedGraph {} + +impl TemporalPropertyViewOps for WindowedGraph { + fn temporal_history(&self, id: usize) -> Vec { 
+ self.temporal_prop_vec(id) + .into_iter() + .map(|(t, _)| t) + .collect() + } + + fn temporal_values(&self, id: usize) -> Vec { + self.temporal_prop_vec(id) + .into_iter() + .map(|(_, v)| v) + .collect() + } +} + +impl TemporalPropertiesOps for WindowedGraph { + fn get_temporal_prop_id(&self, name: &str) -> Option { + self.graph + .get_temporal_prop_id(name) + .filter(|id| self.has_temporal_prop(*id)) + } + + fn get_temporal_prop_name(&self, id: usize) -> ArcStr { + self.graph.get_temporal_prop_name(id) + } + + fn temporal_prop_ids(&self) -> Box + '_> { + Box::new( + self.graph + .temporal_prop_ids() + .filter(|id| self.has_temporal_prop(*id)), + ) + } +} + +impl TimeSemantics for WindowedGraph { + fn vertex_earliest_time(&self, v: VID) -> Option { + self.graph + .vertex_earliest_time_window(v, self.t_start, self.t_end) + } + + fn vertex_latest_time(&self, v: VID) -> Option { + self.graph + .vertex_latest_time_window(v, self.t_start, self.t_end) + } + + fn view_start(&self) -> Option { + Some(self.t_start) + } + + fn view_end(&self) -> Option { + Some(self.t_end) + } + + #[inline] + fn earliest_time_global(&self) -> Option { + self.graph.earliest_time_window(self.t_start, self.t_end) + } + + #[inline] + fn latest_time_global(&self) -> Option { + self.graph.latest_time_window(self.t_start, self.t_end) + } + + #[inline] + fn earliest_time_window(&self, t_start: i64, t_end: i64) -> Option { + self.graph + .earliest_time_window(self.actual_start(t_start), self.actual_end(t_end)) + } + + #[inline] + fn latest_time_window(&self, t_start: i64, t_end: i64) -> Option { + self.graph + .latest_time_window(self.actual_start(t_start), self.actual_end(t_end)) + } + + #[inline] + fn vertex_earliest_time_window(&self, v: VID, t_start: i64, t_end: i64) -> Option { + self.graph.vertex_earliest_time_window( + v, + self.actual_start(t_start), + self.actual_end(t_end), + ) + } + + #[inline] + fn vertex_latest_time_window(&self, v: VID, t_start: i64, t_end: i64) -> Option { + 
self.graph + .vertex_latest_time_window(v, self.actual_start(t_start), self.actual_end(t_end)) + } + + #[inline] + fn include_vertex_window( + &self, + v: VID, + w: Range, + layer_ids: &LayerIds, + edge_filter: Option<&EdgeFilter>, + ) -> bool { + self.graph.include_vertex_window( + v, + self.actual_start(w.start)..self.actual_end(w.end), + layer_ids, + edge_filter, + ) + } + + #[inline] + fn include_edge_window(&self, e: &EdgeStore, w: Range, layer_ids: &LayerIds) -> bool { + self.graph.include_edge_window( + e, + self.actual_start(w.start)..self.actual_end(w.end), + layer_ids, + ) + } + + fn vertex_history(&self, v: VID) -> Vec { + self.graph + .vertex_history_window(v, self.t_start..self.t_end) + } + + fn vertex_history_window(&self, v: VID, w: Range) -> Vec { + self.graph + .vertex_history_window(v, self.actual_start(w.start)..self.actual_end(w.end)) + } + + fn edge_exploded(&self, e: EdgeRef, layer_ids: LayerIds) -> BoxedIter { + self.graph + .edge_window_exploded(e, self.t_start..self.t_end, layer_ids) + } + + fn edge_layers(&self, e: EdgeRef, layer_ids: LayerIds) -> BoxedIter { + self.graph + .edge_window_layers(e, self.t_start..self.t_end, layer_ids) + } + + fn edge_window_exploded( + &self, + e: EdgeRef, + w: Range, + layer_ids: LayerIds, + ) -> BoxedIter { + self.graph.edge_window_exploded( + e, + self.actual_start(w.start)..self.actual_end(w.end), + layer_ids, + ) + } + + fn edge_window_layers( + &self, + e: EdgeRef, + w: Range, + layer_ids: LayerIds, + ) -> BoxedIter { + self.graph.edge_window_layers( + e, + self.actual_start(w.start)..self.actual_end(w.end), + layer_ids, + ) + } + + fn edge_earliest_time(&self, e: EdgeRef, layer_ids: LayerIds) -> Option { + self.graph + .edge_earliest_time_window(e, self.t_start..self.t_end, layer_ids) + } + + fn edge_earliest_time_window( + &self, + e: EdgeRef, + w: Range, + layer_ids: LayerIds, + ) -> Option { + self.graph.edge_earliest_time_window( + e, + self.actual_start(w.start)..self.actual_end(w.end), + 
layer_ids, + ) + } + + fn edge_latest_time(&self, e: EdgeRef, layer_ids: LayerIds) -> Option { + self.graph + .edge_latest_time_window(e, self.t_start..self.t_end, layer_ids) + } + + fn edge_latest_time_window( + &self, + e: EdgeRef, + w: Range, + layer_ids: LayerIds, + ) -> Option { + self.graph.edge_latest_time_window( + e, + self.actual_start(w.start)..self.actual_end(w.end), + layer_ids, + ) + } + + fn edge_deletion_history(&self, e: EdgeRef, layer_ids: LayerIds) -> Vec { + self.graph + .edge_deletion_history_window(e, self.t_start..self.t_end, layer_ids) + } + + fn edge_deletion_history_window( + &self, + e: EdgeRef, + w: Range, + layer_ids: LayerIds, + ) -> Vec { + self.graph.edge_deletion_history_window( + e, + self.actual_start(w.start)..self.actual_end(w.end), + layer_ids, + ) + } + + fn has_temporal_prop(&self, prop_id: usize) -> bool { + self.graph + .has_temporal_prop_window(prop_id, self.t_start..self.t_end) + } + + fn temporal_prop_vec(&self, prop_id: usize) -> Vec<(i64, Prop)> { + self.graph + .temporal_prop_vec_window(prop_id, self.t_start, self.t_end) + } + + fn has_temporal_prop_window(&self, prop_id: usize, w: Range) -> bool { + self.graph + .has_temporal_prop_window(prop_id, self.actual_start(w.start)..self.actual_end(w.end)) + } + + fn temporal_prop_vec_window( + &self, + prop_id: usize, + t_start: i64, + t_end: i64, + ) -> Vec<(i64, Prop)> { + self.graph.temporal_prop_vec_window( + prop_id, + self.actual_start(t_start), + self.actual_end(t_end), + ) + } + + fn has_temporal_vertex_prop(&self, v: VID, prop_id: usize) -> bool { + self.graph + .has_temporal_vertex_prop_window(v, prop_id, self.t_start..self.t_end) + } + + fn temporal_vertex_prop_vec(&self, v: VID, prop_id: usize) -> Vec<(i64, Prop)> { + self.graph + .temporal_vertex_prop_vec_window(v, prop_id, self.t_start, self.t_end) + } + + fn has_temporal_vertex_prop_window(&self, v: VID, prop_id: usize, w: Range) -> bool { + self.graph.has_temporal_vertex_prop_window( + v, + prop_id, + 
self.actual_start(w.start)..self.actual_end(w.end), + ) + } + + fn temporal_vertex_prop_vec_window( + &self, + v: VID, + prop_id: usize, + t_start: i64, + t_end: i64, + ) -> Vec<(i64, Prop)> { + self.graph.temporal_vertex_prop_vec_window( + v, + prop_id, + self.actual_start(t_start), + self.actual_end(t_end), + ) + } + + fn has_temporal_edge_prop_window( + &self, + e: EdgeRef, + prop_id: usize, + w: Range, + layer_ids: LayerIds, + ) -> bool { + self.graph.has_temporal_edge_prop_window( + e, + prop_id, + self.actual_start(w.start)..self.actual_end(w.end), + layer_ids, + ) + } + + fn temporal_edge_prop_vec_window( + &self, + e: EdgeRef, + prop_id: usize, + t_start: i64, + t_end: i64, + layer_ids: LayerIds, + ) -> Vec<(i64, Prop)> { + self.graph.temporal_edge_prop_vec_window( + e, + prop_id, + self.actual_start(t_start), + self.actual_end(t_end), + layer_ids, + ) + } + + fn has_temporal_edge_prop(&self, e: EdgeRef, prop_id: usize, layer_ids: LayerIds) -> bool { + self.graph + .has_temporal_edge_prop_window(e, prop_id, self.t_start..self.t_end, layer_ids) + } + + fn temporal_edge_prop_vec( + &self, + e: EdgeRef, + prop_id: usize, + layer_ids: LayerIds, + ) -> Vec<(i64, Prop)> { + self.graph + .temporal_edge_prop_vec_window(e, prop_id, self.t_start, self.t_end, layer_ids) + } +} + +impl EdgeFilterOps for WindowedGraph { + #[inline] + fn edge_filter(&self) -> Option<&EdgeFilter> { + Some(&self.filter) + } +} + +/// Implementation of the GraphViewInternalOps trait for WindowedGraph. +/// This trait provides operations to a `WindowedGraph` used internally by the `GraphWindowSet`. +/// *Note: All functions in this are bound by the time set in the windowed graph. 
+impl GraphOps for WindowedGraph { + #[inline] + fn internal_vertex_ref( + &self, + v: VertexRef, + layers: &LayerIds, + filter: Option<&EdgeFilter>, + ) -> Option { + self.graph + .internal_vertex_ref(v, layers, filter) + .filter(|v| self.include_vertex_window(*v, self.t_start..self.t_end, layers, filter)) + } + + #[inline] + fn find_edge_id( + &self, + e_id: EID, + layer_ids: &LayerIds, + filter: Option<&EdgeFilter>, + ) -> Option { + self.graph.find_edge_id(e_id, layer_ids, filter) + } + + /// Returns the number of vertices in the windowed view. + #[inline] + fn vertices_len(&self, layer_ids: LayerIds, filter: Option<&EdgeFilter>) -> usize { + self.vertex_refs(layer_ids, filter).count() + } + + /// Returns the number of edges in the windowed view. + #[inline] + fn edges_len(&self, layer: LayerIds, filter: Option<&EdgeFilter>) -> usize { + // filter takes care of checking the window + self.graph.edges_len(layer, filter) + } + + /// Check if there is an edge from src to dst in the window. + /// + /// # Arguments + /// + /// - `src` - The source vertex. + /// - `dst` - The destination vertex. + /// + /// # Returns + /// + /// A result containing `true` if there is an edge from src to dst in the window, `false` otherwise. + /// + /// # Errors + /// + /// Returns an error if either `src` or `dst` is not a valid vertex. + #[inline] + fn has_edge_ref( + &self, + src: VID, + dst: VID, + layer: &LayerIds, + filter: Option<&EdgeFilter>, + ) -> bool { + // filter takes care of checking the window + self.graph.has_edge_ref(src, dst, layer, filter) + } + + /// Check if a vertex v exists in the window. + /// + /// # Arguments + /// + /// - `v` - The vertex to check. + /// + /// # Returns + /// + /// A result containing `true` if the vertex exists in the window, `false` otherwise. + /// + /// # Errors + /// + /// Returns an error if `v` is not a valid vertex. 
+ #[inline] + fn has_vertex_ref(&self, v: VertexRef, layers: &LayerIds, filter: Option<&EdgeFilter>) -> bool { + self.internal_vertex_ref(v, layers, filter).is_some() + } + + /// Returns the number of edges from a vertex in the window. + /// + /// # Arguments + /// + /// - `v` - The vertex to check. + /// - `d` - The direction of the edges to count. + /// + /// # Returns + /// + /// A result containing the number of edges from the vertex in the window. + /// + /// # Errors + /// + /// Returns an error if `v` is not a valid vertex. + #[inline] + fn degree(&self, v: VID, d: Direction, layer: &LayerIds, filter: Option<&EdgeFilter>) -> usize { + self.graph.degree(v, d, layer, filter) + } + + /// Get the reference of the vertex with ID v if it exists + /// + /// # Arguments + /// + /// - `v` - The ID of the vertex to get + /// + /// # Returns + /// + /// A result of an option containing the vertex reference if it exists, `None` otherwise. + /// + /// # Errors + /// + /// Returns an error if `v` is not a valid vertex. 
+ #[inline] + fn vertex_ref(&self, v: u64, layers: &LayerIds, filter: Option<&EdgeFilter>) -> Option { + self.internal_vertex_ref(v.into(), layers, filter) + } + + /// Get an iterator over the references of all vertices as references + /// + /// # Returns + /// + /// An iterator over the references of all vertices + #[inline] + fn vertex_refs( + &self, + layers: LayerIds, + filter: Option<&EdgeFilter>, + ) -> Box + Send> { + let g = self.clone(); + let filter_cloned = filter.cloned(); + Box::new( + self.graph + .vertex_refs(layers.clone(), filter) + .filter(move |v| { + g.include_vertex_window(*v, g.t_start..g.t_end, &layers, filter_cloned.as_ref()) + }), + ) + } + + /// Get an iterator over the references of an edges as a reference + /// + /// # Arguments + /// + /// - `src` - The source vertex of the edge + /// - `dst` - The destination vertex of the edge + /// + /// # Returns + /// + /// A result of an option containing the edge reference if it exists, `None` otherwise. + /// + /// # Errors + /// + /// Returns an error if `src` or `dst` are not valid vertices. 
+ #[inline] + fn edge_ref( + &self, + src: VID, + dst: VID, + layer: &LayerIds, + filter: Option<&EdgeFilter>, + ) -> Option { + self.graph.edge_ref(src, dst, layer, filter) + } + + /// Get an iterator of all edges as references + /// + /// # Returns + /// + /// An iterator over all edges as references + #[inline] + fn edge_refs( + &self, + layer: LayerIds, + filter: Option<&EdgeFilter>, + ) -> Box + Send> { + self.graph.edge_refs(layer, filter) + } + + #[inline] + fn vertex_edges( + &self, + v: VID, + d: Direction, + layer: LayerIds, + filter: Option<&EdgeFilter>, + ) -> Box + Send> { + self.graph.vertex_edges(v, d, layer, filter) + } + + /// Get the neighbours of a vertex as references in a given direction + /// + /// # Arguments + /// + /// - `v` - The vertex to get the neighbours for + /// - `d` - The direction of the edges + /// + /// # Returns + /// + /// An iterator over all neighbours in that vertex direction as references + #[inline] + fn neighbours( + &self, + v: VID, + d: Direction, + layer: LayerIds, + filter: Option<&EdgeFilter>, + ) -> Box + Send> { + self.graph.neighbours(v, d, layer, filter) + } +} + +/// A windowed graph is a graph that only allows access to vertices and edges within a time window. +/// +/// This struct is used to represent a graph with a time window. It is constructed +/// by providing a `Graph` object and a time range that defines the window. +/// +/// # Examples +/// +/// ```rust +/// use raphtory::db::api::view::*; +/// use raphtory::prelude::*; +/// +/// let graph = Graph::new(); +/// graph.add_edge(0, 1, 2, NO_PROPS, None).unwrap(); +/// graph.add_edge(1, 2, 3, NO_PROPS, None).unwrap(); +/// let windowed_graph = graph.window(0, 1); +/// ``` +impl WindowedGraph { + /// Create a new windowed graph + /// + /// # Arguments + /// + /// - `graph` - The graph to create the windowed graph from + /// - `t_start` - The inclusive start time of the window. + /// - `t_end` - The exclusive end time of the window. 
+ /// + /// # Returns + /// + /// A new windowed graph + pub fn new(graph: G, t_start: T, t_end: T) -> Self { + let filter_graph = graph.clone(); + let t_start = t_start.into_time(); + let t_end = t_end.into_time(); + let base_filter = filter_graph.edge_filter_window().cloned(); + let filter: EdgeFilter = match base_filter { + Some(f) => Arc::new(move |e, layers| { + f(e, layers) && filter_graph.include_edge_window(e, t_start..t_end, layers) + }), + None => Arc::new(move |e, layers| { + filter_graph.include_edge_window(e, t_start..t_end, layers) + }), + }; + WindowedGraph { + graph, + t_start, + t_end, + filter, + } + } + + /// the larger of `t_start` and `self.start()` (useful for creating nested windows) + #[inline] + fn actual_start(&self, t_start: i64) -> i64 { + max(t_start, self.t_start) + } + + /// the smaller of `t_end` and `self.end()` (useful for creating nested windows) + #[inline] + fn actual_end(&self, t_end: i64) -> i64 { + min(t_end, self.t_end) + } +} + +#[cfg(test)] +mod views_test { + + use super::*; + use crate::{db::api::view::Layer, prelude::*}; + use itertools::Itertools; + use quickcheck::TestResult; + use rand::prelude::*; + use rayon::prelude::*; + + #[test] + fn windowed_graph_vertices_degree() { + let vs = vec![ + (1, 1, 2), + (2, 1, 3), + (-1, 2, 1), + (0, 1, 1), + (7, 3, 2), + (1, 1, 1), + ]; + + let g = Graph::new(); + + for (t, src, dst) in &vs { + g.add_edge(*t, *src, *dst, NO_PROPS, None).unwrap(); + } + + let wg = WindowedGraph::new(g, -1, 1); + + let actual = wg + .vertices() + .iter() + .map(|v| (v.id(), v.degree())) + .collect::>(); + + let expected = vec![(1, 2), (2, 1)]; + + assert_eq!(actual, expected); + } + + #[test] + fn windowed_graph_edge() { + let vs = vec![ + (1, 1, 2), + (2, 1, 3), + (-1, 2, 1), + (0, 1, 1), + (7, 3, 2), + (1, 1, 1), + ]; + + let g = Graph::new(); + + for (t, src, dst) in vs { + g.add_edge(t, src, dst, NO_PROPS, None).unwrap(); + } + + let wg = g.window(i64::MIN, i64::MAX); + assert_eq!(wg.edge(1, 
3).unwrap().src().id(), 1); + assert_eq!(wg.edge(1, 3).unwrap().dst().id(), 3); + } + + #[test] + fn windowed_graph_vertex_edges() { + let vs = vec![ + (1, 1, 2), + (2, 1, 3), + (-1, 2, 1), + (0, 1, 1), + (7, 3, 2), + (1, 1, 1), + ]; + + let g = Graph::new(); + + for (t, src, dst) in &vs { + g.add_edge(*t, *src, *dst, NO_PROPS, None).unwrap(); + } + + let wg = WindowedGraph::new(g, -1, 1); + + assert_eq!(wg.vertex(1).unwrap().id(), 1); + } + + #[test] + fn graph_has_vertex_check_fail() { + let vs: Vec<(i64, u64)> = vec![ + (1, 0), + (-100, 262), + // (327226439, 108748364996394682), + (1, 9135428456135679950), + // (0, 1), + // (2, 2), + ]; + let g = Graph::new(); + + for (t, v) in &vs { + g.add_vertex(*t, *v, NO_PROPS) + .map_err(|err| println!("{:?}", err)) + .ok(); + } + + let wg = WindowedGraph::new(g, 1, 2); + assert!(!wg.has_vertex(262)) + } + + #[quickcheck] + fn windowed_graph_has_vertex(mut vs: Vec<(i64, u64)>) -> TestResult { + if vs.is_empty() { + return TestResult::discard(); + } + + vs.sort_by_key(|v| v.1); // Sorted by vertex + vs.dedup_by_key(|v| v.1); // Have each vertex only once to avoid headaches + vs.sort_by_key(|v| v.0); // Sorted by time + + let rand_start_index = thread_rng().gen_range(0..vs.len()); + let rand_end_index = thread_rng().gen_range(rand_start_index..vs.len()); + + let g = Graph::new(); + + for (t, v) in &vs { + g.add_vertex(*t, *v, NO_PROPS) + .map_err(|err| println!("{:?}", err)) + .ok(); + } + + let start = vs.get(rand_start_index).expect("start index in range").0; + let end = vs.get(rand_end_index).expect("end index in range").0; + + let wg = WindowedGraph::new(g, start, end); + + let rand_test_index: usize = thread_rng().gen_range(0..vs.len()); + + let (i, v) = vs.get(rand_test_index).expect("test index in range"); + if (start..end).contains(i) { + if wg.has_vertex(*v) { + TestResult::passed() + } else { + TestResult::error(format!( + "Vertex {:?} was not in window {:?}", + (i, v), + start..end + )) + } + } else if 
!wg.has_vertex(*v) { + TestResult::passed() + } else { + TestResult::error(format!( + "Vertex {:?} was in window {:?}", + (i, v), + start..end + )) + } + } + + #[quickcheck] + fn windowed_graph_has_edge(mut edges: Vec<(i64, (u64, u64))>) -> TestResult { + if edges.is_empty() { + return TestResult::discard(); + } + + edges.sort_by_key(|e| e.1); // Sorted by edge + edges.dedup_by_key(|e| e.1); // Have each edge only once to avoid headaches + edges.sort_by_key(|e| e.0); // Sorted by time + + let rand_start_index = thread_rng().gen_range(0..edges.len()); + let rand_end_index = thread_rng().gen_range(rand_start_index..edges.len()); + + let g = Graph::new(); + + for (t, e) in &edges { + g.add_edge(*t, e.0, e.1, NO_PROPS, None).unwrap(); + } + + let start = edges.get(rand_start_index).expect("start index in range").0; + let end = edges.get(rand_end_index).expect("end index in range").0; + + let wg = WindowedGraph::new(g, start, end); + + let rand_test_index: usize = thread_rng().gen_range(0..edges.len()); + + let (i, e) = edges.get(rand_test_index).expect("test index in range"); + if (start..end).contains(i) { + if wg.has_edge(e.0, e.1, Layer::All) { + TestResult::passed() + } else { + TestResult::error(format!( + "Edge {:?} was not in window {:?}", + (i, e), + start..end + )) + } + } else if !wg.has_edge(e.0, e.1, Layer::All) { + TestResult::passed() + } else { + TestResult::error(format!("Edge {:?} was in window {:?}", (i, e), start..end)) + } + } + + #[quickcheck] + fn windowed_graph_edge_count( + mut edges: Vec<(i64, (u64, u64))>, + window: Range, + ) -> TestResult { + if window.end < window.start { + return TestResult::discard(); + } + edges.sort_by_key(|e| e.1); // Sorted by edge + edges.dedup_by_key(|e| e.1); // Have each edge only once to avoid headaches + + let true_edge_count = edges.iter().filter(|e| window.contains(&e.0)).count(); + + let g = Graph::new(); + + for (t, e) in &edges { + g.add_edge(*t, e.0, e.1, [("test".to_owned(), Prop::Bool(true))], None) + 
.unwrap(); + } + + let wg = WindowedGraph::new(g, window.start, window.end); + if wg.count_edges() != true_edge_count { + println!( + "failed, g.num_edges() = {}, true count = {}", + wg.count_edges(), + true_edge_count + ); + println!("g.edges() = {:?}", wg.edges().collect_vec()); + } + TestResult::from_bool(wg.count_edges() == true_edge_count) + } + + #[quickcheck] + fn trivial_window_has_all_edges(edges: Vec<(i64, u64, u64)>) -> bool { + let g = Graph::new(); + edges + .into_par_iter() + .filter(|e| e.0 < i64::MAX) + .for_each(|(t, src, dst)| { + g.add_edge(t, src, dst, [("test".to_owned(), Prop::Bool(true))], None) + .unwrap(); + }); + let w = g.window(i64::MIN, i64::MAX); + g.edges() + .all(|e| w.has_edge(e.src().id(), e.dst().id(), Layer::All)) + } + + #[quickcheck] + fn large_vertex_in_window(dsts: Vec) -> bool { + let dsts: Vec = dsts.into_iter().unique().collect(); + let n = dsts.len(); + let g = Graph::new(); + + for dst in dsts { + let t = 1; + g.add_edge(t, 0, dst, NO_PROPS, None).unwrap(); + } + let w = g.window(i64::MIN, i64::MAX); + w.count_edges() == n + } + + #[test] + fn windowed_graph_vertex_ids() { + let vs = vec![(1, 1, 2), (3, 3, 4), (5, 5, 6), (7, 7, 1)]; + + let args = vec![(i64::MIN, 8), (i64::MIN, 2), (i64::MIN, 4), (3, 6)]; + + let expected = vec![ + vec![1, 2, 3, 4, 5, 6, 7], + vec![1, 2], + vec![1, 2, 3, 4], + vec![3, 4, 5, 6], + ]; + + let g = Graph::new(); + + for (t, src, dst) in &vs { + g.add_edge(*t, *src, *dst, NO_PROPS, None).unwrap(); + } + + let res: Vec<_> = (0..=3) + .map(|i| { + let wg = g.window(args[i].0, args[i].1); + let mut e = wg.vertices().id().collect::>(); + e.sort(); + e + }) + .collect_vec(); + + assert_eq!(res, expected); + + let g = Graph::new(); + for (src, dst, t) in &vs { + g.add_edge(*src, *dst, *t, NO_PROPS, None).unwrap(); + } + let res: Vec<_> = (0..=3) + .map(|i| { + let wg = g.window(args[i].0, args[i].1); + let mut e = wg.vertices().id().collect::>(); + e.sort(); + e + }) + .collect_vec(); + 
assert_eq!(res, expected); + } + + #[test] + fn windowed_graph_vertices() { + let vs = vec![ + (1, 1, 2), + (2, 1, 3), + (-1, 2, 1), + (0, 1, 1), + (7, 3, 2), + (1, 1, 1), + ]; + + let g = Graph::new(); + + g.add_vertex( + 0, + 1, + [("type", "wallet".into_prop()), ("cost", 99.5.into_prop())], + ) + .map_err(|err| println!("{:?}", err)) + .ok(); + + g.add_vertex( + -1, + 2, + [("type", "wallet".into_prop()), ("cost", 10.0.into_prop())], + ) + .map_err(|err| println!("{:?}", err)) + .ok(); + + g.add_vertex( + 6, + 3, + [("type", "wallet".into_prop()), ("cost", 76.2.into_prop())], + ) + .map_err(|err| println!("{:?}", err)) + .ok(); + + for (t, src, dst) in &vs { + g.add_edge(*t, *src, *dst, [("eprop", "commons")], None) + .unwrap(); + } + + let wg = g.window(-2, 0); + + let actual = wg.vertices().id().collect::<Vec<_>>(); + + let expected = vec![1, 2]; + + assert_eq!(actual, expected); + + // Rebuild the same vertices and edges (without edge props) in a fresh graph; the same window must yield the same vertex ids + let g = Graph::new(); + + g.add_vertex( + 0, + 1, + [("type", "wallet".into_prop()), ("cost", 99.5.into_prop())], + ) + .map_err(|err| println!("{:?}", err)) + .ok(); + + g.add_vertex( + -1, + 2, + [("type", "wallet".into_prop()), ("cost", 10.0.into_prop())], + ) + .map_err(|err| println!("{:?}", err)) + .ok(); + + g.add_vertex( + 6, + 3, + [("type", "wallet".into_prop()), ("cost", 76.2.into_prop())], + ) + .map_err(|err| println!("{:?}", err)) + .ok(); + + for (t, src, dst) in &vs { + g.add_edge(*t, *src, *dst, NO_PROPS, None).unwrap(); + } + + let expected = g.window(-2, 0).vertices().id().collect::<Vec<_>>(); + + assert_eq!(actual, expected); + } +} diff --git a/raphtory/src/db/graph_immutable.rs b/raphtory/src/db/graph_immutable.rs deleted file mode 100644 index 5a133583a9..0000000000 --- a/raphtory/src/db/graph_immutable.rs +++ /dev/null @@ -1,729 +0,0 @@ -//! Defines the `ImmutableGraph` struct, which represents a raphtory graph in a frozen state. -//! 
This graph can be queried in a read-only format avoiding any locks placed when using a -//! non-immutable graph. -//! -//! # Examples -//! -//! ```rust -//! use raphtory::db::graph::Graph; -//! use raphtory::db::view_api::*; -//! -//! let graph = Graph::new(2); -//! // Add vertices and edges -//! -//! let immutable_graph = graph.freeze(); -//! ``` - -use crate::core::edge_ref::EdgeRef; -use crate::core::tgraph::TemporalGraph; -use crate::core::tgraph_shard::ImmutableTGraphShard; -use crate::core::utils; -use crate::core::vertex_ref::{LocalVertexRef, VertexRef}; -use crate::core::Direction; -use crate::db::graph::Graph; -use itertools::Itertools; -use rustc_hash::FxHashMap; -use serde::{Deserialize, Serialize}; -use std::cmp::{max, min}; -use std::iter; -use std::sync::Arc; - -use super::view_api::internal::GraphViewInternalOps; - -/// A raphtory graph in a frozen state that is read-only. -/// This graph can be queried in a read-only format avoiding any locks placed when using a -/// non-immutable graph. -/// -/// # Examples -/// -/// ```rust -/// use raphtory::db::graph::Graph; -/// use raphtory::db::view_api::*; -/// -/// let graph = Graph::new(2); -/// // Add vertices and edges -/// -/// let immutable_graph = graph.freeze(); -/// ``` -#[derive(Debug, Clone, Serialize, Deserialize)] -pub struct ImmutableGraph { - pub(crate) nr_shards: usize, - pub(crate) shards: Vec>, - pub(crate) layer_ids: Arc>, -} - -/// Failure if there is an issue with unfreezing a frozen graph -#[derive(Debug, PartialEq)] -pub struct UnfreezeFailure; - -/// Implements the `ImmutableGraph` struct. -impl ImmutableGraph { - /// Unfreeze the immutable graph and convert it to a mutable `Graph`. 
- /// - /// # Examples - /// - /// ```rust - /// use raphtory::db::graph::Graph; - /// use raphtory::db::view_api::*; - /// - /// let graph = Graph::new(2); - /// // Add vertices and edges - /// let immutable_graph = graph.freeze(); - /// // Unfreeze the graph - /// let graph = immutable_graph.unfreeze().unwrap(); - /// ``` - pub fn unfreeze(self) -> Result { - let mut shards = Vec::with_capacity(self.shards.len()); - for shard in self.shards { - match shard.unfreeze() { - Ok(t) => shards.push(t), - Err(_) => return Err(UnfreezeFailure), - } - } - Ok(Graph::new_from_frozen( - self.nr_shards, - shards, - Arc::new(parking_lot::RwLock::new((*self.layer_ids).clone())), - )) - } - - /// Get the shard id for a given global vertex id. - /// - /// # Examples - /// - /// ```rust - /// use raphtory::db::graph::Graph; - /// use raphtory::db::view_api::*; - /// - /// let graph = Graph::new(2); - /// graph.add_vertex(0, 1, &vec![]).unwrap(); - /// // ... Add vertices and edges ... - /// let immutable_graph = graph.freeze(); - /// // Unfreeze the graph - /// immutable_graph.shard_id(1); - /// ``` - pub fn shard_id(&self, g_id: u64) -> usize { - utils::get_shard_id_from_global_vid(g_id, self.nr_shards) - } - - /// Get an immutable graph shard for a given global vertex id. - /// - /// # Examples - /// - /// ```rust - /// use raphtory::db::graph::Graph; - /// use raphtory::db::view_api::*; - /// - /// let graph = Graph::new(2); - /// graph.add_vertex(0, 1, &vec![]).unwrap(); - /// // ... Add vertices and edges ... - /// let immutable_graph = graph.freeze(); - /// // Unfreeze the graph - /// let shard = immutable_graph.get_shard_from_id(1); - /// ``` - pub fn get_shard_from_id(&self, g_id: u64) -> &ImmutableTGraphShard { - &self.shards[self.shard_id(g_id)] - } - - /// Get an immutable graph shard for a given vertex. 
- /// - pub fn get_shard_from_v(&self, v: VertexRef) -> &ImmutableTGraphShard { - match v { - VertexRef::Local(local) => &self.shards[local.shard_id], - VertexRef::Remote(g_id) => &self.shards[self.shard_id(g_id)], - } - } - - pub fn get_shard_from_local_v( - &self, - v: LocalVertexRef, - ) -> &ImmutableTGraphShard { - &self.shards[v.shard_id] - } - - /// Get an immutable graph shard for a given edge. - /// - pub fn get_shard_from_e(&self, e: EdgeRef) -> &ImmutableTGraphShard { - &self.shards[e.shard()] - } - - // Get the earliest time in the graph. - /// - /// # Examples - /// - /// ```rust - /// use raphtory::db::graph::Graph; - /// use raphtory::db::view_api::*; - /// - /// let graph = Graph::new(2); - /// graph.add_vertex(0, 1, &vec![]).unwrap(); - /// // ... Add vertices and edges ... - /// let immutable_graph = graph.freeze(); - /// // Unfreeze the graph - /// let time = immutable_graph.earliest_time(); - /// ``` - pub fn earliest_time(&self) -> Option { - let min_from_shards = self.shards.iter().map(|shard| shard.earliest_time()).min(); - min_from_shards.filter(|&min| min != i64::MAX) - } - - // Get the latest time in the graph. - /// - /// # Examples - /// - /// ```rust - /// use raphtory::db::graph::Graph; - /// use raphtory::db::view_api::*; - /// - /// let graph = Graph::new(2); - /// graph.add_vertex(0, 1, &vec![]).unwrap(); - /// // ... Add vertices and edges ... - /// let immutable_graph = graph.freeze(); - /// // Unfreeze the graph - /// let time = immutable_graph.latest_time(); - /// ``` - pub fn latest_time(&self) -> Option { - let max_from_shards = self.shards.iter().map(|shard| shard.latest_time()).max(); - max_from_shards.filter(|&max| max != i64::MIN) - } - - /// Get the degree for a vertex in the graph given its direction. - pub fn degree(&self, v: LocalVertexRef, d: Direction) -> usize { - self.get_shard_from_local_v(v).degree(v, d, None) - } - - /// Get all vertices in the graph. 
- /// - /// # Examples - /// - /// ```rust - /// use raphtory::db::graph::Graph; - /// use raphtory::db::view_api::*; - /// - /// let graph = Graph::new(2); - /// graph.add_vertex(0, 1, &vec![]).unwrap(); - /// // ... Add vertices and edges ... - /// let immutable_graph = graph.freeze(); - /// // Unfreeze the graph - /// let vertices = immutable_graph.vertices(); - /// ``` - pub fn vertices(&self) -> Box + Send + '_> { - Box::new(self.shards.iter().flat_map(|s| s.vertices())) - } - - /// Get all edges in the graph. - /// - /// # Examples - /// - /// ```rust - /// use raphtory::db::graph::Graph; - /// use raphtory::db::view_api::*; - /// - /// let graph = Graph::new(2); - /// graph.add_edge(0, 1, 1, &vec![], None).unwrap(); - /// // ... Add vertices and edges ... - /// let immutable_graph = graph.freeze(); - /// // Unfreeze the graph - /// let edges = immutable_graph.edges(); - /// ``` - pub fn edges(&self) -> Box + Send + '_> { - Box::new(self.vertices().flat_map(|v| { - self.get_shard_from_local_v(v) - .vertex_edges(v, Direction::OUT, None) - })) - } - - /// Get number of edges in the graph. - /// - /// # Examples - /// - /// ```rust - /// use raphtory::db::graph::Graph; - /// use raphtory::db::view_api::*; - /// - /// let graph = Graph::new(2); - /// graph.add_edge(0, 1, 2, &vec![], None).unwrap(); - /// // ... Add vertices and edges ... 
- /// let immutable_graph = graph.freeze(); - /// // Unfreeze the graph - /// let num_edges = immutable_graph.num_edges(); - /// ``` - pub fn num_edges(&self) -> usize { - self.shards - .iter() - .map(|shard| shard.out_edges_len(None)) - .sum() - } - - fn localise_edge(&self, src: VertexRef, dst: VertexRef) -> (usize, VertexRef, VertexRef) { - match src { - VertexRef::Local(local_src) => match dst { - VertexRef::Local(local_dst) => { - if local_src.shard_id == local_dst.shard_id { - (local_src.shard_id, src, dst) - } else { - ( - local_src.shard_id, - src, - VertexRef::Remote(self.vertex_id(local_dst)), - ) - } - } - VertexRef::Remote(_) => (local_src.shard_id, src, dst), - }, - VertexRef::Remote(gid) => match dst { - VertexRef::Local(local_dst) => (local_dst.shard_id, src, dst), - VertexRef::Remote(_) => (self.shard_id(gid), src, dst), - }, - } - } -} - -impl GraphViewInternalOps for ImmutableGraph { - fn local_vertex(&self, v: VertexRef) -> Option { - self.get_shard_from_v(v).local_vertex(v) - } - - fn local_vertex_window( - &self, - v: VertexRef, - t_start: i64, - t_end: i64, - ) -> Option { - self.get_shard_from_v(v) - .local_vertex_window(v, t_start..t_end) - } - - fn get_unique_layers_internal(&self) -> Vec { - let a = iter::once(0); - let b = self.layer_ids.values().copied(); - a.chain(b).collect_vec() - } - - fn get_layer_name_by_id(&self, layer_id: usize) -> String { - self.layer_ids - .iter() - .find_map(|(name, &id)| (layer_id == id).then_some(name)) - .expect(&format!("layer id '{layer_id}' doesn't exist")) - .to_string() - } - - fn get_layer(&self, key: Option<&str>) -> Option { - match key { - None => Some(0), - Some(key) => self.layer_ids.get(key).copied(), - } - } - - fn view_start(&self) -> Option { - self.earliest_time_global() - } - - fn view_end(&self) -> Option { - self.latest_time_global().map(|t| t + 1) // so it is exclusive - } - - fn earliest_time_global(&self) -> Option { - let min_from_shards = self.shards.iter().map(|shard| 
shard.earliest_time()).min(); - min_from_shards.filter(|&min| min != i64::MAX) - } - - fn earliest_time_window(&self, t_start: i64, t_end: i64) -> Option { - //FIXME: this is not correct, should actually be the earliest activity in window - let earliest = self.earliest_time_global()?; - if earliest > t_end { - None - } else { - Some(max(earliest, t_start)) - } - } - - fn latest_time_global(&self) -> Option { - let max_from_shards = self.shards.iter().map(|shard| shard.latest_time()).max(); - max_from_shards.filter(|&max| max != i64::MIN) - } - - fn latest_time_window(&self, t_start: i64, t_end: i64) -> Option { - //FIXME: this is not correct, should actually be the latest activity in window - let latest = self.latest_time_global()?; - if latest < t_start { - None - } else { - Some(min(latest, t_end)) - } - } - - fn vertices_len(&self) -> usize { - self.shards.iter().map(|shard| shard.len()).sum() - } - - fn vertices_len_window(&self, t_start: i64, t_end: i64) -> usize { - //FIXME: This nees to be optimised ideally - self.shards - .iter() - .map(|shard| shard.vertices_window(t_start..t_end).count()) - .sum() - } - - fn edges_len(&self, layer: Option) -> usize { - let vs: Vec = self - .shards - .iter() - .map(|shard| shard.out_edges_len(layer)) - .collect(); - vs.iter().sum() - } - - fn edges_len_window(&self, t_start: i64, t_end: i64, layer: Option) -> usize { - self.shards - .iter() - .map(|shard| shard.out_edges_len_window(&(t_start..t_end), layer)) - .sum() - } - - fn has_edge_ref(&self, src: VertexRef, dst: VertexRef, layer: usize) -> bool { - let (shard, src, dst) = self.localise_edge(src, dst); - self.shards[shard].has_edge(src, dst, layer) - } - - fn has_edge_ref_window( - &self, - src: VertexRef, - dst: VertexRef, - t_start: i64, - t_end: i64, - layer: usize, - ) -> bool { - let (shard, src, dst) = self.localise_edge(src, dst); - self.shards[shard].has_edge_window(src, dst, t_start..t_end, layer) - } - - fn has_vertex_ref(&self, v: VertexRef) -> bool { - 
self.get_shard_from_v(v).has_vertex(v) - } - - fn has_vertex_ref_window(&self, v: VertexRef, t_start: i64, t_end: i64) -> bool { - self.get_shard_from_v(v) - .has_vertex_window(v, t_start..t_end) - } - - fn degree(&self, v: LocalVertexRef, d: Direction, layer: Option) -> usize { - self.get_shard_from_local_v(v).degree(v, d, layer) - } - - fn degree_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - d: Direction, - layer: Option, - ) -> usize { - self.get_shard_from_local_v(v) - .degree_window(v, t_start..t_end, d, layer) - } - - fn vertex_ref(&self, v: u64) -> Option { - self.get_shard_from_id(v).vertex(v) - } - - fn vertex_id(&self, v: LocalVertexRef) -> u64 { - self.shards[v.shard_id].vertex_id(v) - } - - fn vertex_ref_window(&self, v: u64, t_start: i64, t_end: i64) -> Option { - self.get_shard_from_id(v).vertex_window(v, t_start..t_end) - } - - fn vertex_earliest_time(&self, v: LocalVertexRef) -> Option { - self.get_shard_from_local_v(v).vertex_earliest_time(v) - } - - fn vertex_earliest_time_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - ) -> Option { - self.get_shard_from_local_v(v) - .vertex_earliest_time_window(v, t_start..t_end) - } - - fn vertex_latest_time(&self, v: LocalVertexRef) -> Option { - self.get_shard_from_local_v(v).vertex_latest_time(v) - } - - fn vertex_latest_time_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - ) -> Option { - self.get_shard_from_local_v(v) - .vertex_latest_time_window(v, t_start..t_end) - } - - fn vertex_refs(&self) -> Box + Send> { - let shards = self.shards.clone(); - Box::new(shards.into_iter().flat_map(|s| s.vertices())) - } - - fn vertex_refs_window( - &self, - t_start: i64, - t_end: i64, - ) -> Box + Send> { - let shards = self.shards.clone(); - Box::new( - shards - .into_iter() - .flat_map(move |s| s.vertices_window(t_start..t_end)), - ) - } - - fn vertex_refs_shard(&self, shard: usize) -> Box + Send> { - let shard = self.shards[shard].clone(); - 
Box::new(shard.vertices()) - } - - fn vertex_refs_window_shard( - &self, - shard: usize, - t_start: i64, - t_end: i64, - ) -> Box + Send> { - let shard = self.shards[shard].clone(); - Box::new(shard.vertices_window(t_start..t_end)) - } - - fn edge_ref(&self, src: VertexRef, dst: VertexRef, layer: usize) -> Option { - let (shard_id, src, dst) = self.localise_edge(src, dst); - self.shards[shard_id].edge(src, dst, layer) - } - - fn edge_ref_window( - &self, - src: VertexRef, - dst: VertexRef, - t_start: i64, - t_end: i64, - layer: usize, - ) -> Option { - let (shard_id, src, dst) = self.localise_edge(src, dst); - self.shards[shard_id].edge_window(src, dst, t_start..t_end, layer) - } - - fn edge_refs(&self, layer: Option) -> Box + Send> { - //FIXME: needs low-level primitive - let g = self.clone(); - match layer { - Some(layer) => Box::new( - self.vertex_refs() - .flat_map(move |v| g.vertex_edges(v, Direction::OUT, Some(layer))), - ), - None => Box::new( - self.vertex_refs() - .flat_map(move |v| g.vertex_edges(v, Direction::OUT, None)), - ), - } - } - - fn edge_refs_window( - &self, - t_start: i64, - t_end: i64, - layer: Option, - ) -> Box + Send> { - //FIXME: needs low-level primitive - let g = self.clone(); - Box::new( - self.vertex_refs() - .flat_map(move |v| g.vertex_edges_window(v, t_start, t_end, Direction::OUT, layer)), - ) - } - - fn vertex_edges( - &self, - v: LocalVertexRef, - d: Direction, - layer: Option, - ) -> Box + Send> { - Box::new(self.get_shard_from_local_v(v).vertex_edges(v, d, layer)) - } - - fn vertex_edges_t( - &self, - v: LocalVertexRef, - d: Direction, - layer: Option, - ) -> Box + Send> { - // FIXME: missing low-level implementation - Box::new(self.get_shard_from_local_v(v).vertex_edges_window_t( - v, - i64::MIN..i64::MAX, - d, - layer, - )) - } - - fn vertex_edges_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - d: Direction, - layer: Option, - ) -> Box + Send> { - Box::new( - self.get_shard_from_local_v(v) - 
.vertex_edges_window(v, t_start..t_end, d, layer), - ) - } - - fn vertex_edges_window_t( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - d: Direction, - layer: Option, - ) -> Box + Send> { - Box::new( - self.get_shard_from_local_v(v) - .vertex_edges_window_t(v, t_start..t_end, d, layer), - ) - } - - fn neighbours( - &self, - v: LocalVertexRef, - d: Direction, - layer: Option, - ) -> Box + Send> { - Box::new(self.get_shard_from_local_v(v).neighbours(v, d, layer)) - } - - fn neighbours_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - d: Direction, - layer: Option, - ) -> Box + Send> { - Box::new( - self.get_shard_from_local_v(v) - .neighbours_window(v, t_start..t_end, d, layer), - ) - } - - fn static_vertex_prop(&self, v: LocalVertexRef, name: String) -> Option { - self.get_shard_from_local_v(v).static_vertex_prop(v, name) - } - - fn static_vertex_prop_names(&self, v: LocalVertexRef) -> Vec { - self.get_shard_from_local_v(v).static_vertex_prop_names(v) - } - - fn temporal_vertex_prop_names(&self, v: LocalVertexRef) -> Vec { - self.get_shard_from_local_v(v).temporal_vertex_prop_names(v) - } - - fn temporal_vertex_prop_vec( - &self, - v: LocalVertexRef, - name: String, - ) -> Vec<(i64, crate::core::Prop)> { - self.get_shard_from_local_v(v) - .temporal_vertex_prop_vec(v, name) - } - - fn vertex_timestamps(&self, v: LocalVertexRef) -> Vec { - self.get_shard_from_local_v(v).vertex_timestamps(v) - } - - fn vertex_timestamps_window(&self, v: LocalVertexRef, t_start: i64, t_end: i64) -> Vec { - self.get_shard_from_local_v(v) - .vertex_timestamps_window(v, t_start..t_end) - } - - fn temporal_vertex_prop_vec_window( - &self, - v: LocalVertexRef, - name: String, - t_start: i64, - t_end: i64, - ) -> Vec<(i64, crate::core::Prop)> { - self.get_shard_from_local_v(v) - .temporal_vertex_prop_vec_window(v, name, t_start..t_end) - } - - fn temporal_vertex_props( - &self, - v: LocalVertexRef, - ) -> std::collections::HashMap> { - 
self.get_shard_from_local_v(v).temporal_vertex_props(v) - } - - fn temporal_vertex_props_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - ) -> std::collections::HashMap> { - self.get_shard_from_local_v(v) - .temporal_vertex_props_window(v, t_start..t_end) - } - - fn static_edge_prop(&self, e: EdgeRef, name: String) -> Option { - self.get_shard_from_e(e).static_edge_prop(e, name) - } - - fn static_edge_prop_names(&self, e: EdgeRef) -> Vec { - self.get_shard_from_e(e).static_edge_prop_names(e) - } - - fn temporal_edge_prop_names(&self, e: EdgeRef) -> Vec { - self.get_shard_from_e(e).temporal_edge_prop_names(e) - } - - fn temporal_edge_props_vec(&self, e: EdgeRef, name: String) -> Vec<(i64, crate::core::Prop)> { - self.get_shard_from_e(e).temporal_edge_prop_vec(e, name) - } - - fn temporal_edge_props_vec_window( - &self, - e: EdgeRef, - name: String, - t_start: i64, - t_end: i64, - ) -> Vec<(i64, crate::core::Prop)> { - self.get_shard_from_e(e) - .temporal_edge_props_vec_window(e, name, t_start..t_end) - } - - fn edge_timestamps(&self, e: EdgeRef, window: Option>) -> Vec { - self.get_shard_from_e(e).edge_timestamps(e, window) - } - - fn temporal_edge_props( - &self, - e: EdgeRef, - ) -> std::collections::HashMap> { - self.get_shard_from_e(e).temporal_edge_props(e) - } - - fn temporal_edge_props_window( - &self, - e: EdgeRef, - t_start: i64, - t_end: i64, - ) -> std::collections::HashMap> { - self.get_shard_from_e(e) - .temporal_edge_props_window(e, t_start..t_end) - } - - fn num_shards(&self) -> usize { - self.nr_shards - } -} diff --git a/raphtory/src/db/graph_layer.rs b/raphtory/src/db/graph_layer.rs deleted file mode 100644 index 26e6ef2c0b..0000000000 --- a/raphtory/src/db/graph_layer.rs +++ /dev/null @@ -1,426 +0,0 @@ -use crate::core::edge_ref::EdgeRef; -use crate::core::vertex_ref::{LocalVertexRef, VertexRef}; -use crate::core::{Direction, Prop}; -use crate::db::view_api::internal::GraphViewInternalOps; -use itertools::Itertools; -use 
std::{collections::HashMap, ops::Range}; - -#[derive(Debug, Clone)] -pub struct LayeredGraph { - /// The underlying `Graph` object. - pub graph: G, - /// The layer this graphs points to. - pub layer: usize, -} - -impl LayeredGraph { - pub fn new(graph: G, layer: usize) -> Self { - Self { graph, layer } - } - - /// Return None if the intersection between the previously requested layers and the layer of - /// this view is null - fn constrain(&self, layer: Option) -> Option { - match layer { - None => Some(self.layer), - Some(layer) if layer == self.layer => Some(layer), - _ => None, - } - } -} - -impl GraphViewInternalOps for LayeredGraph { - fn get_unique_layers_internal(&self) -> Vec { - let layers = self.graph.get_unique_layers_internal(); - layers - .into_iter() - .filter(|id| *id == self.layer) - .collect_vec() - } - - fn get_layer(&self, key: Option<&str>) -> Option { - self.graph.get_layer(key) - } - - fn get_layer_name_by_id(&self, layer_id: usize) -> String { - self.graph.get_layer_name_by_id(layer_id) - } - - fn view_start(&self) -> Option { - self.graph.view_start() - } - - fn view_end(&self) -> Option { - self.graph.view_end() - } - - fn earliest_time_global(&self) -> Option { - self.graph.earliest_time_global() - } - - fn earliest_time_window(&self, t_start: i64, t_end: i64) -> Option { - self.graph.earliest_time_window(t_start, t_end) - } - - fn latest_time_global(&self) -> Option { - self.graph.latest_time_global() - } - - fn latest_time_window(&self, t_start: i64, t_end: i64) -> Option { - self.graph.latest_time_window(t_start, t_end) - } - - fn vertices_len(&self) -> usize { - self.graph.vertices_len() - } - - fn vertices_len_window(&self, t_start: i64, t_end: i64) -> usize { - self.graph.vertices_len_window(t_start, t_end) - } - - fn edges_len(&self, layer: Option) -> usize { - self.constrain(layer) - .map(|layer| self.graph.edges_len(Some(layer))) - .unwrap_or(0) - } - - fn edges_len_window(&self, t_start: i64, t_end: i64, layer: Option) -> usize { 
- self.constrain(layer) - .map(|layer| self.graph.edges_len_window(t_start, t_end, Some(layer))) - .unwrap_or(0) - } - - fn has_edge_ref(&self, src: VertexRef, dst: VertexRef, layer: usize) -> bool { - // FIXME: there is something wrong here, the layer should be able to be None, which would mean, whatever layer this is - layer == self.layer && self.graph.has_edge_ref(src, dst, layer) - } - - fn has_edge_ref_window( - &self, - src: VertexRef, - dst: VertexRef, - t_start: i64, - t_end: i64, - layer: usize, - ) -> bool { - layer == self.layer - && self - .graph - .has_edge_ref_window(src, dst, t_start, t_end, layer) - } - - fn has_vertex_ref(&self, v: VertexRef) -> bool { - self.graph.has_vertex_ref(v) - } - - fn has_vertex_ref_window(&self, v: VertexRef, t_start: i64, t_end: i64) -> bool { - self.graph.has_vertex_ref_window(v, t_start, t_end) - } - - fn degree(&self, v: LocalVertexRef, d: Direction, layer: Option) -> usize { - self.constrain(layer) - .map(|layer| self.graph.degree(v, d, Some(layer))) - .unwrap_or(0) - } - - fn degree_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - d: Direction, - layer: Option, - ) -> usize { - self.constrain(layer) - .map(|layer| self.graph.degree_window(v, t_start, t_end, d, Some(layer))) - .unwrap_or(0) - } - - fn vertex_ref(&self, v: u64) -> Option { - self.graph.vertex_ref(v) - } - - fn vertex_ref_window(&self, v: u64, t_start: i64, t_end: i64) -> Option { - self.graph.vertex_ref_window(v, t_start, t_end) - } - - fn vertex_earliest_time(&self, v: LocalVertexRef) -> Option { - self.graph.vertex_earliest_time(v) - } - - fn vertex_earliest_time_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - ) -> Option { - self.graph.vertex_earliest_time_window(v, t_start, t_end) - } - - fn vertex_latest_time(&self, v: LocalVertexRef) -> Option { - self.graph.vertex_latest_time(v) - } - - fn vertex_latest_time_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - ) -> Option { - 
self.graph.vertex_latest_time_window(v, t_start, t_end) - } - - fn vertex_refs(&self) -> Box + Send> { - self.graph.vertex_refs() - } - - fn vertex_refs_window( - &self, - t_start: i64, - t_end: i64, - ) -> Box + Send> { - self.graph.vertex_refs_window(t_start, t_end) - } - - fn vertex_refs_shard(&self, shard: usize) -> Box + Send> { - self.graph.vertex_refs_shard(shard) - } - - fn vertex_refs_window_shard( - &self, - shard: usize, - t_start: i64, - t_end: i64, - ) -> Box + Send> { - self.graph.vertex_refs_window_shard(shard, t_start, t_end) - } - - fn edge_ref(&self, src: VertexRef, dst: VertexRef, layer: usize) -> Option { - (layer == self.layer) - .then(|| self.graph.edge_ref(src, dst, layer)) - .flatten() - } - - fn edge_ref_window( - &self, - src: VertexRef, - dst: VertexRef, - t_start: i64, - t_end: i64, - layer: usize, - ) -> Option { - (layer == self.layer) - .then(|| self.graph.edge_ref_window(src, dst, t_start, t_end, layer)) - .flatten() - } - - fn edge_refs(&self, layer: Option) -> Box + Send> { - // TODO: create a function empty_iter which returns a boxed empty iterator so we use it in all these functions - self.constrain(layer) - .map(|layer| self.graph.edge_refs(Some(layer))) - .unwrap_or_else(|| Box::new(std::iter::empty())) - } - - fn edge_refs_window( - &self, - t_start: i64, - t_end: i64, - layer: Option, - ) -> Box + Send> { - self.constrain(layer) - .map(|layer| self.graph.edge_refs_window(t_start, t_end, Some(layer))) - .unwrap_or_else(|| Box::new(std::iter::empty())) - } - - fn vertex_edges_t( - &self, - v: LocalVertexRef, - d: Direction, - layer: Option, - ) -> Box + Send> { - self.constrain(layer) - .map(|layer| self.graph.vertex_edges_t(v, d, Some(layer))) - .unwrap_or(Box::new(std::iter::empty())) - } - - fn vertex_edges_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - d: Direction, - layer: Option, - ) -> Box + Send> { - self.constrain(layer) - .map(|layer| { - self.graph - .vertex_edges_window(v, t_start, t_end, d, 
Some(layer)) - }) - .unwrap_or_else(|| Box::new(std::iter::empty())) - } - - fn vertex_edges_window_t( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - d: Direction, - layer: Option, - ) -> Box + Send> { - self.constrain(layer) - .map(|layer| { - self.graph - .vertex_edges_window_t(v, t_start, t_end, d, Some(layer)) - }) - .unwrap_or_else(|| Box::new(std::iter::empty())) - } - - fn neighbours( - &self, - v: LocalVertexRef, - d: Direction, - layer: Option, - ) -> Box + Send> { - self.constrain(layer) - .map(|layer| self.graph.neighbours(v, d, Some(layer))) - .unwrap_or_else(|| Box::new(std::iter::empty())) - } - - fn neighbours_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - d: Direction, - layer: Option, - ) -> Box + Send> { - self.constrain(layer) - .map(|layer| { - self.graph - .neighbours_window(v, t_start, t_end, d, Some(layer)) - }) - .unwrap_or_else(|| Box::new(std::iter::empty())) - } - - fn static_vertex_prop(&self, v: LocalVertexRef, name: String) -> Option { - self.graph.static_vertex_prop(v, name) - } - - fn static_vertex_prop_names(&self, v: LocalVertexRef) -> Vec { - self.graph.static_vertex_prop_names(v) - } - - fn temporal_vertex_prop_names(&self, v: LocalVertexRef) -> Vec { - self.graph.temporal_vertex_prop_names(v) - } - - fn temporal_vertex_prop_vec(&self, v: LocalVertexRef, name: String) -> Vec<(i64, Prop)> { - self.graph.temporal_vertex_prop_vec(v, name) - } - - fn temporal_vertex_prop_vec_window( - &self, - v: LocalVertexRef, - name: String, - t_start: i64, - t_end: i64, - ) -> Vec<(i64, Prop)> { - self.graph - .temporal_vertex_prop_vec_window(v, name, t_start, t_end) - } - - fn temporal_vertex_props(&self, v: LocalVertexRef) -> HashMap> { - self.graph.temporal_vertex_props(v) - } - - fn temporal_vertex_props_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - ) -> HashMap> { - self.graph.temporal_vertex_props_window(v, t_start, t_end) - } - - fn static_edge_prop(&self, e: EdgeRef, name: 
String) -> Option { - self.graph.static_edge_prop(e, name) - } - - fn static_edge_prop_names(&self, e: EdgeRef) -> Vec { - self.graph.static_edge_prop_names(e) - } - - fn temporal_edge_prop_names(&self, e: EdgeRef) -> Vec { - self.graph.temporal_edge_prop_names(e) - } - - fn temporal_edge_props_vec(&self, e: EdgeRef, name: String) -> Vec<(i64, Prop)> { - self.graph.temporal_edge_props_vec(e, name) - } - - fn temporal_edge_props_vec_window( - &self, - e: EdgeRef, - name: String, - t_start: i64, - t_end: i64, - ) -> Vec<(i64, Prop)> { - self.graph - .temporal_edge_props_vec_window(e, name, t_start, t_end) - } - - fn temporal_edge_props(&self, e: EdgeRef) -> HashMap> { - self.graph.temporal_edge_props(e) - } - - fn temporal_edge_props_window( - &self, - e: EdgeRef, - t_start: i64, - t_end: i64, - ) -> HashMap> { - self.graph.temporal_edge_props_window(e, t_start, t_end) - } - - fn num_shards(&self) -> usize { - self.graph.num_shards() - } - - fn vertex_timestamps(&self, v: LocalVertexRef) -> Vec { - self.graph.vertex_timestamps(v) - } - - fn vertex_timestamps_window(&self, v: LocalVertexRef, t_start: i64, t_end: i64) -> Vec { - self.graph.vertex_timestamps_window(v, t_start, t_end) - } - - fn edge_timestamps(&self, e: EdgeRef, window: Option>) -> Vec { - self.graph.edge_timestamps(e, window) - } - - fn vertex_edges( - &self, - v: LocalVertexRef, - d: Direction, - layer: Option, - ) -> Box + Send> { - self.graph.vertex_edges(v, d, self.constrain(layer)) - } - - fn vertex_id(&self, v: LocalVertexRef) -> u64 { - self.graph.vertex_id(v) - } - - fn local_vertex(&self, v: VertexRef) -> Option { - self.graph.local_vertex(v) - } - - fn local_vertex_window( - &self, - v: VertexRef, - t_start: i64, - t_end: i64, - ) -> Option { - self.graph.local_vertex_window(v, t_start, t_end) - } -} diff --git a/raphtory/src/db/graph_window.rs b/raphtory/src/db/graph_window.rs deleted file mode 100644 index e7e822b572..0000000000 --- a/raphtory/src/db/graph_window.rs +++ /dev/null @@ -1,1424 
+0,0 @@ -//! A windowed view is a subset of a graph between a specific time window. -//! For example, lets say you wanted to run an algorithm each month over a graph, graph window -//! would allow you to split the graph into 30 day chunks to do so. -//! -//! This module also defines the `GraphWindow` trait, which represents a window of time over -//! which a graph can be queried. -//! -//! GraphWindowSet implements the `Iterator` trait, producing `WindowedGraph` views -//! for each perspective within it. -//! -//! # Types -//! -//! * `GraphWindowSet` - A struct that allows iterating over a Graph broken down into multiple -//! windowed views. It contains a `Graph` and an iterator of `Perspective`. -//! -//! * `WindowedGraph` - A struct that represents a windowed view of a `Graph`. -//! It contains a `Graph`, a start time (`t_start`) and an end time (`t_end`). -//! -//! # Traits -//! -//! * `GraphViewInternalOps` - A trait that provides operations to a `WindowedGraph` -//! used internally by the `GraphWindowSet`. -//! -//! # Examples -//! -//! ```rust -//! -//! use raphtory::db::graph::Graph; -//! use raphtory::db::view_api::*; -//! -//! let graph = Graph::new(2); -//! graph.add_edge(0, 1, 2, &vec![], None); -//! graph.add_edge(1, 1, 3, &vec![], None); -//! graph.add_edge(2, 2, 3, &vec![], None); -//! -//! let wg = graph.window(0, 1); -//! assert_eq!(wg.edge(1, 2, None).unwrap().src().id(), 1); -//! ``` - -use crate::core::edge_ref::EdgeRef; -use crate::core::time::IntoTime; -use crate::core::vertex_ref::{LocalVertexRef, VertexRef}; -use crate::core::{Direction, Prop}; -use crate::db::view_api::internal::GraphViewInternalOps; -use crate::db::view_api::GraphViewOps; -use std::cmp::{max, min}; -use std::{collections::HashMap, ops::Range}; - -/// A struct that represents a windowed view of a `Graph`. -#[derive(Debug, Clone)] -pub struct WindowedGraph { - /// The underlying `Graph` object. - pub graph: G, - /// The inclusive start time of the window. 
- pub t_start: i64, - /// The exclusive end time of the window. - pub t_end: i64, -} - -/// Implementation of the GraphViewInternalOps trait for WindowedGraph. -/// This trait provides operations to a `WindowedGraph` used internally by the `GraphWindowSet`. -/// *Note: All functions in this are bound by the time set in the windowed graph. -impl GraphViewInternalOps for WindowedGraph { - fn get_unique_layers_internal(&self) -> Vec { - self.graph.get_unique_layers_internal() - } - - fn get_layer(&self, key: Option<&str>) -> Option { - self.graph.get_layer(key) - } - - fn get_layer_name_by_id(&self, layer_id: usize) -> String { - self.graph.get_layer_name_by_id(layer_id) - } - - fn view_start(&self) -> Option { - Some(self.t_start) - } - - fn view_end(&self) -> Option { - Some(self.t_end) - } - - fn earliest_time_global(&self) -> Option { - self.graph.earliest_time_window(self.t_start, self.t_end) - } - - fn earliest_time_window(&self, t_start: i64, t_end: i64) -> Option { - self.graph - .earliest_time_window(self.actual_start(t_start), self.actual_end(t_end)) - } - - fn latest_time_global(&self) -> Option { - self.graph.latest_time_window(self.t_start, self.t_end) - } - - fn latest_time_window(&self, t_start: i64, t_end: i64) -> Option { - self.graph - .latest_time_window(self.actual_start(t_start), self.actual_end(t_end)) - } - - /// Returns the number of vertices in the windowed view. - fn vertices_len(&self) -> usize { - self.graph.vertices_len_window(self.t_start, self.t_end) - } - - /// Returns the number of vertices in the windowed view, for a window specified by start and end times. - /// - /// # Arguments - /// - /// * `t_start` - The inclusive start time of the window. - /// * `t_end` - The exclusive end time of the window. - /// - /// # Returns - /// - /// The number of vertices in the windowed view for the given window. 
- fn vertices_len_window(&self, t_start: i64, t_end: i64) -> usize { - self.graph - .vertices_len_window(self.actual_start(t_start), self.actual_end(t_end)) - } - - /// Returns the number of edges in the windowed view. - fn edges_len(&self, layer: Option) -> usize { - self.graph.edges_len_window(self.t_start, self.t_end, layer) - } - - /// Returns the number of edges in the windowed view, for a window specified by start and end times. - /// - /// # Arguments - /// - /// * `t_start` - The inclusive start time of the window. - /// * `t_end` - The exclusive end time of the window. - /// - /// # Returns - /// - /// The number of edges in the windowed view for the given window. - fn edges_len_window(&self, t_start: i64, t_end: i64, layer: Option) -> usize { - self.graph - .edges_len_window(self.actual_start(t_start), self.actual_end(t_end), layer) - } - - /// Check if there is an edge from src to dst in the window. - /// - /// # Arguments - /// - /// - `src` - The source vertex. - /// - `dst` - The destination vertex. - /// - /// # Returns - /// - /// A result containing `true` if there is an edge from src to dst in the window, `false` otherwise. - /// - /// # Errors - /// - /// Returns an error if either `src` or `dst` is not a valid vertex. - fn has_edge_ref(&self, src: VertexRef, dst: VertexRef, layer: usize) -> bool { - self.graph - .has_edge_ref_window(src, dst, self.t_start, self.t_end, layer) - } - - /// Check if there is an edge from src to dst in the window defined by t_start and t_end. - /// - /// # Arguments - /// - /// - `src` - The source vertex. - /// - `dst` - The destination vertex. - /// - `t_start` - The inclusive start time of the window. - /// - `t_end` - The exclusive end time of the window. - /// - /// # Returns - /// - /// A result containing `true` if there is an edge from src to dst in the window, `false` otherwise. - /// - /// # Errors - /// - /// Returns an error if either `src` or `dst` is not a valid vertex. 
- fn has_edge_ref_window( - &self, - src: VertexRef, - dst: VertexRef, - t_start: i64, - t_end: i64, - layer: usize, - ) -> bool { - self.graph.has_edge_ref_window( - src, - dst, - self.actual_start(t_start), - self.actual_end(t_end), - layer, - ) - } - - /// Check if a vertex v exists in the window. - /// - /// # Arguments - /// - /// - `v` - The vertex to check. - /// - /// # Returns - /// - /// A result containing `true` if the vertex exists in the window, `false` otherwise. - /// - /// # Errors - /// - /// Returns an error if `v` is not a valid vertex. - fn has_vertex_ref(&self, v: VertexRef) -> bool { - self.graph - .has_vertex_ref_window(v, self.t_start, self.t_end) - } - - /// Check if a vertex v exists in the window defined by t_start and t_end. - /// - /// # Arguments - /// - /// - `v` - The vertex to check. - /// - `t_start` - The inclusive start time of the window. - /// - `t_end` - The exclusive end time of the window. - /// - /// # Returns - /// - /// A result containing `true` if the vertex exists in the window, `false` otherwise. - /// - /// # Errors - /// - /// Returns an error if `v` is not a valid vertex. - fn has_vertex_ref_window(&self, v: VertexRef, t_start: i64, t_end: i64) -> bool { - self.graph - .has_vertex_ref_window(v, self.actual_start(t_start), self.actual_end(t_end)) - } - - /// Returns the number of edges from a vertex in the window. - /// - /// # Arguments - /// - /// - `v` - The vertex to check. - /// - `d` - The direction of the edges to count. - /// - /// # Returns - /// - /// A result containing the number of edges from the vertex in the window. - /// - /// # Errors - /// - /// Returns an error if `v` is not a valid vertex. - fn degree(&self, v: LocalVertexRef, d: Direction, layer: Option) -> usize { - self.graph - .degree_window(v, self.t_start, self.t_end, d, layer) - } - - /// Returns the number of edges from a vertex in the window defined by t_start and t_end. - /// - /// # Arguments - /// - /// - `v` - The vertex to check. 
- /// - `t_start` - The inclusive start time of the window. - /// - `t_end` - The exclusive end time of the window. - /// - `d` - The direction of the edges to count. - /// - /// # Returns - /// - /// A result containing the number of edges from the vertex in the window. - /// - /// # Errors - /// - /// Returns an error if `v` is not a valid vertex. - fn degree_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - d: Direction, - layer: Option, - ) -> usize { - self.graph.degree_window( - v, - self.actual_start(t_start), - self.actual_end(t_end), - d, - layer, - ) - } - - /// Get the reference of the vertex with ID v if it exists - /// - /// # Arguments - /// - /// - `v` - The ID of the vertex to get - /// - /// # Returns - /// - /// A result of an option containing the vertex reference if it exists, `None` otherwise. - /// - /// # Errors - /// - /// Returns an error if `v` is not a valid vertex. - fn vertex_ref(&self, v: u64) -> Option { - self.graph.vertex_ref_window(v, self.t_start, self.t_end) - } - - /// Get the reference of the vertex with ID v if it exists in a window - /// - /// # Arguments - /// - /// - `v` - The ID of the vertex to get - /// - `t_start` - The inclusive start time of the window. - /// - `t_end` - The exclusive end time of the window. - /// - /// # Returns - /// - /// A result of an option containing the vertex reference if it exists, `None` otherwise. - /// - /// # Errors - /// - /// Returns an error if `v` is not a valid vertex. 
- fn vertex_ref_window(&self, v: u64, t_start: i64, t_end: i64) -> Option { - self.graph - .vertex_ref_window(v, self.actual_start(t_start), self.actual_end(t_end)) - } - - fn vertex_earliest_time(&self, v: LocalVertexRef) -> Option { - self.graph - .vertex_earliest_time_window(v, self.t_start, self.t_end) - } - - fn vertex_earliest_time_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - ) -> Option { - self.graph.vertex_earliest_time_window( - v, - self.actual_start(t_start), - self.actual_end(t_end), - ) - } - - fn vertex_latest_time(&self, v: LocalVertexRef) -> Option { - self.graph - .vertex_latest_time_window(v, self.t_start, self.t_end) - } - - fn vertex_latest_time_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - ) -> Option { - self.graph - .vertex_latest_time_window(v, self.actual_start(t_start), self.actual_end(t_end)) - } - - /// Get an iterator over the references of all vertices as references - /// - /// # Returns - /// - /// An iterator over the references of all vertices - fn vertex_refs(&self) -> Box + Send> { - self.graph.vertex_refs_window(self.t_start, self.t_end) - } - - fn vertex_refs_window( - &self, - t_start: i64, - t_end: i64, - ) -> Box + Send> { - self.graph - .vertex_refs_window(self.actual_start(t_start), self.actual_end(t_end)) - } - - fn vertex_refs_shard(&self, shard: usize) -> Box + Send> { - self.graph - .vertex_refs_window_shard(shard, self.t_start, self.t_end) - } - - fn vertex_refs_window_shard( - &self, - shard: usize, - t_start: i64, - t_end: i64, - ) -> Box + Send> { - self.graph.vertex_refs_window_shard( - shard, - self.actual_start(t_start), - self.actual_end(t_end), - ) - } - - /// Get an iterator over the references of an edges as a reference - /// - /// # Arguments - /// - /// - `src` - The source vertex of the edge - /// - `dst` - The destination vertex of the edge - /// - /// # Returns - /// - /// A result of an option containing the edge reference if it exists, `None` otherwise. 
- /// - /// # Errors - /// - /// Returns an error if `src` or `dst` are not valid vertices. - fn edge_ref(&self, src: VertexRef, dst: VertexRef, layer: usize) -> Option { - self.graph - .edge_ref_window(src, dst, self.t_start, self.t_end, layer) - } - - /// Get an iterator over the references of an edges as a reference in a window - /// - /// # Arguments - /// - /// - `src` - The source vertex of the edge - /// - `dst` - The destination vertex of the edge - /// - `t_start` - The inclusive start time of the window. - /// - `t_end` - The exclusive end time of the window. - /// - /// # Returns - /// - /// A result of an option containing the edge reference if it exists, `None` otherwise. - /// - /// # Errors - /// - /// Returns an error if `src` or `dst` are not valid vertices. - fn edge_ref_window( - &self, - src: VertexRef, - dst: VertexRef, - t_start: i64, - t_end: i64, - layer: usize, - ) -> Option { - self.graph.edge_ref_window( - src, - dst, - self.actual_start(t_start), - self.actual_end(t_end), - layer, - ) - } - - /// Get an iterator of all edges as references - /// - /// # Returns - /// - /// An iterator over all edges as references - fn edge_refs(&self, layer: Option) -> Box + Send> { - self.graph.edge_refs_window(self.t_start, self.t_end, layer) - } - - /// Get an iterator of all edges as references in a window - /// - /// # Arguments - /// - /// - `t_start` - The inclusive start time of the window. - /// - `t_end` - The exclusive end time of the window. 
- /// - /// # Returns - /// - /// An iterator over all edges as references - fn edge_refs_window( - &self, - t_start: i64, - t_end: i64, - layer: Option, - ) -> Box + Send> { - self.graph - .edge_refs_window(self.actual_start(t_start), self.actual_end(t_end), layer) - } - - fn vertex_edges_t( - &self, - v: LocalVertexRef, - d: Direction, - layer: Option, - ) -> Box + Send> { - self.graph - .vertex_edges_window_t(v, self.t_start, self.t_end, d, layer) - } - - /// Get an iterator of all edges as references for a given vertex and direction in a window - /// - /// # Arguments - /// - /// - `v` - The vertex to get the edges for - /// - `t_start` - The inclusive start time of the window. - /// - `t_end` - The exclusive end time of the window. - /// - `d` - The direction of the edges - /// - /// # Returns - /// - /// An iterator over all edges in that vertex direction as references - fn vertex_edges_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - d: Direction, - layer: Option, - ) -> Box + Send> { - self.graph.vertex_edges_window( - v, - self.actual_start(t_start), - self.actual_end(t_end), - d, - layer, - ) - } - - /// Get an iterator of all edges as references for a given vertex and direction in a window - /// but exploded. This means, if a timestamp has two edges, they will be returned as two - /// seperate edges. - /// - /// # Arguments - /// - /// - `v` - The vertex to get the edges for - /// - `t_start` - The inclusive start time of the window. - /// - `t_end` - The exclusive end time of the window. 
- /// - `d` - The direction of the edges - /// - /// # Returns - /// - /// An iterator over all edges in that vertex direction as references - - fn vertex_edges_window_t( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - d: Direction, - layer: Option, - ) -> Box + Send> { - self.graph.vertex_edges_window_t( - v, - self.actual_start(t_start), - self.actual_end(t_end), - d, - layer, - ) - } - - /// Get the neighbours of a vertex as references in a given direction - /// - /// # Arguments - /// - /// - `v` - The vertex to get the neighbours for - /// - `d` - The direction of the edges - /// - /// # Returns - /// - /// An iterator over all neighbours in that vertex direction as references - fn neighbours( - &self, - v: LocalVertexRef, - d: Direction, - layer: Option, - ) -> Box + Send> { - self.graph - .neighbours_window(v, self.t_start, self.t_end, d, layer) - } - - /// Get the neighbours of a vertex as references in a given direction across a window - /// - /// # Arguments - /// - /// - `v` - The vertex to get the neighbours for - /// - `t_start` - The inclusive start time of the window. - /// - `t_end` - The exclusive end time of the window. 
- /// - `d` - The direction of the edges - /// - /// # Returns - /// - /// An iterator over all neighbours in that vertex direction as references - fn neighbours_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - d: Direction, - layer: Option, - ) -> Box + Send> { - self.graph.neighbours_window( - v, - self.actual_start(t_start), - self.actual_end(t_end), - d, - layer, - ) - } - - /// Get the static property of a vertex - /// - /// # Arguments - /// - /// - `v` - The vertex to get the property for - /// - `name` - The name of the property - /// - /// # Returns - /// - /// A result of an option of a property - fn static_vertex_prop(&self, v: LocalVertexRef, name: String) -> Option { - self.graph.static_vertex_prop(v, name) - } - - /// Get all static property names of a vertex - /// - /// # Arguments - /// - /// - `v` - The vertex to get the property for - /// - /// # Returns - /// - /// a Vector of Strings representing all the property names - fn static_vertex_prop_names(&self, v: LocalVertexRef) -> Vec { - self.graph.static_vertex_prop_names(v) - } - - /// Get all temporal property names of a vertex - /// - /// # Arguments - /// - /// - `v` - The vertex to get the property for - /// - /// # Returns - /// - /// a Vector of Strings representing all the property names - fn temporal_vertex_prop_names(&self, v: LocalVertexRef) -> Vec { - self.graph.temporal_vertex_prop_names(v) - } - - /// Get the temporal property of a vertex - /// - /// # Arguments - /// - /// - `v` - The vertex to get the property for - /// - `name` - The name of the property - /// - /// # Returns - /// - /// A result of an vector of a tuple of a timestamp and a property - fn temporal_vertex_prop_vec(&self, v: LocalVertexRef, name: String) -> Vec<(i64, Prop)> { - self.graph - .temporal_vertex_prop_vec_window(v, name, self.t_start, self.t_end) - } - - /// Get the temporal property of a vertex in a window - /// - /// # Arguments - /// - /// - `v` - The vertex to get the property for 
- /// - `name` - The name of the property - /// - `t_start` - The inclusive start time of the window. - /// - `t_end` - The exclusive end time of the window. - /// - /// # Returns - /// - /// A result of an vector of a tuple of a timestamp and a property - /// - /// # Errors - /// - /// - `GraphError` - Raised if vertex or property does not exist - fn temporal_vertex_prop_vec_window( - &self, - v: LocalVertexRef, - name: String, - t_start: i64, - t_end: i64, - ) -> Vec<(i64, Prop)> { - self.graph.temporal_vertex_prop_vec_window( - v, - name, - self.actual_start(t_start), - self.actual_end(t_end), - ) - } - - /// Get the timestamps of a vertex - /// - /// # Arguments - /// - /// - `v` - The vertex to get the timestamps for - /// - /// # Returns - /// - /// A result of a vector of timestamps - /// - /// # Errors - /// - /// - `GraphError` - Raised if vertex does not exist - fn vertex_timestamps(&self, v: LocalVertexRef) -> Vec { - self.graph - .vertex_timestamps_window(v, self.t_start, self.t_end) - } - - /// Get the timestamps of a vertex in a window - /// - /// # Arguments - /// - /// - `v` - The vertex to get the timestamps for - /// - `t_start` - The start of the window - /// - `t_end` - The end of the window - /// - /// # Returns - /// - /// A result of a vector of timestamps - /// - /// # Errors - /// - /// - `GraphError` - Raised if vertex does not exist - - fn vertex_timestamps_window(&self, v: LocalVertexRef, t_start: i64, t_end: i64) -> Vec { - self.graph - .vertex_timestamps_window(v, self.actual_start(t_start), self.actual_end(t_end)) - } - - /// Get the timestamps of an edge in a window - /// - /// # Arguments - /// - /// - `e` - The edge to get the timestamps for - /// - `window` - The window to get the timestamps for - /// - /// # Returns - /// - /// A result of a vector of timestamps - /// - /// # Errors - /// - /// - `GraphError` - Raised if edge does not exist - - fn edge_timestamps(&self, e: EdgeRef, window: Option>) -> Vec { - let window = match 
window { - Some(Range { start, end, .. }) => self.actual_start(start)..self.actual_end(end), - None => self.t_start..self.t_end, - }; - self.graph.edge_timestamps(e, Some(window)) - } - - /// Get all temporal properties of a vertex - /// - /// # Arguments - /// - /// - `v` - The vertex to get the property for - /// - /// # Returns - /// - /// A result of an vector of a tuple of a timestamp and a property - /// - /// # Errors - /// - /// - `GraphError` - Raised if vertex or property does not exist - fn temporal_vertex_props(&self, v: LocalVertexRef) -> HashMap> { - self.graph - .temporal_vertex_props_window(v, self.t_start, self.t_end) - } - - /// Get all temporal properties of a vertex in a window - /// - /// # Arguments - /// - /// - `v` - The vertex to get the property for - /// - `t_start` - The inclusive start time of the window. - /// - `t_end` - The exclusive end time of the window. - /// - /// # Returns - /// - /// A result of an hashmap of a tuple of a string being names and - /// vectors of timestamp and the property value - /// - /// # Errors - /// - /// - `GraphError` - Raised if vertex or property does not exist - fn temporal_vertex_props_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - ) -> HashMap> { - self.graph.temporal_vertex_props_window( - v, - self.actual_start(t_start), - self.actual_end(t_end), - ) - } - - /// Get the static property of an edge - /// - /// # Arguments - /// - /// - `e` - The edge to get the property for - /// - `name` - The name of the property - /// - /// # Returns - /// - /// A result of an option of a property or a graph error - /// - /// # Errors - /// - /// - `GraphError` - Raised if edge or property does not exist - fn static_edge_prop(&self, e: EdgeRef, name: String) -> Option { - self.graph.static_edge_prop(e, name) - } - - /// Get the names of all static properties of an edge - /// - /// # Arguments - /// - /// - `e` - The edge to get the property for - /// - /// # Returns - /// - /// A result of 
an vector of all property names - fn static_edge_prop_names(&self, e: EdgeRef) -> Vec { - self.graph.static_edge_prop_names(e) - } - - /// Get the names of all temporal properties of an edge - /// - /// # Arguments - /// - /// - `e` - The edge to get the property for - /// - /// # Returns - /// - /// A result of an vector of all property names - fn temporal_edge_prop_names(&self, e: EdgeRef) -> Vec { - self.graph.temporal_edge_prop_names(e) - } - - /// Get the temporal property of an edge - /// - /// # Arguments - /// - /// - `e` - The edge to get the property for - /// - `name` - The name of the property - /// - /// # Returns - /// - /// A result of an option of a property or a graph error - /// - /// # Errors - /// - /// - `GraphError` - Raised if edge or property does not exist - fn temporal_edge_props_vec(&self, e: EdgeRef, name: String) -> Vec<(i64, Prop)> { - self.graph - .temporal_edge_props_vec_window(e, name, self.t_start, self.t_end) - } - - /// Get the temporal property of an edge in a window - /// - /// # Arguments - /// - /// - `e` - The edge to get the property for - /// - `name` - The name of the property - /// - `t_start` - The inclusive start time of the window. - /// - `t_end` - The exclusive end time of the window. 
- /// - /// # Returns - /// - /// A result of an vector of a timestamp and property or a graph error - /// - /// # Errors - /// - /// - `GraphError` - Returned if edge or property does not exist - fn temporal_edge_props_vec_window( - &self, - e: EdgeRef, - name: String, - t_start: i64, - t_end: i64, - ) -> Vec<(i64, Prop)> { - self.graph.temporal_edge_props_vec_window( - e, - name, - self.actual_start(t_start), - self.actual_end(t_end), - ) - } - - /// Get all temporal properties of an edge - /// - /// # Arguments - /// - /// - `e` - The edge to get the property for - /// - /// # Returns - /// - /// A hashmap containing the name of a property as a key - /// and the vector of a timestamp and property value - fn temporal_edge_props(&self, e: EdgeRef) -> HashMap> { - self.graph - .temporal_edge_props_window(e, self.t_start, self.t_end) - } - - /// Get all temporal properties of an edge in a window - /// - /// # Arguments - /// - /// - `e` - The edge to get the property for - /// - `t_start` - The inclusive start time of the window. - /// - `t_end` - The exclusive end time of the window. 
- /// - /// # Returns - /// - /// A hashmap containing the name of a property as a key - /// and the vector of a timestamp and property value - fn temporal_edge_props_window( - &self, - e: EdgeRef, - t_start: i64, - t_end: i64, - ) -> HashMap> { - self.graph - .temporal_edge_props_window(e, self.actual_start(t_start), self.actual_end(t_end)) - } - - fn num_shards(&self) -> usize { - self.graph.num_shards() - } - - fn vertex_edges( - &self, - v: LocalVertexRef, - d: Direction, - layer: Option, - ) -> Box + Send> { - self.graph - .vertex_edges_window(v, self.t_start, self.t_end, d, layer) - } - - fn vertex_id(&self, v: LocalVertexRef) -> u64 { - self.graph.vertex_id(v) - } - - fn local_vertex(&self, v: VertexRef) -> Option { - self.graph.local_vertex_window(v, self.t_start, self.t_end) - } - - fn local_vertex_window( - &self, - v: VertexRef, - t_start: i64, - t_end: i64, - ) -> Option { - self.graph - .local_vertex_window(v, self.actual_start(t_start), self.actual_end(t_end)) - } -} - -/// A windowed graph is a graph that only allows access to vertices and edges within a time window. -/// -/// This struct is used to represent a graph with a time window. It is constructed -/// by providing a `Graph` object and a time range that defines the window. -/// -/// # Examples -/// -/// ```rust -/// use raphtory::db::graph::Graph; -/// use raphtory::db::view_api::*; -/// -/// let graph = Graph::new(1); -/// graph.add_edge(0, 1, 2, &vec![], None); -/// graph.add_edge(1, 2, 3, &vec![], None); -/// let windowed_graph = graph.window(0, 1); -/// ``` -impl WindowedGraph { - /// Create a new windowed graph - /// - /// # Arguments - /// - /// - `graph` - The graph to create the windowed graph from - /// - `t_start` - The inclusive start time of the window. - /// - `t_end` - The exclusive end time of the window. 
- /// - /// # Returns - /// - /// A new windowed graph - pub fn new(graph: G, t_start: T, t_end: T) -> Self { - WindowedGraph { - graph, - t_start: t_start.into_time(), - t_end: t_end.into_time(), - } - } - - /// the larger of `t_start` and `self.start()` (useful for creating nested windows) - fn actual_start(&self, t_start: i64) -> i64 { - max(t_start, self.t_start) - } - - /// the smaller of `t_end` and `self.end()` (useful for creating nested windows) - fn actual_end(&self, t_end: i64) -> i64 { - min(t_end, self.t_end) - } -} - -#[cfg(test)] -mod views_test { - - use super::*; - use crate::core::Prop; - use crate::db::graph::Graph; - use crate::db::view_api::edge::EdgeViewOps; - use crate::db::view_api::*; - use itertools::Itertools; - use quickcheck::TestResult; - use rand::prelude::*; - use rayon::prelude::*; - - #[test] - fn windowed_graph_vertices_degree() { - let vs = vec![ - (1, 1, 2), - (2, 1, 3), - (-1, 2, 1), - (0, 1, 1), - (7, 3, 2), - (1, 1, 1), - ]; - - let g = Graph::new(2); - - for (t, src, dst) in &vs { - g.add_edge(*t, *src, *dst, &vec![], None).unwrap(); - } - - let wg = WindowedGraph::new(g, -1, 1); - - let actual = wg - .vertices() - .iter() - .map(|v| (v.id(), v.degree())) - .collect::>(); - - let expected = vec![(2, 1), (1, 2)]; - - assert_eq!(actual, expected); - } - - #[test] - fn windowed_graph_edge() { - let vs = vec![ - (1, 1, 2), - (2, 1, 3), - (-1, 2, 1), - (0, 1, 1), - (7, 3, 2), - (1, 1, 1), - ]; - - let g = Graph::new(2); - - for (t, src, dst) in vs { - g.add_edge(t, src, dst, &vec![], None).unwrap(); - } - - let wg = g.window(i64::MIN, i64::MAX); - assert_eq!(wg.edge(1, 3, None).unwrap().src().id(), 1); - assert_eq!(wg.edge(1, 3, None).unwrap().dst().id(), 3); - } - - #[test] - fn windowed_graph_vertex_edges() { - let vs = vec![ - (1, 1, 2), - (2, 1, 3), - (-1, 2, 1), - (0, 1, 1), - (7, 3, 2), - (1, 1, 1), - ]; - - let g = Graph::new(2); - - for (t, src, dst) in &vs { - g.add_edge(*t, *src, *dst, &vec![], None).unwrap(); - } - - 
let wg = WindowedGraph::new(g, -1, 1); - - assert_eq!(wg.vertex(1).unwrap().id(), 1); - } - - #[test] - fn graph_has_vertex_check_fail() { - let vs: Vec<(i64, u64)> = vec![ - (1, 0), - (-100, 262), - // (327226439, 108748364996394682), - (1, 9135428456135679950), - // (0, 1), - // (2, 2), - ]; - let g = Graph::new(2); - - for (t, v) in &vs { - g.add_vertex(*t, *v, &vec![]) - .map_err(|err| println!("{:?}", err)) - .ok(); - } - - let wg = WindowedGraph::new(g, 1, 2); - assert!(!wg.has_vertex(262)) - } - - #[quickcheck] - fn windowed_graph_has_vertex(mut vs: Vec<(i64, u64)>) -> TestResult { - if vs.is_empty() { - return TestResult::discard(); - } - - vs.sort_by_key(|v| v.1); // Sorted by vertex - vs.dedup_by_key(|v| v.1); // Have each vertex only once to avoid headaches - vs.sort_by_key(|v| v.0); // Sorted by time - - let rand_start_index = thread_rng().gen_range(0..vs.len()); - let rand_end_index = thread_rng().gen_range(rand_start_index..vs.len()); - - let g = Graph::new(2); - - for (t, v) in &vs { - g.add_vertex(*t, *v, &vec![]) - .map_err(|err| println!("{:?}", err)) - .ok(); - } - - let start = vs.get(rand_start_index).expect("start index in range").0; - let end = vs.get(rand_end_index).expect("end index in range").0; - - let wg = WindowedGraph::new(g, start, end); - - let rand_test_index: usize = thread_rng().gen_range(0..vs.len()); - - let (i, v) = vs.get(rand_test_index).expect("test index in range"); - if (start..end).contains(i) { - if wg.has_vertex(*v) { - TestResult::passed() - } else { - TestResult::error(format!( - "Vertex {:?} was not in window {:?}", - (i, v), - start..end - )) - } - } else if !wg.has_vertex(*v) { - TestResult::passed() - } else { - TestResult::error(format!( - "Vertex {:?} was in window {:?}", - (i, v), - start..end - )) - } - } - - #[quickcheck] - fn windowed_graph_has_edge(mut edges: Vec<(i64, (u64, u64))>) -> TestResult { - if edges.is_empty() { - return TestResult::discard(); - } - - edges.sort_by_key(|e| e.1); // Sorted by edge 
- edges.dedup_by_key(|e| e.1); // Have each edge only once to avoid headaches - edges.sort_by_key(|e| e.0); // Sorted by time - - let rand_start_index = thread_rng().gen_range(0..edges.len()); - let rand_end_index = thread_rng().gen_range(rand_start_index..edges.len()); - - let g = Graph::new(2); - - for (t, e) in &edges { - g.add_edge(*t, e.0, e.1, &vec![], None).unwrap(); - } - - let start = edges.get(rand_start_index).expect("start index in range").0; - let end = edges.get(rand_end_index).expect("end index in range").0; - - let wg = WindowedGraph::new(g, start, end); - - let rand_test_index: usize = thread_rng().gen_range(0..edges.len()); - - let (i, e) = edges.get(rand_test_index).expect("test index in range"); - if (start..end).contains(i) { - if wg.has_edge(e.0, e.1, None) { - TestResult::passed() - } else { - TestResult::error(format!( - "Edge {:?} was not in window {:?}", - (i, e), - start..end - )) - } - } else if !wg.has_edge(e.0, e.1, None) { - TestResult::passed() - } else { - TestResult::error(format!("Edge {:?} was in window {:?}", (i, e), start..end)) - } - } - - #[quickcheck] - fn windowed_graph_edge_count(mut edges: Vec<(i64, (u64, u64))>) -> TestResult { - edges.sort_by_key(|e| e.1); // Sorted by edge - edges.dedup_by_key(|e| e.1); // Have each edge only once to avoid headaches - - let mut window: [i64; 2] = thread_rng().gen(); - window.sort(); - let window = window[0]..window[1]; - let true_edge_count = edges.iter().filter(|e| window.contains(&e.0)).count(); - - let g = Graph::new(2); - - for (t, e) in &edges { - g.add_edge( - *t, - e.0, - e.1, - &vec![("test".to_owned(), Prop::Bool(true))], - None, - ) - .unwrap(); - } - - let wg = WindowedGraph::new(g, window.start, window.end); - if wg.num_edges() != true_edge_count { - println!( - "failed, g.num_edges() = {}, true count = {}", - wg.num_edges(), - true_edge_count - ); - println!("g.edges() = {:?}", wg.edges().collect_vec()); - } - TestResult::from_bool(wg.num_edges() == true_edge_count) - } - 
- #[quickcheck] - fn trivial_window_has_all_edges(edges: Vec<(i64, u64, u64)>) -> bool { - let g = Graph::new(10); - edges - .into_par_iter() - .filter(|e| e.0 < i64::MAX) - .for_each(|(t, src, dst)| { - g.add_edge( - t, - src, - dst, - &vec![("test".to_owned(), Prop::Bool(true))], - None, - ) - .unwrap() - }); - let w = g.window(i64::MIN, i64::MAX); - g.edges() - .all(|e| w.has_edge(e.src().id(), e.dst().id(), None)) - } - - #[quickcheck] - fn large_vertex_in_window(dsts: Vec) -> bool { - let dsts: Vec = dsts.into_iter().unique().collect(); - let n = dsts.len(); - let g = Graph::new(1); - - for dst in dsts { - let t = 1; - g.add_edge(t, 0, dst, &vec![], None).unwrap(); - } - let w = g.window(i64::MIN, i64::MAX); - w.num_edges() == n - } - - #[test] - fn windowed_graph_vertex_ids() { - let vs = vec![(1, 1, 2), (3, 3, 4), (5, 5, 6), (7, 7, 1)]; - - let args = vec![(i64::MIN, 8), (i64::MIN, 2), (i64::MIN, 4), (3, 6)]; - - let expected = vec![ - vec![1, 2, 3, 4, 5, 6, 7], - vec![1, 2], - vec![1, 2, 3, 4], - vec![3, 4, 5, 6], - ]; - - let g = Graph::new(1); - - for (t, src, dst) in &vs { - g.add_edge(*t, *src, *dst, &vec![], None).unwrap(); - } - - let res: Vec<_> = (0..=3) - .map(|i| { - let wg = g.window(args[i].0, args[i].1); - let mut e = wg.vertices().id().collect::>(); - e.sort(); - e - }) - .collect_vec(); - - assert_eq!(res, expected); - - let g = Graph::new(3); - for (src, dst, t) in &vs { - g.add_edge(*src, *dst, *t, &vec![], None).unwrap(); - } - let res: Vec<_> = (0..=3) - .map(|i| { - let wg = g.window(args[i].0, args[i].1); - let mut e = wg.vertices().id().collect::>(); - e.sort(); - e - }) - .collect_vec(); - assert_eq!(res, expected); - } - - #[test] - fn windowed_graph_vertices() { - let vs = vec![ - (1, 1, 2), - (2, 1, 3), - (-1, 2, 1), - (0, 1, 1), - (7, 3, 2), - (1, 1, 1), - ]; - - let g = Graph::new(1); - - g.add_vertex( - 0, - 1, - &vec![ - ("type".into(), Prop::Str("wallet".into())), - ("cost".into(), Prop::F32(99.5)), - ], - ) - .map_err(|err| 
println!("{:?}", err)) - .ok(); - - g.add_vertex( - -1, - 2, - &vec![ - ("type".into(), Prop::Str("wallet".into())), - ("cost".into(), Prop::F32(10.0)), - ], - ) - .map_err(|err| println!("{:?}", err)) - .ok(); - - g.add_vertex( - 6, - 3, - &vec![ - ("type".into(), Prop::Str("wallet".into())), - ("cost".into(), Prop::F32(76.2)), - ], - ) - .map_err(|err| println!("{:?}", err)) - .ok(); - - for (t, src, dst) in &vs { - g.add_edge( - *t, - *src, - *dst, - &vec![("eprop".into(), Prop::Str("commons".into()))], - None, - ) - .unwrap(); - } - - let wg = g.window(-2, 0); - - let actual = wg.vertices().id().collect::>(); - - let expected = vec![1, 2]; - - assert_eq!(actual, expected); - - // Check results from multiple graphs with different number of shards - let g = Graph::new(10); - - g.add_vertex( - 0, - 1, - &vec![ - ("type".into(), Prop::Str("wallet".into())), - ("cost".into(), Prop::F32(99.5)), - ], - ) - .map_err(|err| println!("{:?}", err)) - .ok(); - - g.add_vertex( - -1, - 2, - &vec![ - ("type".into(), Prop::Str("wallet".into())), - ("cost".into(), Prop::F32(10.0)), - ], - ) - .map_err(|err| println!("{:?}", err)) - .ok(); - - g.add_vertex( - 6, - 3, - &vec![ - ("type".into(), Prop::Str("wallet".into())), - ("cost".into(), Prop::F32(76.2)), - ], - ) - .map_err(|err| println!("{:?}", err)) - .ok(); - - for (t, src, dst) in &vs { - g.add_edge(*t, *src, *dst, &vec![], None).unwrap(); - } - - let expected = wg.vertices().id().collect::>(); - - assert_eq!(actual, expected); - } -} diff --git a/raphtory/src/db/internal/addition.rs b/raphtory/src/db/internal/addition.rs new file mode 100644 index 0000000000..fe117a1f57 --- /dev/null +++ b/raphtory/src/db/internal/addition.rs @@ -0,0 +1,89 @@ +use crate::{ + core::{ + entities::{graph::tgraph::InnerTemporalGraph, EID, VID}, + storage::timeindex::TimeIndexEntry, + utils::errors::GraphError, + PropType, + }, + db::api::mutation::internal::InternalAdditionOps, + prelude::Prop, +}; +use std::sync::atomic::Ordering; + +impl 
InternalAdditionOps for InnerTemporalGraph { + #[inline] + fn next_event_id(&self) -> usize { + self.inner().event_counter.fetch_add(1, Ordering::Relaxed) + } + + #[inline] + fn resolve_layer(&self, layer: Option<&str>) -> usize { + layer + .map(|name| self.inner().edge_meta.get_or_create_layer_id(name)) + .unwrap_or(0) + } + + #[inline] + fn resolve_vertex(&self, id: u64, name: Option<&str>) -> VID { + self.inner().resolve_vertex(id, name) + } + + #[inline] + fn resolve_graph_property(&self, prop: &str, is_static: bool) -> usize { + self.inner().graph_props.resolve_property(prop, is_static) + } + + #[inline] + fn resolve_vertex_property( + &self, + prop: &str, + dtype: PropType, + is_static: bool, + ) -> Result { + self.inner() + .vertex_meta + .resolve_prop_id(prop, dtype, is_static) + } + + #[inline] + fn resolve_edge_property( + &self, + prop: &str, + dtype: PropType, + is_static: bool, + ) -> Result { + self.inner() + .edge_meta + .resolve_prop_id(prop, dtype, is_static) + } + + #[inline] + fn process_prop_value(&self, prop: Prop) -> Prop { + match prop { + Prop::Str(value) => Prop::Str(self.inner().resolve_str(value)), + _ => prop, + } + } + + #[inline] + fn internal_add_vertex( + &self, + t: TimeIndexEntry, + v: VID, + props: Vec<(usize, Prop)>, + ) -> Result<(), GraphError> { + self.inner().add_vertex_internal(t, v, props) + } + + #[inline] + fn internal_add_edge( + &self, + t: TimeIndexEntry, + src: VID, + dst: VID, + props: Vec<(usize, Prop)>, + layer: usize, + ) -> Result { + self.inner().add_edge_internal(t, src, dst, props, layer) + } +} diff --git a/raphtory/src/db/internal/core_ops.rs b/raphtory/src/db/internal/core_ops.rs new file mode 100644 index 0000000000..aa8ed11d7c --- /dev/null +++ b/raphtory/src/db/internal/core_ops.rs @@ -0,0 +1,332 @@ +use crate::{ + core::{ + entities::{ + edges::{edge_ref::EdgeRef, edge_store::EdgeStore}, + graph::tgraph::InnerTemporalGraph, + properties::{ + graph_props::GraphProps, + props::Meta, + 
tprop::{LockedLayeredTProp, TProp}, + }, + vertices::{vertex_ref::VertexRef, vertex_store::VertexStore}, + LayerIds, EID, VID, + }, + storage::{ + locked_view::LockedView, + timeindex::{LockedLayeredIndex, TimeIndex, TimeIndexEntry}, + ArcEntry, + }, + ArcStr, + }, + db::api::view::{internal::CoreGraphOps, BoxedIter}, + prelude::Prop, +}; +use itertools::Itertools; +use std::{collections::HashMap, iter}; + +impl CoreGraphOps for InnerTemporalGraph { + #[inline] + fn unfiltered_num_vertices(&self) -> usize { + self.inner().internal_num_vertices() + } + + #[inline] + fn vertex_meta(&self) -> &Meta { + &self.inner().vertex_meta + } + + #[inline] + fn edge_meta(&self) -> &Meta { + &self.inner().edge_meta + } + + #[inline] + fn graph_meta(&self) -> &GraphProps { + &self.inner().graph_props + } + + #[inline] + fn get_layer_name(&self, layer_id: usize) -> ArcStr { + self.inner().edge_meta.layer_meta().get_name(layer_id) + } + + #[inline] + fn get_layer_id(&self, name: &str) -> Option { + self.inner().edge_meta.get_layer_id(name) + } + + #[inline] + fn get_layer_names_from_ids(&self, layer_ids: LayerIds) -> BoxedIter { + self.inner().layer_names(layer_ids) + } + + #[inline] + fn vertex_id(&self, v: VID) -> u64 { + self.inner().global_vertex_id(v) + } + + #[inline] + fn vertex_name(&self, v: VID) -> String { + self.inner().vertex_name(v) + } + + #[inline] + fn edge_additions( + &self, + eref: EdgeRef, + layer_ids: LayerIds, + ) -> LockedLayeredIndex<'_, TimeIndexEntry> { + let layer_ids = layer_ids.constrain_from_edge(eref); + let edge = self.inner().edge(eref.pid()); + edge.additions(layer_ids).unwrap() + } + + #[inline] + fn vertex_additions(&self, v: VID) -> LockedView> { + let vertex = self.inner().vertex(v); + vertex.additions().unwrap() + } + + #[inline] + fn internalise_vertex(&self, v: VertexRef) -> Option { + self.inner().resolve_vertex_ref(v) + } + + #[inline] + fn internalise_vertex_unchecked(&self, v: VertexRef) -> VID { + match v { + VertexRef::Internal(l) => 
l, + VertexRef::External(_) => self.inner().resolve_vertex_ref(v).unwrap(), + } + } + + #[inline] + fn constant_prop(&self, id: usize) -> Option { + self.inner().get_constant_prop(id) + } + + #[inline] + fn temporal_prop(&self, id: usize) -> Option> { + self.inner().get_temporal_prop(id) + } + + #[inline] + fn constant_vertex_prop(&self, v: VID, prop_id: usize) -> Option { + let entry = self.inner().node_entry(v); + entry.const_prop(prop_id).cloned() + } + + #[inline] + fn constant_vertex_prop_ids(&self, v: VID) -> Box + '_> { + // FIXME: revisit the locking scheme so we don't have to collect the ids + Box::new( + self.inner() + .node_entry(v) + .const_prop_ids() + .collect_vec() + .into_iter(), + ) + } + + #[inline] + fn temporal_vertex_prop(&self, v: VID, prop_id: usize) -> Option> { + let vertex = self.inner().vertex(v); + vertex.temporal_property(prop_id) + } + + #[inline] + fn temporal_vertex_prop_ids(&self, v: VID) -> Box + '_> { + // FIXME: revisit the locking scheme so we don't have to collect the ids + Box::new( + self.inner() + .node_entry(v) + .temporal_prop_ids() + .collect_vec() + .into_iter(), + ) + } + + fn get_const_edge_prop(&self, e: EdgeRef, prop_id: usize, layer_ids: LayerIds) -> Option { + let layer_ids = layer_ids.constrain_from_edge(e); + let entry = self.inner().edge_entry(e.pid()); + match layer_ids { + LayerIds::None => None, + LayerIds::All => { + if self.inner().num_layers() == 1 { + // iterator has at most 1 element + entry + .layer_iter() + .next() + .and_then(|layer| layer.const_prop(prop_id).cloned()) + } else { + let prop_map: HashMap<_, _> = entry + .layer_iter() + .enumerate() + .flat_map(|(id, layer)| { + layer + .const_prop(prop_id) + .map(|p| (self.inner().get_layer_name(id), p.clone())) + }) + .collect(); + if prop_map.is_empty() { + None + } else { + Some(prop_map.into()) + } + } + } + LayerIds::One(id) => entry.layer(id).and_then(|l| l.const_prop(prop_id).cloned()), + LayerIds::Multiple(ids) => { + let prop_map: HashMap<_, 
_> = ids + .iter() + .flat_map(|&id| { + entry.layer(id).and_then(|layer| { + layer + .const_prop(prop_id) + .map(|p| (self.inner().get_layer_name(id), p.clone())) + }) + }) + .collect(); + if prop_map.is_empty() { + None + } else { + Some(prop_map.into()) + } + } + } + } + + fn const_edge_prop_ids( + &self, + e: EdgeRef, + layer_ids: LayerIds, + ) -> Box + '_> { + // FIXME: revisit the locking scheme so we don't have to collect all the ids + let layer_ids = layer_ids.constrain_from_edge(e); + let entry = self.inner().edge_entry(e.pid()); + let ids: Vec<_> = match layer_ids { + LayerIds::None => vec![], + LayerIds::All => entry + .layer_iter() + .map(|l| l.const_prop_ids()) + .kmerge() + .dedup() + .collect(), + LayerIds::One(id) => match entry.layer(id) { + Some(l) => l.const_prop_ids().collect(), + None => vec![], + }, + LayerIds::Multiple(ids) => ids + .iter() + .flat_map(|id| entry.layer(*id).map(|l| l.const_prop_ids())) + .kmerge() + .dedup() + .collect(), + }; + Box::new(ids.into_iter()) + } + + #[inline] + fn temporal_edge_prop( + &self, + e: EdgeRef, + prop_id: usize, + layer_ids: LayerIds, + ) -> Option { + let layer_ids = layer_ids.constrain_from_edge(e); + let edge = self.inner().edge(e.pid()); + edge.temporal_property(layer_ids, prop_id) + } + + fn temporal_edge_prop_ids( + &self, + e: EdgeRef, + layer_ids: LayerIds, + ) -> Box + '_> { + // FIXME: revisit the locking scheme so we don't have to collect the ids + let entry = self.inner().edge_entry(e.pid()); + match layer_ids { + LayerIds::None => Box::new(iter::empty()), + LayerIds::All => Box::new(entry.temp_prop_ids(None).collect_vec().into_iter()), + LayerIds::One(id) => Box::new(entry.temp_prop_ids(Some(id)).collect_vec().into_iter()), + LayerIds::Multiple(ids) => Box::new( + ids.iter() + .map(|id| entry.temp_prop_ids(Some(*id))) + .kmerge() + .dedup() + .collect_vec() + .into_iter(), + ), + } + } + + #[inline] + fn core_edges(&self) -> Box>> { + 
Box::new(self.inner().storage.edges.read_lock().into_iter()) + } + + #[inline] + fn core_edge(&self, eid: EID) -> ArcEntry { + self.inner().storage.edges.entry_arc(eid.into()) + } + + #[inline] + fn core_vertices(&self) -> Box>> { + Box::new(self.inner().storage.nodes.read_lock().into_iter()) + } + + #[inline] + fn core_vertex(&self, vid: VID) -> ArcEntry { + self.inner().storage.nodes.entry_arc(vid.into()) + } +} + +#[cfg(test)] +mod test_edges { + use crate::{ + core::{ArcStr, IntoPropMap}, + prelude::*, + }; + use std::collections::HashMap; + + #[test] + fn test_edge_properties_for_layers() { + let g = Graph::new(); + + g.add_edge(0, 1, 2, [("t", 0)], Some("layer1")) + .unwrap() + .add_constant_properties( + [("layer1", "1".into_prop()), ("layer", 1.into_prop())], + Some("layer1"), + ) + .unwrap(); + g.add_edge(1, 1, 2, [("t", 1)], Some("layer2")) + .unwrap() + .add_constant_properties([("layer", 2)], Some("layer2")) + .unwrap(); + + g.add_edge(2, 1, 2, [("t2", 2)], Some("layer3")) + .unwrap() + .add_constant_properties([("layer", 3)], Some("layer3")) + .unwrap(); + + let e_all = g.edge(1, 2).unwrap(); + assert_eq!( + e_all.properties().constant().as_map(), + HashMap::from([ + ( + ArcStr::from("layer"), + [("layer1", 1), ("layer2", 2), ("layer3", 3)].into_prop_map() + ), + (ArcStr::from("layer1"), [("layer1", "1")].into_prop_map()) + ]) + ); + assert_eq!( + e_all.properties().temporal().get("t").unwrap().values(), + vec![0.into(), 1.into()] + ); + + let e = g.edge(1, 2).unwrap().layer("layer1").unwrap(); + assert!(e.properties().constant().contains("layer1")); + } +} diff --git a/raphtory/src/db/internal/deletion.rs b/raphtory/src/db/internal/deletion.rs new file mode 100644 index 0000000000..c4505fb87f --- /dev/null +++ b/raphtory/src/db/internal/deletion.rs @@ -0,0 +1,31 @@ +use crate::{ + core::{ + entities::{edges::edge_ref::EdgeRef, graph::tgraph::InnerTemporalGraph, LayerIds, VID}, + storage::timeindex::{LockedLayeredIndex, TimeIndexEntry}, + 
utils::errors::GraphError, + }, + db::api::{mutation::internal::InternalDeletionOps, view::internal::CoreDeletionOps}, +}; + +impl InternalDeletionOps for InnerTemporalGraph { + fn internal_delete_edge( + &self, + t: TimeIndexEntry, + src: VID, + dst: VID, + layer: usize, + ) -> Result<(), GraphError> { + self.inner().delete_edge(t, src, dst, layer) + } +} + +impl CoreDeletionOps for InnerTemporalGraph { + fn edge_deletions( + &self, + eref: EdgeRef, + layer_ids: LayerIds, + ) -> LockedLayeredIndex<'_, TimeIndexEntry> { + let edge = self.inner().edge(eref.pid()); + edge.deletions(layer_ids).unwrap() + } +} diff --git a/raphtory/src/db/internal/edge_filter_ops.rs b/raphtory/src/db/internal/edge_filter_ops.rs new file mode 100644 index 0000000000..1991d3b0e0 --- /dev/null +++ b/raphtory/src/db/internal/edge_filter_ops.rs @@ -0,0 +1,11 @@ +use crate::db::{ + api::view::internal::{EdgeFilter, EdgeFilterOps}, + graph::graph::InternalGraph, +}; + +impl EdgeFilterOps for InternalGraph { + #[inline] + fn edge_filter(&self) -> Option<&EdgeFilter> { + None + } +} diff --git a/raphtory/src/db/internal/graph_ops.rs b/raphtory/src/db/internal/graph_ops.rs new file mode 100644 index 0000000000..ec74cdd453 --- /dev/null +++ b/raphtory/src/db/internal/graph_ops.rs @@ -0,0 +1,249 @@ +use crate::{ + core::{ + entities::{ + edges::edge_ref::{Dir, EdgeRef}, + graph::tgraph::InnerTemporalGraph, + vertices::vertex_ref::VertexRef, + LayerIds, EID, VID, + }, + Direction, + }, + db::api::view::internal::{EdgeFilter, GraphOps}, +}; +use itertools::Itertools; +use std::iter; + +impl GraphOps for InnerTemporalGraph { + fn internal_vertex_ref( + &self, + v: VertexRef, + _layer_ids: &LayerIds, + _filter: Option<&EdgeFilter>, + ) -> Option { + match v { + VertexRef::Internal(l) => Some(l), + VertexRef::External(_) => { + let vid = self.inner().resolve_vertex_ref(v)?; + Some(vid) + } + } + } + + fn find_edge_id( + &self, + e_id: EID, + layer_ids: &LayerIds, + filter: Option<&EdgeFilter>, + ) -> 
Option { + let e_id_usize: usize = e_id.into(); + if e_id_usize >= self.inner().storage.edges.len() { + return None; + } + let e = self.inner().storage.edges.get(e_id_usize); + filter + .map(|f| f(&e, layer_ids)) + .unwrap_or(true) + .then(|| EdgeRef::new_outgoing(e_id, e.src(), e.dst())) + } + + fn vertices_len(&self, _layer_ids: LayerIds, _filter: Option<&EdgeFilter>) -> usize { + self.inner().internal_num_vertices() + } + + fn edges_len(&self, layers: LayerIds, filter: Option<&EdgeFilter>) -> usize { + self.inner().num_edges(&layers, filter) + } + + #[inline] + fn degree( + &self, + v: VID, + d: Direction, + layers: &LayerIds, + filter: Option<&EdgeFilter>, + ) -> usize { + self.inner().degree(v, d, layers, filter) + } + + fn vertex_refs( + &self, + _layers: LayerIds, + _filter: Option<&EdgeFilter>, + ) -> Box + Send> { + Box::new(self.inner().vertex_ids()) + } + + fn edge_ref( + &self, + src: VID, + dst: VID, + layer: &LayerIds, + filter: Option<&EdgeFilter>, + ) -> Option { + self.inner() + .find_edge(src, dst, layer) + .filter(|eid| { + filter + .map(|f| f(&self.inner().storage.edges.get((*eid).into()), layer)) + .unwrap_or(true) + }) + .map(|e_id| EdgeRef::new_outgoing(e_id, src, dst)) + } + + fn edge_refs( + &self, + layers: LayerIds, + filter: Option<&EdgeFilter>, + ) -> Box + Send> { + let filter = filter.cloned(); + match layers { + LayerIds::None => Box::new(iter::empty()), + LayerIds::All => { + let iter = self + .inner() + .storage + .edges + .read_lock() + .into_iter() + .filter(move |e| filter.as_ref().map(|f| f(e, &layers)).unwrap_or(true)) + .map_into(); + Box::new(iter) + } + _ => Box::new( + self.inner() + .storage + .edges + .read_lock() + .into_iter() + .filter(move |edge| { + filter + .as_ref() + .map(|f| f(edge, &layers)) + .unwrap_or_else(|| edge.has_layer(&layers)) + }) + .map(|edge| edge.into()), + ), + } + } + + fn vertex_edges( + &self, + v: VID, + d: Direction, + layers: LayerIds, + filter: Option<&EdgeFilter>, + ) -> Box + Send> { + 
let entry = self.inner().storage.nodes.entry_arc(v.into()); + match d { + Direction::OUT => { + let iter: Box + Send> = + match &layers { + LayerIds::None => Box::new(iter::empty()), + LayerIds::All => Box::new( + entry + .into_layers() + .map(move |layer| { + layer + .into_tuples(Dir::Out) + .map(move |(n, e)| EdgeRef::new_outgoing(e, v, n)) + }) + .kmerge() + .dedup(), + ), + LayerIds::One(layer) => { + Box::new(entry.into_layer(*layer).into_iter().flat_map(move |it| { + it.into_tuples(Dir::Out) + .map(move |(n, e)| EdgeRef::new_outgoing(e, v, n)) + })) + } + LayerIds::Multiple(ids) => Box::new( + ids.iter() + .map(move |&layer| { + entry.clone().into_layer(layer).into_iter().flat_map( + move |it| { + it.into_tuples(Dir::Out) + .map(move |(n, e)| EdgeRef::new_outgoing(e, v, n)) + }, + ) + }) + .kmerge() + .dedup(), + ), + }; + match filter.cloned() { + None => iter, + Some(filter) => { + let edge_store = self.inner().storage.edges.read_lock(); + Box::new(iter.filter(move |eref| { + filter(&edge_store.get(eref.pid().into()), &layers) + })) + } + } + } + Direction::IN => { + let iter: Box + Send> = + match &layers { + LayerIds::None => Box::new(iter::empty()), + LayerIds::All => Box::new( + entry + .into_layers() + .map(move |layer| { + layer + .into_tuples(Dir::Into) + .map(move |(n, e)| EdgeRef::new_incoming(e, n, v)) + }) + .kmerge() + .dedup(), + ), + LayerIds::One(layer) => { + Box::new(entry.into_layer(*layer).into_iter().flat_map(move |it| { + it.into_tuples(Dir::Into) + .map(move |(n, e)| EdgeRef::new_incoming(e, n, v)) + })) + } + LayerIds::Multiple(ids) => Box::new( + ids.iter() + .map(move |&layer| { + entry.clone().into_layer(layer).into_iter().flat_map( + move |it| { + it.into_tuples(Dir::Into) + .map(move |(n, e)| EdgeRef::new_incoming(e, n, v)) + }, + ) + }) + .kmerge() + .dedup(), + ), + }; + match filter.cloned() { + None => iter, + Some(filter) => { + let edge_store = self.inner().storage.edges.read_lock(); + Box::new(iter.filter(move |eref| { + 
filter(&edge_store.get(eref.pid().into()), &layers) + })) + } + } + } + Direction::BOTH => Box::new( + self.vertex_edges(v, Direction::IN, layers.clone(), filter) + .merge(self.vertex_edges(v, Direction::OUT, layers, filter)), + ), + } + } + + fn neighbours( + &self, + v: VID, + d: Direction, + layers: LayerIds, + filter: Option<&EdgeFilter>, + ) -> Box + Send> { + let iter = self.vertex_edges(v, d, layers, filter).map(|e| e.remote()); + if matches!(d, Direction::BOTH) { + Box::new(iter.dedup()) + } else { + Box::new(iter) + } + } +} diff --git a/raphtory/src/db/internal/layer_ops.rs b/raphtory/src/db/internal/layer_ops.rs new file mode 100644 index 0000000000..96b465e256 --- /dev/null +++ b/raphtory/src/db/internal/layer_ops.rs @@ -0,0 +1,19 @@ +use crate::{ + core::entities::{edges::edge_store::EdgeStore, LayerIds}, + db::{api::view::internal::InternalLayerOps, graph::graph::InternalGraph}, + prelude::Layer, +}; + +impl InternalLayerOps for InternalGraph { + fn layer_ids(&self) -> LayerIds { + LayerIds::All + } + + fn layer_ids_from_names(&self, key: Layer) -> LayerIds { + self.inner().layer_id(key) + } + + fn edge_layer_ids(&self, e: &EdgeStore) -> LayerIds { + e.layer_ids() + } +} diff --git a/raphtory/src/db/internal/materialize.rs b/raphtory/src/db/internal/materialize.rs new file mode 100644 index 0000000000..3a1daa780c --- /dev/null +++ b/raphtory/src/db/internal/materialize.rs @@ -0,0 +1,18 @@ +use crate::{ + core::entities::graph::tgraph::InnerTemporalGraph, + db::{ + api::view::internal::{InternalMaterialize, MaterializedGraph}, + graph::graph::{Graph, InternalGraph}, + }, +}; +use std::sync::Arc; + +impl InternalMaterialize for InnerTemporalGraph { + fn new_base_graph(&self, graph: InternalGraph) -> MaterializedGraph { + MaterializedGraph::EventGraph(Graph::new_from_inner(Arc::new(graph))) + } + + fn include_deletions(&self) -> bool { + false + } +} diff --git a/raphtory/src/db/internal/mod.rs b/raphtory/src/db/internal/mod.rs new file mode 100644 index 
0000000000..15f84749c6 --- /dev/null +++ b/raphtory/src/db/internal/mod.rs @@ -0,0 +1,11 @@ +pub(crate) mod addition; +pub(crate) mod core_ops; +pub(crate) mod deletion; +pub(crate) mod edge_filter_ops; +pub(crate) mod graph_ops; +pub(crate) mod layer_ops; +pub(crate) mod materialize; +pub(crate) mod prop_add; +pub(crate) mod static_properties; +pub(crate) mod temporal_properties; +pub(crate) mod time_semantics; diff --git a/raphtory/src/db/internal/prop_add.rs b/raphtory/src/db/internal/prop_add.rs new file mode 100644 index 0000000000..74408b4ab2 --- /dev/null +++ b/raphtory/src/db/internal/prop_add.rs @@ -0,0 +1,69 @@ +use crate::{ + core::{ + entities::{graph::tgraph::InnerTemporalGraph, EID, VID}, + storage::timeindex::TimeIndexEntry, + utils::errors::GraphError, + }, + db::api::{mutation::internal::InternalPropertyAdditionOps, view::internal::CoreGraphOps}, + prelude::Prop, +}; + +impl InternalPropertyAdditionOps for InnerTemporalGraph { + fn internal_add_properties( + &self, + t: TimeIndexEntry, + props: Vec<(usize, Prop)>, + ) -> Result<(), GraphError> { + self.inner().add_properties(t, props) + } + + fn internal_add_static_properties(&self, props: Vec<(usize, Prop)>) -> Result<(), GraphError> { + self.inner().add_constant_properties(props) + } + + fn internal_add_constant_vertex_properties( + &self, + vid: VID, + props: Vec<(usize, Prop)>, + ) -> Result<(), GraphError> { + let mut node = self.inner().storage.get_node_mut(vid); + for (prop_id, value) in props { + node.add_constant_prop(prop_id, value).map_err(|err| { + let name = self.vertex_meta().get_prop_name(prop_id, true); + GraphError::ConstantPropertyMutationError { + name, + new: err.new_value.expect("new value exists"), + old: err + .previous_value + .expect("previous value exists if set failed"), + } + })?; + } + Ok(()) + } + + fn internal_add_constant_edge_properties( + &self, + eid: EID, + layer: usize, + props: Vec<(usize, Prop)>, + ) -> Result<(), GraphError> { + let mut edge = 
self.inner().storage.get_edge_mut(eid); + let mut edge_layer = edge.layer_mut(layer); + for (prop_id, value) in props { + edge_layer + .add_constant_prop(prop_id, value) + .map_err(|err| { + let name = self.edge_meta().get_prop_name(prop_id, true); + GraphError::ConstantPropertyMutationError { + name, + new: err.new_value.expect("new value exists"), + old: err + .previous_value + .expect("previous value exists if set failed"), + } + })?; + } + Ok(()) + } +} diff --git a/raphtory/src/db/internal/static_properties.rs b/raphtory/src/db/internal/static_properties.rs new file mode 100644 index 0000000000..37857a0f4e --- /dev/null +++ b/raphtory/src/db/internal/static_properties.rs @@ -0,0 +1,26 @@ +use crate::{ + core::{entities::graph::tgraph::InnerTemporalGraph, ArcStr, Prop}, + db::api::properties::internal::ConstPropertiesOps, +}; + +impl ConstPropertiesOps for InnerTemporalGraph { + fn get_const_prop_id(&self, name: &str) -> Option { + self.inner().graph_props.get_const_prop_id(name) + } + + fn get_const_prop_name(&self, id: usize) -> ArcStr { + self.inner().graph_props.get_const_prop_name(id) + } + + fn const_prop_ids(&self) -> Box> { + Box::new(self.inner().graph_props.const_prop_ids()) + } + + fn const_prop_keys(&self) -> Box> { + Box::new(self.inner().const_prop_names().into_iter()) + } + + fn get_const_prop(&self, prop_id: usize) -> Option { + self.inner().get_constant_prop(prop_id) + } +} diff --git a/raphtory/src/db/internal/temporal_properties.rs b/raphtory/src/db/internal/temporal_properties.rs new file mode 100644 index 0000000000..2a3e734109 --- /dev/null +++ b/raphtory/src/db/internal/temporal_properties.rs @@ -0,0 +1,50 @@ +use crate::{ + core::{entities::graph::tgraph::InnerTemporalGraph, ArcStr, Prop}, + db::api::properties::internal::{TemporalPropertiesOps, TemporalPropertyViewOps}, +}; + +impl TemporalPropertyViewOps for InnerTemporalGraph { + fn temporal_value(&self, id: usize) -> Option { + self.inner() + .get_temporal_prop(id) + .and_then(|prop| 
prop.last_before(i64::MAX).map(|(_, v)| v)) + } + + fn temporal_history(&self, id: usize) -> Vec { + self.inner() + .get_temporal_prop(id) + .map(|prop| prop.iter().map(|(t, _)| t).collect()) + .unwrap_or_default() + } + + fn temporal_values(&self, id: usize) -> Vec { + self.inner() + .get_temporal_prop(id) + .map(|prop| prop.iter().map(|(_, v)| v).collect()) + .unwrap_or_default() + } + + fn temporal_value_at(&self, id: usize, t: i64) -> Option { + self.inner() + .get_temporal_prop(id) + .and_then(|prop| prop.last_before(t.saturating_add(1)).map(|(_, v)| v)) + } +} + +impl TemporalPropertiesOps for InnerTemporalGraph { + fn get_temporal_prop_id(&self, name: &str) -> Option { + self.inner().graph_props.get_temporal_id(name) + } + + fn get_temporal_prop_name(&self, id: usize) -> ArcStr { + self.inner().graph_props.get_temporal_name(id) + } + + fn temporal_prop_ids(&self) -> Box + '_> { + Box::new(self.inner().graph_props.temporal_ids()) + } + + fn temporal_prop_keys(&self) -> Box + '_> { + Box::new(self.inner().graph_props.temporal_names().into_iter()) + } +} diff --git a/raphtory/src/db/internal/time_semantics.rs b/raphtory/src/db/internal/time_semantics.rs new file mode 100644 index 0000000000..a4bd71511b --- /dev/null +++ b/raphtory/src/db/internal/time_semantics.rs @@ -0,0 +1,335 @@ +use crate::{ + core::{ + entities::{ + edges::{edge_ref::EdgeRef, edge_store::EdgeStore}, + graph::tgraph::InnerTemporalGraph, + LayerIds, VID, + }, + storage::timeindex::{AsTime, TimeIndexOps}, + }, + db::api::view::{ + internal::{CoreDeletionOps, CoreGraphOps, EdgeFilter, TimeSemantics}, + BoxedIter, + }, + prelude::Prop, +}; +use genawaiter::sync::GenBoxed; +use rayon::prelude::*; +use std::ops::Range; + +impl TimeSemantics for InnerTemporalGraph { + fn vertex_earliest_time(&self, v: VID) -> Option { + self.inner().node_entry(v).value().timestamps().first_t() + } + + fn vertex_latest_time(&self, v: VID) -> Option { + self.inner().node_entry(v).value().timestamps().last_t() + } + 
+ fn view_start(&self) -> Option { + self.earliest_time_global() + } + + fn view_end(&self) -> Option { + self.latest_time_global().map(|t| t.saturating_add(1)) // so it is exclusive + } + + fn earliest_time_global(&self) -> Option { + self.inner().graph_earliest_time() + } + + fn latest_time_global(&self) -> Option { + self.inner().graph_latest_time() + } + + fn earliest_time_window(&self, t_start: i64, t_end: i64) -> Option { + self.inner() + .storage + .nodes + .read_lock() + .into_par_iter() + .flat_map(|v| v.timestamps().range(t_start..t_end).first_t()) + .min() + } + + fn latest_time_window(&self, t_start: i64, t_end: i64) -> Option { + self.inner() + .storage + .nodes + .read_lock() + .into_par_iter() + .flat_map(|v| v.timestamps().range(t_start..t_end).last_t()) + .max() + } + + fn vertex_earliest_time_window(&self, v: VID, t_start: i64, t_end: i64) -> Option { + self.inner() + .node_entry(v) + .value() + .timestamps() + .range(t_start..t_end) + .first_t() + } + + fn vertex_latest_time_window(&self, v: VID, t_start: i64, t_end: i64) -> Option { + self.inner() + .node_entry(v) + .value() + .timestamps() + .range(t_start..t_end) + .last_t() + } + + #[inline] + fn include_vertex_window( + &self, + v: VID, + w: Range, + _layer_ids: &LayerIds, + _edge_filter: Option<&EdgeFilter>, + ) -> bool { + self.inner().node_entry(v).timestamps().active(w) + } + + #[inline] + fn include_edge_window(&self, e: &EdgeStore, w: Range, layer_ids: &LayerIds) -> bool { + e.active(layer_ids, w) + } + + fn vertex_history(&self, v: VID) -> Vec { + self.vertex_additions(v).iter_t().copied().collect() + } + + fn vertex_history_window(&self, v: VID, w: Range) -> Vec { + self.vertex_additions(v) + .range(w) + .iter_t() + .copied() + .collect() + } + + fn edge_exploded(&self, e: EdgeRef, layer_ids: LayerIds) -> BoxedIter { + let arc = self.inner().edge_arc(e.pid()); + let layer_id = layer_ids.constrain_from_edge(e); + let iter: GenBoxed = GenBoxed::new_boxed(|co| async move { + // this is 
for when we explode edges we want to select the layer we get the timestamps from + for (l, t) in arc.timestamps_and_layers(layer_id) { + co.yield_(e.at(*t).at_layer(l)).await; + } + }); + Box::new(iter.into_iter()) + } + + fn edge_layers(&self, e: EdgeRef, layer_ids: LayerIds) -> BoxedIter { + let arc = self.inner().edge_arc(e.pid()); + let layer_ids = layer_ids.constrain_from_edge(e); + let iter: GenBoxed = GenBoxed::new_boxed(|co| async move { + for l in arc.layers() { + if layer_ids.contains(&l) { + co.yield_(e.at_layer(l)).await; + } + } + }); + Box::new(iter.into_iter()) + } + + fn edge_window_exploded( + &self, + e: EdgeRef, + w: Range, + layer_ids: LayerIds, + ) -> BoxedIter { + let arc = self.inner().edge_arc(e.pid()); + let layer_ids = layer_ids.constrain_from_edge(e); + let iter: GenBoxed = GenBoxed::new_boxed(|co| async move { + // this is for when we explode edges we want to select the layer we get the timestamps from + for (l, t) in arc.timestamps_and_layers_window(layer_ids, w) { + co.yield_(e.at(*t).at_layer(l)).await; + } + }); + Box::new(iter.into_iter()) + } + + fn edge_window_layers( + &self, + e: EdgeRef, + w: Range, + layer_ids: LayerIds, + ) -> BoxedIter { + let arc = self.inner().edge_arc(e.pid()); + let iter: GenBoxed = GenBoxed::new_boxed(|co| async move { + for l in arc.layers_window(w) { + if layer_ids.contains(&l) { + co.yield_(e.at_layer(l)).await; + } + } + }); + Box::new(iter.into_iter()) + } + + fn edge_earliest_time(&self, e: EdgeRef, layer_ids: LayerIds) -> Option { + e.time_t() + .or_else(|| self.edge_additions(e, layer_ids).first_t()) + } + + fn edge_earliest_time_window( + &self, + e: EdgeRef, + w: Range, + layer_ids: LayerIds, + ) -> Option { + e.time_t() + .or_else(|| self.edge_additions(e, layer_ids).range(w).first_t()) + } + + fn edge_latest_time(&self, e: EdgeRef, layer_ids: LayerIds) -> Option { + e.time_t() + .or_else(|| self.edge_additions(e, layer_ids).last_t()) + } + + fn edge_latest_time_window( + &self, + e: EdgeRef, 
+ w: Range, + layer_ids: LayerIds, + ) -> Option { + e.time_t() + .or_else(|| self.edge_additions(e, layer_ids).range(w).last_t()) + } + + fn edge_deletion_history(&self, e: EdgeRef, layer_ids: LayerIds) -> Vec { + self.edge_deletions(e, layer_ids) + .iter_t() + .copied() + .collect() + } + + fn edge_deletion_history_window( + &self, + e: EdgeRef, + w: Range, + layer_ids: LayerIds, + ) -> Vec { + self.edge_deletions(e, layer_ids) + .range(w) + .iter_t() + .copied() + .collect() + } + + fn has_temporal_prop(&self, prop_id: usize) -> bool { + prop_id < self.inner().graph_props.temporal_prop_meta().len() + } + + fn temporal_prop_vec(&self, prop_id: usize) -> Vec<(i64, Prop)> { + self.inner() + .get_temporal_prop(prop_id) + .map(|prop| prop.iter().collect()) + .unwrap_or_default() + } + + fn has_temporal_prop_window(&self, prop_id: usize, w: Range) -> bool { + self.inner() + .graph_props + .get_temporal_prop(prop_id) + .filter(|p| p.iter_window(w).next().is_some()) + .is_some() + } + + fn temporal_prop_vec_window( + &self, + prop_id: usize, + t_start: i64, + t_end: i64, + ) -> Vec<(i64, Prop)> { + self.inner() + .get_temporal_prop(prop_id) + .map(|prop| prop.iter_window(t_start..t_end).collect()) + .unwrap_or_default() + } + + fn has_temporal_vertex_prop(&self, v: VID, prop_id: usize) -> bool { + let entry = self.inner().storage.get_node(v); + entry.temporal_property(prop_id).is_some() + } + + fn temporal_vertex_prop_vec(&self, v: VID, prop_id: usize) -> Vec<(i64, Prop)> { + self.inner() + .vertex(v) + .temporal_properties(prop_id, None) + .collect() + } + + fn has_temporal_vertex_prop_window(&self, v: VID, prop_id: usize, w: Range) -> bool { + let entry = self.inner().storage.get_node(v); + entry + .temporal_property(prop_id) + .filter(|p| p.iter_window(w).next().is_some()) + .is_some() + } + + fn temporal_vertex_prop_vec_window( + &self, + v: VID, + prop_id: usize, + t_start: i64, + t_end: i64, + ) -> Vec<(i64, Prop)> { + self.inner() + .vertex(v) + 
.temporal_properties(prop_id, Some(t_start..t_end)) + .collect() + } + + fn has_temporal_edge_prop_window( + &self, + e: EdgeRef, + prop_id: usize, + w: Range, + layer_ids: LayerIds, + ) -> bool { + let entry = self.inner().storage.get_edge(e.pid()); + entry.has_temporal_prop_window(layer_ids, prop_id, w) + } + + fn temporal_edge_prop_vec_window( + &self, + e: EdgeRef, + prop_id: usize, + t_start: i64, + t_end: i64, + layer_ids: LayerIds, + ) -> Vec<(i64, Prop)> { + self.temporal_edge_prop(e, prop_id, layer_ids) + .map(|p| match e.time() { + Some(t) => { + if *t.t() >= t_start && *t.t() < t_end { + p.at(&t).map(|v| vec![(*t.t(), v)]).unwrap_or_default() + } else { + vec![] + } + } + None => p.iter_window(t_start..t_end).collect(), + }) + .unwrap_or_default() + } + + fn has_temporal_edge_prop(&self, e: EdgeRef, prop_id: usize, layer_ids: LayerIds) -> bool { + let entry = self.inner().storage.get_edge(e.pid()); + entry.has_temporal_prop(&layer_ids, prop_id) + } + + fn temporal_edge_prop_vec( + &self, + e: EdgeRef, + prop_id: usize, + layer_ids: LayerIds, + ) -> Vec<(i64, Prop)> { + self.temporal_edge_prop(e, prop_id, layer_ids) + .map(|p| match e.time() { + Some(t) => p.at(&t).map(|v| vec![(*t.t(), v)]).unwrap_or_default(), + None => p.iter().collect(), + }) + .unwrap_or_default() + } +} diff --git a/raphtory/src/db/mod.rs b/raphtory/src/db/mod.rs index e188e11a69..80ea7d70d2 100644 --- a/raphtory/src/db/mod.rs +++ b/raphtory/src/db/mod.rs @@ -1,12 +1,5 @@ -pub mod doc_strings; -pub mod edge; +pub mod api; pub mod graph; -pub mod graph_immutable; -pub mod graph_layer; -pub mod graph_window; -pub mod path; -pub mod subgraph_vertex; +pub(crate) mod internal; pub mod task; -pub mod vertex; -pub mod vertices; -pub mod view_api; +pub mod utils; diff --git a/raphtory/src/db/subgraph_vertex.rs b/raphtory/src/db/subgraph_vertex.rs deleted file mode 100644 index 7b02ffea6e..0000000000 --- a/raphtory/src/db/subgraph_vertex.rs +++ /dev/null @@ -1,481 +0,0 @@ -use 
crate::core::edge_ref::EdgeRef; -use crate::core::vertex_ref::{LocalVertexRef, VertexRef}; -use crate::core::{Direction, Prop}; -use crate::db::view_api::internal::GraphViewInternalOps; -use crate::db::view_api::GraphViewOps; -use rustc_hash::FxHashSet; -use std::collections::HashMap; -use std::iter; -use std::ops::Range; -use std::sync::Arc; - -#[derive(Clone, Debug)] -pub struct VertexSubgraph { - graph: G, - vertices: Arc>, -} - -impl VertexSubgraph { - pub(crate) fn new(graph: G, vertices: FxHashSet) -> Self { - Self {graph, vertices: Arc::new(vertices)} - } -} - - -impl GraphViewInternalOps for VertexSubgraph { - fn local_vertex(&self, v: VertexRef) -> Option { - self.graph - .local_vertex(v) - .filter(|v| self.vertices.contains(v)) - } - - fn local_vertex_window( - &self, - v: VertexRef, - t_start: i64, - t_end: i64, - ) -> Option { - self.graph - .local_vertex_window(v, t_start, t_end) - .filter(|v| self.vertices.contains(v)) - } - - fn get_unique_layers_internal(&self) -> Vec { - self.graph.get_unique_layers_internal() - } - - fn get_layer_name_by_id(&self, layer_id: usize) -> String { - self.graph.get_layer_name_by_id(layer_id) - } - - fn get_layer(&self, key: Option<&str>) -> Option { - self.graph.get_layer(key) - } - - fn view_start(&self) -> Option { - self.graph.view_start() - } - - fn view_end(&self) -> Option { - self.graph.view_end() - } - - fn earliest_time_global(&self) -> Option { - self.vertices - .iter() - .flat_map(|v| self.graph.vertex_earliest_time(*v)) - .min() - } - - fn earliest_time_window(&self, t_start: i64, t_end: i64) -> Option { - self.vertices - .iter() - .flat_map(|v| self.graph.vertex_earliest_time_window(*v, t_start, t_end)) - .min() - } - - fn latest_time_global(&self) -> Option { - self.vertices - .iter() - .flat_map(|v| self.graph.vertex_latest_time(*v)) - .max() - } - - fn latest_time_window(&self, t_start: i64, t_end: i64) -> Option { - self.vertices - .iter() - .flat_map(|v| self.graph.vertex_latest_time_window(*v, 
t_start, t_end)) - .max() - } - - fn vertices_len(&self) -> usize { - self.vertices.len() - } - - fn vertices_len_window(&self, t_start: i64, t_end: i64) -> usize { - self.vertices - .iter() - .filter(|&&v| { - self.graph - .has_vertex_ref_window(VertexRef::Local(v), t_start, t_end) - }) - .count() - } - - fn edges_len(&self, layer: Option) -> usize { - self.vertices - .iter() - .map(|v| self.degree(*v, Direction::OUT, layer)) - .sum() - } - - fn edges_len_window(&self, t_start: i64, t_end: i64, layer: Option) -> usize { - self.vertices - .iter() - .map(|v| self.degree_window(*v, t_start, t_end, Direction::OUT, layer)) - .sum() - } - - fn has_edge_ref(&self, src: VertexRef, dst: VertexRef, layer: usize) -> bool { - self.has_vertex_ref(src) - && self.has_vertex_ref(dst) - && self.graph.has_edge_ref(src, dst, layer) - } - - fn has_edge_ref_window( - &self, - src: VertexRef, - dst: VertexRef, - t_start: i64, - t_end: i64, - layer: usize, - ) -> bool { - self.has_vertex_ref(src) - && self.has_vertex_ref(dst) - && self - .graph - .has_edge_ref_window(src, dst, t_start, t_end, layer) - } - - fn has_vertex_ref(&self, v: VertexRef) -> bool { - self.local_vertex(v).is_some() - } - - fn has_vertex_ref_window(&self, v: VertexRef, t_start: i64, t_end: i64) -> bool { - self.local_vertex_window(v, t_start, t_end).is_some() - } - - fn degree(&self, v: LocalVertexRef, d: Direction, layer: Option) -> usize { - self.vertex_edges(v, d, layer).count() - } - - fn degree_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - d: Direction, - layer: Option, - ) -> usize { - self.vertex_edges_window(v, t_start, t_end, d, layer) - .count() - } - - fn vertex_ref(&self, v: u64) -> Option { - self.local_vertex(v.into()) - } - - fn vertex_id(&self, v: LocalVertexRef) -> u64 { - self.graph.vertex_id(v) - } - - fn vertex_ref_window(&self, v: u64, t_start: i64, t_end: i64) -> Option { - self.local_vertex_window(v.into(), t_start, t_end) - } - - fn vertex_earliest_time(&self, v: 
LocalVertexRef) -> Option { - self.vertex_edges(v, Direction::BOTH, None) - .flat_map(|e| self.graph.edge_timestamps(e, None).first().copied()) - .min() - } - - fn vertex_earliest_time_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - ) -> Option { - self.vertex_edges(v, Direction::BOTH, None) - .flat_map(|e| { - self.graph - .edge_timestamps(e, Some(t_start..t_end)) - .first() - .copied() - }) - .min() - } - - fn vertex_latest_time(&self, v: LocalVertexRef) -> Option { - self.vertex_edges(v, Direction::BOTH, None) - .flat_map(|e| self.graph.edge_timestamps(e, None).last().copied()) - .max() - } - - fn vertex_latest_time_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - ) -> Option { - self.vertex_edges(v, Direction::BOTH, None) - .flat_map(|e| { - self.graph - .edge_timestamps(e, Some(t_start..t_end)) - .last() - .copied() - }) - .max() - } - - fn vertex_refs(&self) -> Box + Send> { - // this sucks but seems to be the only way currently (see also http://smallcultfollowing.com/babysteps/blog/2018/09/02/rust-pattern-iterating-an-over-a-rc-vec-t/) - let verts = Vec::from_iter(self.vertices.iter().copied()); - Box::new(verts.into_iter()) - } - - fn vertex_refs_window( - &self, - t_start: i64, - t_end: i64, - ) -> Box + Send> { - let g = self.clone(); - Box::new( - self.vertex_refs() - .filter(move |&v| g.has_vertex_ref_window(VertexRef::Local(v), t_start, t_end)), - ) - } - - fn vertex_refs_shard(&self, shard: usize) -> Box + Send> { - // FIXME: if keep shards, they need to support views (i.e., implement GraphViewInternalOps, this is terrible!) - Box::new(self.vertex_refs().filter(move |&v| v.shard_id == shard)) - } - - fn vertex_refs_window_shard( - &self, - shard: usize, - t_start: i64, - t_end: i64, - ) -> Box + Send> { - // FIXME: if keep shards, they need to support views (i.e., implement GraphViewInternalOps, this is terrible!) 
- Box::new( - self.vertex_refs_window(t_start, t_end) - .filter(move |&v| v.shard_id == shard), - ) - } - - fn edge_ref(&self, src: VertexRef, dst: VertexRef, layer: usize) -> Option { - if self.has_vertex_ref(src) && self.has_vertex_ref(dst) { - self.graph.edge_ref(src, dst, layer) - } else { - None - } - } - - fn edge_ref_window( - &self, - src: VertexRef, - dst: VertexRef, - t_start: i64, - t_end: i64, - layer: usize, - ) -> Option { - if self.has_vertex_ref(src) && self.has_vertex_ref(dst) { - self.graph.edge_ref_window(src, dst, t_start, t_end, layer) - } else { - None - } - } - - fn edge_refs(&self, layer: Option) -> Box + Send> { - let g1 = self.clone(); - Box::new( - self.vertex_refs() - .flat_map(move |v| g1.vertex_edges(v, Direction::OUT, layer)), - ) - } - - fn edge_refs_window( - &self, - t_start: i64, - t_end: i64, - layer: Option, - ) -> Box + Send> { - let g1 = self.clone(); - Box::new( - self.vertex_refs().flat_map(move |v| { - g1.vertex_edges_window(v, t_start, t_end, Direction::OUT, layer) - }), - ) - } - - fn vertex_edges( - &self, - v: LocalVertexRef, - d: Direction, - layer: Option, - ) -> Box + Send> { - let g = self.clone(); - Box::new( - self.graph - .vertex_edges(v, d, layer) - .filter(move |&e| g.has_vertex_ref(e.remote())), - ) - } - - fn vertex_edges_t( - &self, - v: LocalVertexRef, - d: Direction, - layer: Option, - ) -> Box + Send> { - // FIXME: Could be improved if we had an edge_t function as it calls filter too many times - let g = self.clone(); - Box::new( - self.graph - .vertex_edges_t(v, d, layer) - .filter(move |&e| g.has_vertex_ref(e.remote())), - ) - } - - fn vertex_edges_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - d: Direction, - layer: Option, - ) -> Box + Send> { - let g = self.clone(); - Box::new( - self.graph - .vertex_edges_window(v, t_start, t_end, d, layer) - .filter(move |&e| g.has_vertex_ref(e.remote())), - ) - } - - fn vertex_edges_window_t( - &self, - v: LocalVertexRef, - t_start: i64, - 
t_end: i64, - d: Direction, - layer: Option, - ) -> Box + Send> { - // FIXME: Could be improved if we had an edge_t function as it calls filter too many times - let g = self.clone(); - Box::new( - self.graph - .vertex_edges_window_t(v, t_start, t_end, d, layer) - .filter(move |&e| g.has_vertex_ref(e.remote())), - ) - } - - fn neighbours( - &self, - v: LocalVertexRef, - d: Direction, - layer: Option, - ) -> Box + Send> { - Box::new(self.vertex_edges(v, d, layer).map(|e| e.remote())) - } - - fn neighbours_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - d: Direction, - layer: Option, - ) -> Box + Send> { - Box::new( - self.vertex_edges_window(v, t_start, t_end, d, layer) - .map(|e| e.remote()), - ) - } - - fn static_vertex_prop(&self, v: LocalVertexRef, name: String) -> Option { - self.graph.static_vertex_prop(v, name) - } - - fn static_vertex_prop_names(&self, v: LocalVertexRef) -> Vec { - self.graph.static_vertex_prop_names(v) - } - - fn temporal_vertex_prop_names(&self, v: LocalVertexRef) -> Vec { - self.graph.temporal_vertex_prop_names(v) - } - - fn temporal_vertex_prop_vec(&self, v: LocalVertexRef, name: String) -> Vec<(i64, Prop)> { - self.graph.temporal_vertex_prop_vec(v, name) - } - - fn vertex_timestamps(&self, v: LocalVertexRef) -> Vec { - self.graph.vertex_timestamps(v) - } - - fn vertex_timestamps_window(&self, v: LocalVertexRef, t_start: i64, t_end: i64) -> Vec { - self.graph.vertex_timestamps_window(v, t_start, t_end) - } - - fn temporal_vertex_prop_vec_window( - &self, - v: LocalVertexRef, - name: String, - t_start: i64, - t_end: i64, - ) -> Vec<(i64, Prop)> { - self.graph - .temporal_vertex_prop_vec_window(v, name, t_start, t_end) - } - - fn temporal_vertex_props(&self, v: LocalVertexRef) -> HashMap> { - self.graph.temporal_vertex_props(v) - } - - fn temporal_vertex_props_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - ) -> HashMap> { - self.graph.temporal_vertex_props_window(v, t_start, t_end) - } - - fn 
static_edge_prop(&self, e: EdgeRef, name: String) -> Option { - self.graph.static_edge_prop(e, name) - } - - fn static_edge_prop_names(&self, e: EdgeRef) -> Vec { - self.graph.static_edge_prop_names(e) - } - - fn temporal_edge_prop_names(&self, e: EdgeRef) -> Vec { - self.graph.temporal_edge_prop_names(e) - } - - fn temporal_edge_props_vec(&self, e: EdgeRef, name: String) -> Vec<(i64, Prop)> { - self.graph.temporal_edge_props_vec(e, name) - } - - fn temporal_edge_props_vec_window( - &self, - e: EdgeRef, - name: String, - t_start: i64, - t_end: i64, - ) -> Vec<(i64, Prop)> { - self.graph - .temporal_edge_props_vec_window(e, name, t_start, t_end) - } - - fn edge_timestamps(&self, e: EdgeRef, window: Option>) -> Vec { - self.graph.edge_timestamps(e, window) - } - - fn temporal_edge_props(&self, e: EdgeRef) -> HashMap> { - self.graph.temporal_edge_props(e) - } - - fn temporal_edge_props_window( - &self, - e: EdgeRef, - t_start: i64, - t_end: i64, - ) -> HashMap> { - self.graph.temporal_edge_props_window(e, t_start, t_end) - } - - fn num_shards(&self) -> usize { - self.graph.num_shards() - } -} diff --git a/raphtory/src/db/task/context.rs b/raphtory/src/db/task/context.rs index 2772917f9a..1124203b74 100644 --- a/raphtory/src/db/task/context.rs +++ b/raphtory/src/db/task/context.rs @@ -1,17 +1,15 @@ -use std::sync::Arc; - +use super::task_state::{Global, Shard}; use crate::{ core::{ - agg::Accumulator, + entities::VID, state::{ - accumulator_id::AccId, compute_state::ComputeState, shuffle_state::ShuffleComputeState, - StateType, + accumulator_id::AccId, agg::Accumulator, compute_state::ComputeState, + shuffle_state::ShuffleComputeState, StateType, }, }, - db::view_api::GraphViewOps, + db::{api::view::GraphViewOps, graph::vertex::VertexView}, }; - -use super::task_state::{Global, Shard}; +use std::{fmt::Debug, sync::Arc}; type MergeFn = Arc, &ShuffleComputeState, usize) + Send + Sync>; @@ -32,6 +30,20 @@ where G: GraphViewOps, CS: ComputeState, { + pub fn 
new_local_state) -> O>( + &self, + init_f: F, + ) -> Vec { + let n = self.g.unfiltered_num_vertices(); + let mut new_state = Vec::with_capacity(n); + for i in 0..n { + match self.g.vertex(VID(i)) { + Some(v) => new_state.push(init_f(v)), + None => new_state.push(O::default()), + } + } + new_state + } pub fn ss(&self) -> usize { self.ss } @@ -61,7 +73,6 @@ where mut a: Arc>, mut b: Arc>, ) -> Arc> { - // println!("Running merge \na: {:?} \nb: {:?}", a,b); if let Some(left) = Arc::get_mut(&mut a) { for merge_fn in self.merge_fns.iter() { merge_fn(left, &b, self.ss); @@ -82,7 +93,7 @@ where &mut self, id: AccId, ) { - let fn_merge: MergeFn = Arc::new(move |a, b, ss| a.merge_mut_2(b, id, ss)); + let fn_merge: MergeFn = Arc::new(move |a, b, ss| a.merge_mut(b, id, ss)); self.merge_fns.push(fn_merge); } @@ -91,7 +102,7 @@ where &mut self, id: AccId, ) { - let fn_merge: MergeFn = Arc::new(move |a, b, ss| a.merge_mut_2(b, id, ss)); + let fn_merge: MergeFn = Arc::new(move |a, b, ss| a.merge_mut(b, id, ss)); self.merge_fns.push(fn_merge); self.resetable_states.push(id.id()); @@ -146,7 +157,6 @@ pub struct GlobalState { } impl GlobalState { - pub fn finalize>( &self, agg_def: &AccId, @@ -157,7 +167,8 @@ impl GlobalState { { // ss needs to be incremented because the loop ran once and at the end it incremented the state thus // the value is on the previous ss - self.state.inner() + self.state + .inner() .read_global(self.ss + 1, agg_def) .unwrap_or_default() } diff --git a/raphtory/src/db/task/edge/eval_edge.rs b/raphtory/src/db/task/edge/eval_edge.rs new file mode 100644 index 0000000000..b6d5031e61 --- /dev/null +++ b/raphtory/src/db/task/edge/eval_edge.rs @@ -0,0 +1,277 @@ +use crate::{ + core::{ + entities::{edges::edge_ref::EdgeRef, LayerIds, VID}, + state::compute_state::ComputeState, + ArcStr, Prop, + }, + db::{ + api::{ + properties::{ + internal::{ConstPropertiesOps, TemporalPropertiesOps, TemporalPropertyViewOps}, + Properties, + }, + view::*, + }, + task::{ + 
task_state::Local2, + vertex::{eval_vertex::EvalVertexView, eval_vertex_state::EVState}, + }, + }, +}; +use std::{cell::RefCell, iter, marker::PhantomData, rc::Rc}; + +pub struct EvalEdgeView<'a, G: GraphViewOps, CS: ComputeState, S> { + ss: usize, + ev: EdgeRef, + graph: &'a G, + vertex_state: Rc>>, + local_state_prev: &'a Local2<'a, S>, + _s: PhantomData, +} + +impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> EvalEdgeView<'a, G, CS, S> { + pub(crate) fn new( + ss: usize, + ev: EdgeRef, + graph: &'a G, + vertex_state: Rc>>, + local_state_prev: &'a Local2<'a, S>, + ) -> Self { + Self { + ss, + ev, + graph, + vertex_state, + local_state_prev, + _s: PhantomData, + } + } + + fn layer_ids(&self) -> LayerIds { + self.graph.layer_ids().constrain_from_edge(self.ev) + } +} + +impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> + EdgeViewInternalOps> for EvalEdgeView<'a, G, CS, S> +{ + fn graph(&self) -> G { + self.graph.clone() + } + + fn eref(&self) -> EdgeRef { + self.ev + } + + fn new_vertex(&self, v: VID) -> EvalVertexView<'a, G, CS, S> { + EvalVertexView::new_local( + self.ss, + v, + self.graph, + None, + self.local_state_prev, + self.vertex_state.clone(), + ) + } + + fn new_edge(&self, e: EdgeRef) -> Self { + EvalEdgeView::new_( + self.ss, + e, + self.graph, + self.local_state_prev, + self.vertex_state.clone(), + ) + } +} + +impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> ConstPropertiesOps + for EvalEdgeView<'a, G, CS, S> +{ + fn get_const_prop_id(&self, name: &str) -> Option { + self.graph.edge_meta().const_prop_meta().get_id(name) + } + + fn get_const_prop_name(&self, id: usize) -> ArcStr { + self.graph.edge_meta().const_prop_meta().get_name(id) + } + + fn const_prop_ids(&self) -> Box + '_> { + self.graph + .const_edge_prop_ids(self.ev, self.graph.layer_ids()) + } + + fn get_const_prop(&self, prop_id: usize) -> Option { + self.graph + .get_const_edge_prop(self.ev, prop_id, self.graph.layer_ids()) + } +} + +impl<'a, G: GraphViewOps, CS: 
ComputeState, S: 'static> Clone for EvalEdgeView<'a, G, CS, S> { + fn clone(&self) -> Self { + Self { + ss: self.ss, + ev: self.ev, + graph: self.graph, + vertex_state: self.vertex_state.clone(), + local_state_prev: self.local_state_prev, + _s: Default::default(), + } + } +} + +impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> TemporalPropertyViewOps + for EvalEdgeView<'a, G, CS, S> +{ + fn temporal_history(&self, id: usize) -> Vec { + self.graph + .temporal_edge_prop_vec(self.ev, id, self.graph.layer_ids()) + .into_iter() + .map(|(t, _)| t) + .collect() + } + + fn temporal_values(&self, id: usize) -> Vec { + self.graph + .temporal_edge_prop_vec(self.ev, id, self.graph.layer_ids()) + .into_iter() + .map(|(_, v)| v) + .collect() + } +} + +impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> TemporalPropertiesOps + for EvalEdgeView<'a, G, CS, S> +{ + fn get_temporal_prop_id(&self, name: &str) -> Option { + self.graph + .edge_meta() + .temporal_prop_meta() + .get_id(name) + .filter(|id| { + self.graph + .has_temporal_edge_prop(self.ev, *id, self.layer_ids()) + }) + } + + fn get_temporal_prop_name(&self, id: usize) -> ArcStr { + self.graph.edge_meta().temporal_prop_meta().get_name(id) + } + + fn temporal_prop_ids(&self) -> Box + '_> { + Box::new( + self.graph + .temporal_edge_prop_ids(self.ev, self.layer_ids()) + .filter(|id| { + self.graph + .has_temporal_edge_prop(self.ev, *id, self.layer_ids()) + }), + ) + } +} + +impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> EdgeViewOps for EvalEdgeView<'a, G, CS, S> { + type Graph = G; + type Vertex = EvalVertexView<'a, G, CS, S>; + type EList = Box + 'a>; + + fn explode(&self) -> Self::EList { + let iter: Box> = match self.ev.time() { + Some(_) => Box::new(iter::once(self.ev)), + None => Box::new(self.graph.edge_exploded(self.ev, LayerIds::All)), + }; + + let ss = self.ss; + let g = self.graph; + let vertex_state = self.vertex_state.clone(); + let local_state_prev = self.local_state_prev; + Box::new( + 
iter.map(move |ev| { + EvalEdgeView::new(ss, ev, g, vertex_state.clone(), local_state_prev) + }), + ) + } + + fn explode_layers(&self) -> Self::EList { + let iter: Box> = match self.ev.time() { + Some(_) => Box::new(iter::once(self.ev)), + None => Box::new(self.graph.edge_layers(self.ev, LayerIds::All)), + }; + + let ss = self.ss; + let g = self.graph; + let vertex_state = self.vertex_state.clone(); + let local_state_prev = self.local_state_prev; + Box::new( + iter.map(move |ev| { + EvalEdgeView::new(ss, ev, g, vertex_state.clone(), local_state_prev) + }), + ) + } +} + +impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> EdgeListOps + for Box> + 'a> +{ + type Graph = G; + type Vertex = EvalVertexView<'a, G, CS, S>; + type Edge = EvalEdgeView<'a, G, CS, S>; + type ValueType = T; + type VList = Box + 'a>; + type IterType = Box + 'a>; + + fn properties(self) -> Self::IterType> { + Box::new(self.map(move |e| e.properties())) + } + + fn src(self) -> Self::VList { + Box::new(self.map(|e| e.src())) + } + + fn dst(self) -> Self::VList { + Box::new(self.map(|e| e.dst())) + } + + fn id(self) -> Self::IterType<(u64, u64)> { + Box::new(self.map(|e| e.id())) + } + + fn explode(self) -> Self::IterType { + Box::new(self.flat_map(|e| e.explode())) + } + + fn earliest_time(self) -> Self::IterType> { + Box::new(self.map(|e| e.earliest_time())) + } + + fn latest_time(self) -> Self::IterType> { + Box::new(self.map(|e| e.latest_time())) + } + + fn time(self) -> Self::IterType> { + Box::new(self.map(|e| e.time())) + } + + fn layer_name(self) -> Self::IterType> { + Box::new(self.map(|e| e.layer_name().map(|v| v.clone()))) + } +} + +impl<'a, G: GraphViewOps, CS: ComputeState, S> EvalEdgeView<'a, G, CS, S> { + pub(crate) fn new_( + ss: usize, + ev: EdgeRef, + graph: &'a G, + local_state_prev: &'a Local2<'a, S>, + vertex_state: Rc>>, + ) -> Self { + Self { + ss, + ev, + graph, + vertex_state, + local_state_prev, + _s: PhantomData, + } + } +} diff --git a/raphtory/src/db/task/edge/mod.rs 
b/raphtory/src/db/task/edge/mod.rs new file mode 100644 index 0000000000..4bb00ca1e8 --- /dev/null +++ b/raphtory/src/db/task/edge/mod.rs @@ -0,0 +1,2 @@ +pub mod eval_edge; +pub mod window_eval_edge; diff --git a/raphtory/src/db/task/edge/window_eval_edge.rs b/raphtory/src/db/task/edge/window_eval_edge.rs new file mode 100644 index 0000000000..78d5a6c6ed --- /dev/null +++ b/raphtory/src/db/task/edge/window_eval_edge.rs @@ -0,0 +1,391 @@ +use crate::{ + core::{ + entities::{edges::edge_ref::EdgeRef, LayerIds, VID}, + state::compute_state::ComputeState, + ArcStr, Prop, + }, + db::{ + api::{ + properties::{ + internal::{ConstPropertiesOps, TemporalPropertiesOps, TemporalPropertyViewOps}, + Properties, + }, + view::{internal::*, *}, + }, + graph::views::window_graph::WindowedGraph, + task::{ + task_state::Local2, + vertex::{eval_vertex_state::EVState, window_eval_vertex::WindowEvalVertex}, + }, + }, +}; +use std::{cell::RefCell, iter, marker::PhantomData, rc::Rc}; + +pub struct WindowEvalEdgeView<'a, G: GraphViewOps, CS: ComputeState, S: 'static> { + ss: usize, + ev: EdgeRef, + g: &'a G, + vertex_state: Rc>>, + local_state_prev: &'a Local2<'a, S>, + t_start: i64, + t_end: i64, + _s: PhantomData, + edge_filter: Option>, +} + +impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> WindowEvalEdgeView<'a, G, CS, S> { + pub(crate) fn new( + ss: usize, + ev: EdgeRef, + g: &'a G, + local_state_prev: &'a Local2<'a, S>, + vertex_state: Rc>>, + t_start: i64, + t_end: i64, + edge_filter: Option>, + ) -> Self { + Self { + ss, + ev, + g, + vertex_state, + local_state_prev, + t_start, + t_end, + _s: PhantomData, + edge_filter, + } + } + + pub fn history(&self) -> Vec { + self.graph() + .edge_window_exploded(self.eref(), self.t_start..self.t_end, LayerIds::All) + .map(|e| e.time_t().expect("exploded")) + .collect() + } + + fn layer_ids(&self) -> LayerIds { + self.g.layer_ids().constrain_from_edge(self.ev) + } +} +impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> + 
EdgeViewInternalOps, WindowEvalVertex<'a, G, CS, S>> + for WindowEvalEdgeView<'a, G, CS, S> +{ + fn graph(&self) -> WindowedGraph { + WindowedGraph::new(self.g.clone(), self.t_start, self.t_end) + } + + fn eref(&self) -> EdgeRef { + self.ev.clone() + } + + fn new_vertex(&self, v: VID) -> WindowEvalVertex<'a, G, CS, S> { + WindowEvalVertex::new( + self.ss, + v, + self.g, + None, + self.local_state_prev, + self.vertex_state.clone(), + self.t_start, + self.t_end, + self.edge_filter.clone(), + ) + } + + fn new_edge(&self, e: EdgeRef) -> Self { + WindowEvalEdgeView::new( + self.ss, + e, + self.g, + self.local_state_prev, + self.vertex_state.clone(), + self.t_start, + self.t_end, + self.edge_filter.clone(), + ) + } +} + +impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> ConstPropertiesOps + for WindowEvalEdgeView<'a, G, CS, S> +{ + fn get_const_prop_id(&self, name: &str) -> Option { + self.g.edge_meta().const_prop_meta().get_id(name) + } + + fn get_const_prop_name(&self, id: usize) -> ArcStr { + self.g.edge_meta().const_prop_meta().get_name(id) + } + + fn const_prop_ids(&self) -> Box + '_> { + self.g.const_edge_prop_ids(self.ev, self.g.layer_ids()) + } + + fn get_const_prop(&self, prop_id: usize) -> Option { + self.graph() + .get_const_edge_prop(self.ev, prop_id, self.g.layer_ids()) + } +} + +impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> Clone for WindowEvalEdgeView<'a, G, CS, S> { + fn clone(&self) -> Self { + Self { + ss: self.ss, + ev: self.ev, + g: self.g, + vertex_state: self.vertex_state.clone(), + local_state_prev: self.local_state_prev, + t_start: self.t_start, + t_end: self.t_end, + _s: Default::default(), + edge_filter: self.edge_filter.clone(), + } + } +} + +impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> TemporalPropertyViewOps + for WindowEvalEdgeView<'a, G, CS, S> +{ + fn temporal_value(&self, id: usize) -> Option { + self.g + .temporal_edge_prop_vec_window( + self.ev, + id, + self.t_start, + self.t_end, + self.g.layer_ids(), + ) + 
.last() + .map(|(_, v)| v.to_owned()) + } + + fn temporal_history(&self, id: usize) -> Vec { + self.g + .temporal_edge_prop_vec_window( + self.ev, + id, + self.t_start, + self.t_end, + self.g.layer_ids(), + ) + .into_iter() + .map(|(t, _)| t) + .collect() + } + + fn temporal_values(&self, id: usize) -> Vec { + self.g + .temporal_edge_prop_vec_window( + self.ev, + id, + self.t_start, + self.t_end, + self.g.layer_ids(), + ) + .into_iter() + .map(|(_, v)| v) + .collect() + } +} + +impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> TemporalPropertiesOps + for WindowEvalEdgeView<'a, G, CS, S> +{ + fn get_temporal_prop_id(&self, key: &str) -> Option { + self.g + .edge_meta() + .temporal_prop_meta() + .get_id(key) + .filter(|&id| { + self.g.has_temporal_edge_prop_window( + self.ev, + id, + self.t_start..self.t_end, + self.layer_ids(), + ) + }) + } + + fn get_temporal_prop_name(&self, id: usize) -> ArcStr { + self.g.edge_meta().temporal_prop_meta().get_name(id) + } + + fn temporal_prop_ids(&self) -> Box + '_> { + Box::new( + self.g + .temporal_edge_prop_ids(self.ev, self.g.layer_ids()) + .filter(|&id| { + self.g.has_temporal_edge_prop_window( + self.ev, + id, + self.t_start..self.t_end, + self.layer_ids(), + ) + }), + ) + } +} + +impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> EdgeViewOps + for WindowEvalEdgeView<'a, G, CS, S> +{ + type Graph = WindowedGraph; + + type Vertex = WindowEvalVertex<'a, G, CS, S>; + + type EList = Box + 'a>; + + fn history(&self) -> Vec { + self.graph() + .edge_window_exploded(self.ev, self.t_start..self.t_end, self.g.layer_ids()) + .map(|eref| eref.time_t().expect("exploded")) + .collect() + } + + /// Check if edge is active at a given time point + fn active(&self, t: i64) -> bool { + match self.eref().time_t() { + Some(tt) => tt <= t && t <= self.latest_time().unwrap_or(tt), + None => { + let layer_ids = self.graph().layer_ids().constrain_from_edge(self.eref()); + let entry = self.graph().core_edge(self.eref().pid()); + 
(self.t_start..self.t_end).contains(&t) + && self + .graph() + .include_edge_window(&entry, t..t.saturating_add(1), &layer_ids) + } + } + } + + fn explode(&self) -> Self::EList { + let e = self.ev.clone(); + let t_start = self.t_start; + let t_end = self.t_end; + let ss = self.ss; + let g = self.g; + let layer_ids = g.layer_ids(); + let vertex_state = self.vertex_state.clone(); + let local_state_prev = self.local_state_prev; + let edge_filter = self.edge_filter.clone(); + match self.ev.time() { + Some(_) => Box::new(iter::once(self.new_edge(e))), + None => { + let ts = self.g.edge_window_exploded(e, t_start..t_end, layer_ids); + Box::new(ts.map(move |ex| { + WindowEvalEdgeView::new( + ss, + ex, + g, + local_state_prev, + vertex_state.clone(), + t_start, + t_end, + edge_filter.clone(), + ) + })) + } + } + } + + fn explode_layers(&self) -> Self::EList { + let e = self.ev.clone(); + let t_start = self.t_start; + let t_end = self.t_end; + let ss = self.ss; + let g = self.g; + let vertex_state = self.vertex_state.clone(); + let local_state_prev = self.local_state_prev; + let edge_filter = self.edge_filter.clone(); + let layer_ids = g.layer_ids(); + + match self.ev.time() { + Some(_) => Box::new(iter::once(self.new_edge(e))), + None => { + let ts = self.g.edge_window_layers(e, t_start..t_end, layer_ids); + Box::new(ts.map(move |ex| { + WindowEvalEdgeView::new( + ss, + ex, + g, + local_state_prev, + vertex_state.clone(), + t_start, + t_end, + edge_filter.clone(), + ) + })) + } + } + } + + /// Gets the first time an edge was seen + fn earliest_time(&self) -> Option { + self.eref().time_t().or_else(|| { + self.graph().edge_earliest_time_window( + self.eref(), + self.t_start..self.t_end, + LayerIds::All, + ) + }) + } + + /// Gets the latest time an edge was updated + fn latest_time(&self) -> Option { + self.eref().time_t().or_else(|| { + self.graph().edge_latest_time_window( + self.eref(), + self.t_start..self.t_end, + LayerIds::All, + ) + }) + } +} + +impl<'a, G: 
GraphViewOps, CS: ComputeState, S: 'static> EdgeListOps + for Box> + 'a> +{ + type Graph = WindowedGraph; + type Vertex = WindowEvalVertex<'a, G, CS, S>; + type Edge = WindowEvalEdgeView<'a, G, CS, S>; + type ValueType = T; + type VList = Box + 'a>; + type IterType = Box + 'a>; + + fn properties(self) -> Self::IterType> { + Box::new(self.map(move |e| e.properties())) + } + + fn src(self) -> Self::VList { + Box::new(self.map(|e| e.src())) + } + + fn dst(self) -> Self::VList { + Box::new(self.map(|e| e.dst())) + } + + fn id(self) -> Self::IterType<(u64, u64)> { + Box::new(self.map(|e| e.id())) + } + + fn explode(self) -> Self::IterType { + Box::new(self.flat_map(move |it| it.explode())) + } + + fn earliest_time(self) -> Self::IterType> { + Box::new(self.map(|e| e.earliest_time())) + } + + fn latest_time(self) -> Self::IterType> { + Box::new(self.map(|e| e.latest_time())) + } + + fn time(self) -> Self::IterType> { + Box::new(self.map(|e| e.time())) + } + + fn layer_name(self) -> Self::IterType> { + Box::new(self.map(|e| e.layer_name().map(|v| v.clone()))) + } +} diff --git a/raphtory/src/db/task/eval_edge.rs b/raphtory/src/db/task/eval_edge.rs deleted file mode 100644 index 7f9eb9859b..0000000000 --- a/raphtory/src/db/task/eval_edge.rs +++ /dev/null @@ -1,189 +0,0 @@ -use crate::core::edge_ref::EdgeRef; -use crate::core::state::compute_state::ComputeState; -use crate::core::vertex_ref::VertexRef; -use crate::core::Prop; -use crate::db::task::eval_vertex::EvalVertexView; -use crate::db::view_api::edge::{EdgeViewInternalOps, EdgeViewOps}; -use crate::db::view_api::{EdgeListOps, GraphViewOps}; -use std::cell::RefCell; -use std::collections::HashMap; -use std::iter; -use std::marker::PhantomData; -use std::rc::Rc; - -use super::eval_vertex_state::EVState; -use super::task_state::Local2; - -pub struct EvalEdgeView<'a, G: GraphViewOps, CS: ComputeState, S> { - ss: usize, - ev: EdgeRef, - graph: &'a G, - vertex_state: Rc>>, - local_state_prev: &'a Local2<'a, S>, - _s: 
PhantomData, -} - -impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> EvalEdgeView<'a, G, CS, S> { - pub(crate) fn new( - ss: usize, - ev: EdgeRef, - graph: &'a G, - vertex_state: Rc>>, - local_state_prev: &'a Local2<'a, S>, - ) -> Self { - Self { - ss, - ev, - graph, - vertex_state, - local_state_prev, - _s: PhantomData, - } - } -} - -impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> - EdgeViewInternalOps> for EvalEdgeView<'a, G, CS, S> -{ - fn graph(&self) -> G { - self.graph.clone() - } - - fn eref(&self) -> EdgeRef { - self.ev.clone() - } - - fn new_vertex(&self, v: VertexRef) -> EvalVertexView<'a, G, CS, S> { - EvalVertexView::new_local( - self.ss, - self.graph.localise_vertex_unchecked(v), - self.graph, - None, - self.local_state_prev, - self.vertex_state.clone(), - ) - } - - fn new_edge(&self, e: EdgeRef) -> Self { - EvalEdgeView::new_( - self.ss, - e, - self.graph, - self.local_state_prev, - self.vertex_state.clone(), - ) - } -} - -impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> EdgeViewOps for EvalEdgeView<'a, G, CS, S> { - type Graph = G; - type Vertex = EvalVertexView<'a, G, CS, S>; - type EList = Box + 'a>; - - fn explode(&self) -> Self::EList { - let iter: Box> = match self.ev.time() { - Some(_) => Box::new(iter::once(self.ev.clone())), - None => { - let e = self.ev.clone(); - let ts = self.graph.edge_timestamps(self.ev, None); - Box::new(ts.into_iter().map(move |t| e.at(t))) - } - }; - - let ss = self.ss; - let g = self.graph; - let vertex_state = self.vertex_state.clone(); - let local_state_prev = self.local_state_prev; - Box::new( - iter.map(move |ev| { - EvalEdgeView::new(ss, ev, g, vertex_state.clone(), local_state_prev) - }), - ) - } -} - -impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> EdgeListOps - for Box> + 'a> -{ - type Graph = G; - type Vertex = EvalVertexView<'a, G, CS, S>; - type Edge = EvalEdgeView<'a, G, CS, S>; - type ValueType = T; - type VList = Box + 'a>; - type IterType = Box + 'a>; - - fn 
has_property(self, name: String, include_static: bool) -> Self::IterType { - Box::new(self.map(move |e| e.has_property(name.clone(), include_static))) - } - - fn property(self, name: String, include_static: bool) -> Self::IterType> { - Box::new(self.map(move |e| e.property(name.clone(), include_static))) - } - - fn properties(self, include_static: bool) -> Self::IterType> { - Box::new(self.map(move |e| e.properties(include_static))) - } - - fn property_names(self, include_static: bool) -> Self::IterType> { - Box::new(self.map(move |e| e.property_names(include_static))) - } - - fn has_static_property(self, name: String) -> Self::IterType { - Box::new(self.map(move |e| e.has_static_property(name.clone()))) - } - - fn static_property(self, name: String) -> Self::IterType> { - Box::new(self.map(move |e| e.static_property(name.clone()))) - } - - fn property_history(self, name: String) -> Self::IterType> { - Box::new(self.map(move |e| e.property_history(name.clone()))) - } - - fn property_histories(self) -> Self::IterType>> { - Box::new(self.map(|e| e.property_histories())) - } - - fn src(self) -> Self::VList { - Box::new(self.map(|e| e.src())) - } - - fn dst(self) -> Self::VList { - Box::new(self.map(|e| e.dst())) - } - - fn id(self) -> Self::IterType<(u64, u64)> { - Box::new(self.map(|e| e.id())) - } - - fn explode(self) -> Self::IterType { - Box::new(self.flat_map(|e| e.explode())) - } - - fn earliest_time(self) -> Self::IterType> { - Box::new(self.map(|e| e.earliest_time())) - } - - fn latest_time(self) -> Self::IterType> { - Box::new(self.map(|e| e.latest_time())) - } -} - -impl<'a, G: GraphViewOps, CS: ComputeState, S> EvalEdgeView<'a, G, CS, S> { - pub(crate) fn new_( - ss: usize, - ev: EdgeRef, - graph: &'a G, - local_state_prev: &'a Local2<'a, S>, - vertex_state: Rc>>, - ) -> Self { - Self { - ss, - ev, - graph, - vertex_state, - local_state_prev, - _s: PhantomData, - } - } -} diff --git a/raphtory/src/db/task/mod.rs b/raphtory/src/db/task/mod.rs index 
2d878338e1..e6d1c19532 100644 --- a/raphtory/src/db/task/mod.rs +++ b/raphtory/src/db/task/mod.rs @@ -1,17 +1,13 @@ -use std::sync::Arc; - use once_cell::sync::Lazy; use rayon::{ThreadPool, ThreadPoolBuilder}; +use std::sync::Arc; pub mod context; -pub mod eval_edge; -pub mod eval_vertex; -pub mod eval_vertex_state; +pub mod edge; pub mod task; pub mod task_runner; pub(crate) mod task_state; -pub mod window_eval_vertex; -pub mod window_eval_edge; +pub mod vertex; pub static POOL: Lazy> = Lazy::new(|| { let num_threads = std::env::var("DOCBROWN_MAX_THREADS") @@ -46,7 +42,8 @@ pub fn custom_pool(n_threads: usize) -> Arc { mod task_tests { use crate::{ core::state::{self, compute_state::ComputeStateVec}, - db::graph::Graph, + db::{api::mutation::AdditionOps, task::vertex::eval_vertex::EvalVertexView}, + prelude::*, }; use super::{ @@ -58,7 +55,7 @@ mod task_tests { // count all the vertices with a global state #[test] fn count_all_vertices_with_global_state() { - let graph = Graph::new(2); + let graph = Graph::new(); let edges = vec![ (1, 2, 1), @@ -71,7 +68,7 @@ mod task_tests { ]; for (src, dst, ts) in edges { - graph.add_edge(ts, src, dst, &vec![], None).unwrap(); + graph.add_edge(ts, src, dst, NO_PROPS, None).unwrap(); } let mut ctx: Context = (&graph).into(); @@ -80,17 +77,19 @@ mod task_tests { ctx.global_agg(count.clone()); - let step1 = ATask::new(move |vv| { - vv.global_update(&count, 1); - Step::Done - }); + let step1 = ATask::new( + move |vv: &mut EvalVertexView<'_, Graph, ComputeStateVec, ()>| { + vv.global_update(&count, 1); + Step::Done + }, + ); let mut runner = TaskRunner::new(ctx); let actual = runner.run( vec![], vec![Job::new(step1)], - (), + None, |egs, _, _, _| egs.finalize(&count), Some(2), 1, diff --git a/raphtory/src/db/task/task.rs b/raphtory/src/db/task/task.rs index 32aba17c71..6d90944e07 100644 --- a/raphtory/src/db/task/task.rs +++ b/raphtory/src/db/task/task.rs @@ -1,11 +1,9 @@ -use std::marker::PhantomData; - -use 
crate::core::state::compute_state::ComputeState; -use crate::db::view_api::internal::GraphViewInternalOps; -use crate::db::view_api::GraphViewOps; - use super::context::GlobalState; -use super::eval_vertex::EvalVertexView; +use crate::{ + core::state::compute_state::ComputeState, + db::{api::view::GraphViewOps, task::vertex::eval_vertex::EvalVertexView}, +}; +use std::marker::PhantomData; pub trait Task where @@ -40,7 +38,7 @@ pub enum Job { Check(Box) -> Step + Send + Sync + 'static>), } -impl Job { +impl Job { pub fn new + Send + Sync + 'static>(t: T) -> Self { Self::Write(Box::new(t)) } diff --git a/raphtory/src/db/task/task_runner.rs b/raphtory/src/db/task/task_runner.rs index 62c90d33b1..5fcdf7d46e 100644 --- a/raphtory/src/db/task/task_runner.rs +++ b/raphtory/src/db/task/task_runner.rs @@ -1,24 +1,29 @@ -use std::{ - borrow::Cow, - rc::Rc, - sync::atomic::{AtomicBool, Ordering}, -}; - -use rayon::{prelude::*, ThreadPool}; - -use crate::core::state::shuffle_state::{EvalLocalState, EvalShardState}; -use crate::core::vertex_ref::LocalVertexRef; -use crate::{core::state::compute_state::ComputeState, db::view_api::GraphViewOps}; - use super::{ context::{Context, GlobalState}, custom_pool, - eval_vertex::EvalVertexView, - eval_vertex_state::EVState, task::{Job, Step, Task}, task_state::{Global, Local2, Shard}, POOL, }; +use crate::{ + core::{ + entities::vertices::vertex_ref::VertexRef, + state::{ + compute_state::ComputeState, + shuffle_state::{EvalLocalState, EvalShardState}, + }, + }, + db::{ + api::view::GraphViewOps, + task::vertex::{eval_vertex::EvalVertexView, eval_vertex_state::EVState}, + }, +}; +use rayon::{prelude::*, ThreadPool}; +use std::{ + borrow::Cow, + rc::Rc, + sync::atomic::{AtomicBool, Ordering}, +}; pub struct TaskRunner { pub(crate) ctx: Context, @@ -43,10 +48,11 @@ impl TaskRunner { &self, shard_state: &Shard, global_state: &Global, - morcel: &mut [Option<(LocalVertexRef, S)>], - prev_local_state: &Vec>, - max_shard_len: usize, + morcel: 
&mut [S], + prev_local_state: &Vec, atomic_done: &AtomicBool, + morcel_size: usize, + morcel_id: usize, task: &Box + Send + Sync>, ) -> (Shard, Global) { // the view for this task of the global state @@ -59,13 +65,17 @@ impl TaskRunner { let vertex_state = EVState::rc_from(shard_state_view, global_state_view); - let local = Local2::new(max_shard_len, prev_local_state); - - for line in morcel { - if let Some((v_ref, local_state)) = line { + let local = Local2::new(prev_local_state); + let mut v_ref = morcel_id * morcel_size; + for local_state in morcel { + if g.has_vertex_ref( + VertexRef::Internal(v_ref.into()), + &g.layer_ids(), + g.edge_filter().as_deref(), + ) { let mut vv = EvalVertexView::new_local( self.ctx.ss(), - v_ref.clone(), + v_ref.into(), &g, Some(local_state), &local, @@ -79,6 +89,7 @@ impl TaskRunner { Step::Done => {} } } + v_ref += 1; } if !done { @@ -112,19 +123,13 @@ impl TaskRunner { &mut self, tasks: &[Job], pool: &ThreadPool, + morcel_size: usize, shard_state: Shard, global_state: Global, - mut local_state: Vec>, - prev_local_state: &Vec>, - max_shard_len: usize, - ) -> ( - bool, - Shard, - Global, - Vec>, - ) { + mut local_state: Vec, + prev_local_state: &Vec, + ) -> (bool, Shard, Global, Vec) { pool.install(move || { - let chunk_size = 16_000; let mut new_shard_state = shard_state; let mut new_global_state = global_state; @@ -135,31 +140,37 @@ impl TaskRunner { let updated_state: Option<(Shard, Global)> = match task { Job::Write(task) => local_state - .par_chunks_mut(chunk_size) - .map(|morcel| { + .par_chunks_mut(morcel_size) + .enumerate() + .map(|(morcel_id, morcel)| { self.run_task_v2( &new_shard_state, &new_global_state, morcel, prev_local_state, - max_shard_len, &atomic_done, + morcel_size, + morcel_id, task, ) }) .reduce_with(|a, b| self.merge_states(a, b)), Job::Read(task) => { - local_state.par_chunks_mut(chunk_size).for_each(|morcel| { - self.run_task_v2( - &new_shard_state, - &new_global_state, - morcel, - prev_local_state, - 
max_shard_len, - &atomic_done, - task, - ); - }); + local_state + .par_chunks_mut(morcel_size) + .enumerate() + .for_each(|(morcel_id, morcel)| { + self.run_task_v2( + &new_shard_state, + &new_global_state, + morcel, + prev_local_state, + &atomic_done, + morcel_size, + morcel_id, + task, + ); + }); None } Job::Check(task) => { @@ -188,90 +199,68 @@ impl TaskRunner { }) } - fn make_cur_and_prev_states( - &self, - init: S, - ) -> ( - usize, - Vec>, - Vec>, - ) { + fn make_cur_and_prev_states(&self, mut init: Vec) -> (Vec, Vec) { let g = self.ctx.graph(); + init.resize(g.unfiltered_num_vertices(), S::default()); - // find the shard with the largest number of vertices - let max_shard_len = g.vertex_refs().map(|v| v.pid).max().unwrap_or(0) + 1; - - let n_shards = g.num_shards(); - - let mut states = vec![None; max_shard_len * n_shards]; - - for v_ref in g.vertex_refs() { - let LocalVertexRef { shard_id, pid } = v_ref; - let i = max_shard_len * shard_id + pid; - states[i] = Some((v_ref.clone(), init.clone())); - } - - (max_shard_len, states.clone(), states) + (init.clone(), init) } pub fn run< B: std::fmt::Debug, - F: FnOnce( - GlobalState, - EvalShardState, - EvalLocalState, - &Vec>, - ) -> B - + std::marker::Copy, - S: Send + Sync + Clone + 'static + std::fmt::Debug, + F: FnOnce(GlobalState, EvalShardState, EvalLocalState, Vec) -> B, + S: Send + Sync + Clone + 'static + std::fmt::Debug + Default, >( &mut self, init_tasks: Vec>, tasks: Vec>, - init: S, + init: Option>, f: F, num_threads: Option, steps: usize, shard_initial_state: Option>, global_initial_state: Option>, ) -> B { - let graph_shards = self.ctx.graph().num_shards(); - let pool = num_threads .map(|nt| custom_pool(nt)) .unwrap_or_else(|| POOL.clone()); - let mut shard_state = shard_initial_state.unwrap_or_else(|| Shard::new(graph_shards)); + let num_vertices = self.ctx.graph().unfiltered_num_vertices(); + let morcel_size = num_vertices.min(16_000); + let num_chunks = (num_vertices + morcel_size - 1) / 
morcel_size; + + let mut shard_state = shard_initial_state + .unwrap_or_else(|| Shard::new(num_vertices, num_chunks, morcel_size)); let mut global_state = global_initial_state.unwrap_or_else(|| Global::new()); - let (max_shard_len, mut cur_local_state, mut prev_local_state) = - self.make_cur_and_prev_states::(init); + let (mut cur_local_state, mut prev_local_state) = + self.make_cur_and_prev_states::(init.unwrap_or_default()); - let mut done = false; + let mut _done = false; - (done, shard_state, global_state, cur_local_state) = self.run_task_list( + (_done, shard_state, global_state, cur_local_state) = self.run_task_list( &init_tasks, &pool, + morcel_size, shard_state, global_state, cur_local_state, &prev_local_state, - max_shard_len, ); // To allow the init step to cache stuff we will copy everything from cur_local_state to prev_local_state prev_local_state.clone_from_slice(&cur_local_state); - while !done && self.ctx.ss() < steps && tasks.len() > 0 { - (done, shard_state, global_state, cur_local_state) = self.run_task_list( + while !_done && self.ctx.ss() < steps && tasks.len() > 0 { + (_done, shard_state, global_state, cur_local_state) = self.run_task_list( &tasks, &pool, + morcel_size, shard_state, global_state, cur_local_state, &prev_local_state, - max_shard_len, ); // copy and reset the state from the step that just ended @@ -292,14 +281,12 @@ impl TaskRunner { } else { prev_local_state }; - //TODO change to log - //println!("Done running iterations: {ss}"); f( GlobalState::new(global_state, ss), EvalShardState::new(ss, self.ctx.graph(), shard_state), EvalLocalState::new(ss, self.ctx.graph(), vec![]), - &last_local_state, + last_local_state, ) } } diff --git a/raphtory/src/db/task/task_state.rs b/raphtory/src/db/task/task_state.rs index aaaccc6769..106f8e2e71 100644 --- a/raphtory/src/db/task/task_state.rs +++ b/raphtory/src/db/task/task_state.rs @@ -1,10 +1,6 @@ +use crate::core::state::{compute_state::ComputeState, shuffle_state::ShuffleComputeState}; use 
std::{borrow::Cow, sync::Arc}; -use crate::core::{ - state::{compute_state::ComputeState, shuffle_state::ShuffleComputeState}, - vertex_ref::LocalVertexRef, -}; - // this only contains the global state and it is synchronized after each task run #[derive(Clone, Debug)] pub struct Global(Arc>); @@ -19,25 +15,24 @@ pub(crate) struct Local(Arc>>); #[derive(Debug)] pub(crate) struct Local2<'a, S> { - pub(crate) shard_len: usize, - pub(crate) state: &'a Vec>, + pub(crate) state: &'a Vec, } impl<'a, S: 'static> Local2<'a, S> { - pub(crate) fn new( - max_shard_len: usize, - prev_local_state: &'a Vec>, - ) -> Self { + pub(crate) fn new(prev_local_state: &'a Vec) -> Self { Self { - shard_len: max_shard_len, state: prev_local_state, } } } impl Shard { - pub(crate) fn new(graph_shards: usize) -> Self { - Self(Arc::new(ShuffleComputeState::new(graph_shards))) + pub(crate) fn new(total_len: usize, num_morcels: usize, morcel_size: usize) -> Self { + Self(Arc::new(ShuffleComputeState::new( + total_len, + num_morcels, + morcel_size, + ))) } pub(crate) fn as_cow(&self) -> Cow<'_, ShuffleComputeState> { @@ -56,6 +51,10 @@ impl Shard { &self.0 } + pub fn consume(self) -> Result, Arc>> { + Arc::try_unwrap(self.0) + } + pub fn reset(&mut self, ss: usize, resetable_states: &[u32]) { Arc::get_mut(&mut self.0).map(|s| { s.copy_over_next_ss(ss); @@ -72,7 +71,7 @@ impl From>> for Shard { impl Global { pub(crate) fn new() -> Self { - Self(Arc::new(ShuffleComputeState::new(0))) + Self(Arc::new(ShuffleComputeState::global())) } pub(crate) fn as_cow(&self) -> Cow<'_, ShuffleComputeState> { diff --git a/raphtory/src/db/task/eval_vertex.rs b/raphtory/src/db/task/vertex/eval_vertex.rs similarity index 67% rename from raphtory/src/db/task/eval_vertex.rs rename to raphtory/src/db/task/vertex/eval_vertex.rs index 5c30155e5b..0775be6e35 100644 --- a/raphtory/src/db/task/eval_vertex.rs +++ b/raphtory/src/db/task/vertex/eval_vertex.rs @@ -1,31 +1,43 @@ -use crate::core::time::IntoTime; -use 
crate::core::{Direction, Prop}; -use crate::db::edge::EdgeView; -use crate::db::path::{Operations, PathFromVertex}; -use crate::db::task::eval_edge::EvalEdgeView; -use crate::db::view_api::{BoxedIter, TimeOps, VertexListOps, VertexViewOps}; use crate::{ core::{ - agg::Accumulator, - state::{accumulator_id::AccId, compute_state::ComputeState, StateType}, - vertex_ref::LocalVertexRef, + entities::VID, + state::{accumulator_id::AccId, agg::Accumulator, compute_state::ComputeState, StateType}, + utils::time::IntoTime, + Direction, + }, + db::{ + api::{ + properties::Properties, + view::{ + BoxedIter, EdgeListOps, EdgeViewOps, GraphViewOps, TimeOps, VertexListOps, + VertexViewOps, + }, + }, + graph::{ + edge::EdgeView, + path::{Operations, PathFromVertex}, + vertex::VertexView, + }, + task::{ + edge::eval_edge::EvalEdgeView, + task_state::Local2, + vertex::{ + eval_vertex_state::EVState, + window_eval_vertex::{edge_filter, WindowEvalPathFromVertex, WindowEvalVertex}, + }, + }, }, - db::view_api::GraphViewOps, }; -use std::collections::HashMap; -use std::marker::PhantomData; +use itertools::Itertools; use std::{ cell::{Ref, RefCell}, + marker::PhantomData, rc::Rc, }; -use super::eval_vertex_state::EVState; -use super::task_state::Local2; -use super::window_eval_vertex::{WindowEvalPathFromVertex, WindowEvalVertex}; - pub struct EvalVertexView<'a, G: GraphViewOps, CS: ComputeState, S: 'static> { ss: usize, - vertex: LocalVertexRef, + vertex: VID, pub(crate) graph: &'a G, local_state: Option<&'a mut S>, local_state_prev: &'a Local2<'a, S>, @@ -34,13 +46,8 @@ pub struct EvalVertexView<'a, G: GraphViewOps, CS: ComputeState, S: 'static> { impl<'a, G: GraphViewOps, CS: ComputeState, S> EvalVertexView<'a, G, CS, S> { pub fn prev(&self) -> &S { - let LocalVertexRef { shard_id, pid } = self.vertex; - let shard_size = self.local_state_prev.shard_len; - let i = shard_size * shard_id + pid; - self.local_state_prev.state[i] - .as_ref() - .map(|(_, val)| val) - .unwrap() + let i: usize 
= self.vertex.into(); + &self.local_state_prev.state[i] } pub fn get_mut(&mut self) -> &mut S { @@ -59,7 +66,7 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S> EvalVertexView<'a, G, CS, S> { pub(crate) fn new_local( ss: usize, - v_ref: LocalVertexRef, + v_ref: VID, g: &'a G, local_state: Option<&'a mut S>, local_state_prev: &'a Local2<'a, S>, @@ -76,7 +83,7 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S> EvalVertexView<'a, G, CS, S> { } fn pid(&self) -> usize { - self.vertex.pid + self.vertex.into() } pub fn update>( @@ -87,7 +94,7 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S> EvalVertexView<'a, G, CS, S> { self.vertex_state .borrow_mut() .shard_mut() - .accumulate_into_pid(self.ss, self.id(), self.pid(), a, id); + .accumulate_into(self.ss, self.pid(), a, id); } pub fn global_update>( @@ -145,7 +152,7 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S> EvalVertexView<'a, G, CS, S> { self.vertex_state .borrow() .shard() - .read_with_pid(self.ss, self.id(), self.pid(), agg_r) + .read_with_pid(self.ss, self.pid(), agg_r) .unwrap_or(ACC::finish(&ACC::zero())) } @@ -159,13 +166,7 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S> EvalVertexView<'a, G, CS, S> { A: StateType, OUT: std::fmt::Debug, { - Entry::new( - self.vertex_state.borrow(), - *agg_r, - &self.vertex, - self.id(), - self.ss, - ) + Entry::new(self.vertex_state.borrow(), *agg_r, &self.vertex, self.ss) } /// Read the prev value of the vertex state using the given accumulator. 
@@ -181,7 +182,7 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S> EvalVertexView<'a, G, CS, S> { self.vertex_state .borrow() .shard() - .read_with_pid(self.ss + 1, self.id(), self.pid(), agg_r) + .read_with_pid(self.ss + 1, self.pid(), agg_r) .unwrap_or(ACC::finish(&ACC::zero())) } @@ -240,10 +241,10 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> EvalPathFromVertex<'a, G Box::new(self.path.iter_refs().map(|v| { EvalVertexView::new_local( self.ss, - self.g.localise_vertex_unchecked(v), + v, self.g, None, - self.local_state_prev.clone(), + self.local_state_prev, self.vertex_state.clone(), ) })) @@ -263,14 +264,7 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> IntoIterator let ss = self.ss; let g: &G = self.g; Box::new(path.iter_refs().map(move |v| { - EvalVertexView::new_local( - ss, - self.g.localise_vertex_unchecked(v), - g, - None, - self.local_state_prev.clone(), - vertex_state.clone(), - ) + EvalVertexView::new_local(ss, v, g, None, self.local_state_prev, vertex_state.clone()) })) } } @@ -289,14 +283,18 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> TimeOps } fn window(&self, t_start: T, t_end: T) -> Self::WindowedViewType { + let t_start = t_start.into_time(); + let t_end = t_end.into_time(); + let edge_filter = edge_filter(self.g, t_start, t_end).map(Rc::new); WindowEvalPathFromVertex::new( self.path.clone(), self.ss, self.g, self.vertex_state.clone(), - self.local_state_prev.clone(), - t_start.into_time(), - t_end.into_time(), + self.local_state_prev, + t_start, + t_end, + edge_filter, ) } } @@ -325,40 +323,12 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> VertexViewOps self.path.latest_time() } - fn property(&self, name: String, include_static: bool) -> Self::ValueType> { - self.path.property(name, include_static) - } - fn history(&self) -> Self::ValueType> { self.path.history() } - fn property_history(&self, name: String) -> Self::ValueType> { - self.path.property_history(name) - } - - fn properties(&self, 
include_static: bool) -> Self::ValueType> { - self.path.properties(include_static) - } - - fn property_histories(&self) -> Self::ValueType>> { - self.path.property_histories() - } - - fn property_names(&self, include_static: bool) -> Self::ValueType> { - self.path.property_names(include_static) - } - - fn has_property(&self, name: String, include_static: bool) -> Self::ValueType { - self.path.has_property(name, include_static) - } - - fn has_static_property(&self, name: String) -> Self::ValueType { - self.path.has_static_property(name) - } - - fn static_property(&self, name: String) -> Self::ValueType> { - self.path.static_property(name) + fn properties(&self) -> Self::ValueType>> { + self.path.properties() } fn degree(&self) -> Self::ValueType { @@ -410,15 +380,19 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S> TimeOps for EvalVertexView<'a, G, } fn window(&self, t_start: T, t_end: T) -> Self::WindowedViewType { + let t_start = t_start.into_time(); + let t_end = t_end.into_time(); + let edge_filter = edge_filter(self.graph, t_start, t_end).map(Rc::new); WindowEvalVertex::new( self.ss, self.vertex, self.graph, None, - self.local_state_prev.clone(), + self.local_state_prev, self.vertex_state.clone(), - t_start.into_time(), - t_end.into_time(), + t_start, + t_end, + edge_filter, ) } } @@ -447,89 +421,44 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> VertexViewOps self.graph.vertex_latest_time(self.vertex) } - fn property(&self, name: String, include_static: bool) -> Self::ValueType> { - let props = self.property_history(name.clone()); - match props.last() { - None => { - if include_static { - self.graph.static_vertex_prop(self.vertex, name) - } else { - None - } - } - Some((_, prop)) => Some(prop.clone()), - } - } - fn history(&self) -> Self::ValueType> { - self.graph.vertex_timestamps(self.vertex) - } - - fn property_history(&self, name: String) -> Self::ValueType> { - self.graph.temporal_vertex_prop_vec(self.vertex, name) - } - - fn properties(&self, 
include_static: bool) -> Self::ValueType> { - let mut props: HashMap = self - .property_histories() - .iter() - .map(|(key, values)| (key.clone(), values.last().unwrap().1.clone())) - .collect(); - - if include_static { - for prop_name in self.graph.static_vertex_prop_names(self.vertex) { - if let Some(prop) = self - .graph - .static_vertex_prop(self.vertex, prop_name.clone()) - { - props.insert(prop_name, prop); - } - } - } - props + self.edges() + .map(|e| e.explode().earliest_time().flatten()) + .kmerge() + .dedup() + .collect() } - fn property_histories(&self) -> Self::ValueType>> { - self.graph.temporal_vertex_props(self.vertex) - } - - fn property_names(&self, include_static: bool) -> Self::ValueType> { - let mut names: Vec = self.graph.temporal_vertex_prop_names(self.vertex); - if include_static { - names.extend(self.graph.static_vertex_prop_names(self.vertex)) - } - names - } - - fn has_property(&self, name: String, include_static: bool) -> Self::ValueType { - (!self.property_history(name.clone()).is_empty()) - || (include_static - && self - .graph - .static_vertex_prop_names(self.vertex) - .contains(&name)) - } - - fn has_static_property(&self, name: String) -> Self::ValueType { - self.graph - .static_vertex_prop_names(self.vertex) - .contains(&name) - } - - fn static_property(&self, name: String) -> Self::ValueType> { - self.graph.static_vertex_prop(self.vertex, name) + fn properties(&self) -> Self::ValueType>> { + //FIXME: need to implement this properly without cloning the graph... 
+ Properties::new(VertexView::new_internal(self.graph.clone(), self.vertex)) } fn degree(&self) -> Self::ValueType { - self.graph.degree(self.vertex, Direction::BOTH, None) + self.graph.degree( + self.vertex, + Direction::BOTH, + &self.graph.layer_ids(), + self.graph.edge_filter(), + ) } fn in_degree(&self) -> Self::ValueType { - self.graph.degree(self.vertex, Direction::IN, None) + self.graph.degree( + self.vertex, + Direction::IN, + &self.graph.layer_ids(), + self.graph.edge_filter(), + ) } fn out_degree(&self) -> Self::ValueType { - self.graph.degree(self.vertex, Direction::OUT, None) + self.graph.degree( + self.vertex, + Direction::OUT, + &self.graph.layer_ids(), + self.graph.edge_filter(), + ) } fn edges(&self) -> Self::EList { @@ -539,7 +468,12 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> VertexViewOps let graph = self.graph; Box::new( self.graph - .vertex_edges(self.vertex, Direction::BOTH, None) + .vertex_edges( + self.vertex, + Direction::BOTH, + self.graph.layer_ids(), + self.graph.edge_filter(), + ) .map(move |e| EvalEdgeView::new_(ss, e, graph, local, vertex_state.clone())), ) } @@ -551,7 +485,12 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> VertexViewOps let graph = self.graph; Box::new( self.graph - .vertex_edges(self.vertex, Direction::IN, None) + .vertex_edges( + self.vertex, + Direction::IN, + self.graph.layer_ids(), + self.graph.edge_filter(), + ) .map(move |e| EvalEdgeView::new_(ss, e, graph, local, vertex_state.clone())), ) } @@ -563,7 +502,12 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> VertexViewOps let graph = self.graph; Box::new( self.graph - .vertex_edges(self.vertex, Direction::OUT, None) + .vertex_edges( + self.vertex, + Direction::OUT, + self.graph.layer_ids(), + self.graph.edge_filter(), + ) .map(move |e| EvalEdgeView::new_(ss, e, graph, local, vertex_state.clone())), ) } @@ -594,7 +538,9 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> VertexViewOps let neighbours = 
PathFromVertex::new( self.graph.clone(), self.vertex, - Operations::Neighbours { dir: Direction::OUT }, + Operations::Neighbours { + dir: Direction::OUT, + }, ); EvalPathFromVertex::new_from_path_and_vertex(neighbours, self) @@ -609,8 +555,7 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> VertexViewOps pub struct Entry<'a, 'b, A: StateType, IN, OUT, ACC: Accumulator, CS: ComputeState> { state: Ref<'a, EVState<'b, CS>>, acc_id: AccId, - v_ref: &'a LocalVertexRef, - gid: u64, + v_ref: &'a VID, ss: usize, } @@ -629,15 +574,13 @@ impl<'a, 'b, A: StateType, IN, OUT, ACC: Accumulator, CS: ComputeSta pub(crate) fn new( state: Ref<'a, EVState<'b, CS>>, acc_id: AccId, - v_ref: &'a LocalVertexRef, - gid: u64, + v_ref: &'a VID, ss: usize, ) -> Entry<'a, 'b, A, IN, OUT, ACC, CS> { Entry { state, acc_id, v_ref, - gid, ss, } } @@ -646,7 +589,7 @@ impl<'a, 'b, A: StateType, IN, OUT, ACC: Accumulator, CS: ComputeSta pub fn read_ref(&self) -> Option<&A> { self.state .shard() - .read_ref_with_pid(self.ss, self.gid, self.v_ref.pid, &self.acc_id) + .read_ref(self.ss, (*self.v_ref).into(), &self.acc_id) } } @@ -675,6 +618,10 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> VertexListOps Box::new(self.map(move |v| v.window(t_start, t_end))) } + fn at(self, end: i64) -> Self::IterType<::WindowedViewType> { + Box::new(self.map(move |v| v.at(end))) + } + fn id(self) -> Self::IterType { Box::new(self.map(|v| v.id())) } @@ -683,42 +630,14 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> VertexListOps Box::new(self.map(|v| v.name())) } - fn property(self, name: String, include_static: bool) -> Self::IterType> { - Box::new(self.map(move |v| v.property(name.clone(), include_static))) - } - - fn property_history(self, name: String) -> Self::IterType> { - Box::new(self.map(move |v| v.property_history(name.clone()))) - } - - fn properties(self, include_static: bool) -> Self::IterType> { - Box::new(self.map(move |v| v.properties(include_static))) + fn properties(self) 
-> Self::IterType>> { + Box::new(self.map(move |v| v.properties())) } fn history(self) -> Self::IterType> { Box::new(self.map(|v| v.history())) } - fn property_histories(self) -> Self::IterType>> { - Box::new(self.map(|v| v.property_histories())) - } - - fn property_names(self, include_static: bool) -> Self::IterType> { - Box::new(self.map(move |v| v.property_names(include_static))) - } - - fn has_property(self, name: String, include_static: bool) -> Self::IterType { - Box::new(self.map(move |v| v.has_property(name.clone(), include_static))) - } - - fn has_static_property(self, name: String) -> Self::IterType { - Box::new(self.map(move |v| v.has_static_property(name.clone()))) - } - - fn static_property(self, name: String) -> Self::IterType> { - Box::new(self.map(move |v| v.static_property(name.clone()))) - } - fn degree(self) -> Self::IterType { Box::new(self.map(|v| v.degree())) } diff --git a/raphtory/src/db/task/eval_vertex_state.rs b/raphtory/src/db/task/vertex/eval_vertex_state.rs similarity index 99% rename from raphtory/src/db/task/eval_vertex_state.rs rename to raphtory/src/db/task/vertex/eval_vertex_state.rs index ae8f0669bb..c0d354c162 100644 --- a/raphtory/src/db/task/eval_vertex_state.rs +++ b/raphtory/src/db/task/vertex/eval_vertex_state.rs @@ -1,6 +1,5 @@ -use std::{borrow::Cow, cell::RefCell, rc::Rc}; - use crate::core::state::{compute_state::ComputeState, shuffle_state::ShuffleComputeState}; +use std::{borrow::Cow, cell::RefCell, rc::Rc}; #[derive(Debug)] pub(crate) struct EVState<'a, CS: ComputeState> { diff --git a/raphtory/src/db/task/vertex/mod.rs b/raphtory/src/db/task/vertex/mod.rs new file mode 100644 index 0000000000..ca5802a826 --- /dev/null +++ b/raphtory/src/db/task/vertex/mod.rs @@ -0,0 +1,3 @@ +pub mod eval_vertex; +pub mod eval_vertex_state; +pub mod window_eval_vertex; diff --git a/raphtory/src/db/task/window_eval_vertex.rs b/raphtory/src/db/task/vertex/window_eval_vertex.rs similarity index 56% rename from 
raphtory/src/db/task/window_eval_vertex.rs rename to raphtory/src/db/task/vertex/window_eval_vertex.rs index 031e6e519a..64921aa62b 100644 --- a/raphtory/src/db/task/window_eval_vertex.rs +++ b/raphtory/src/db/task/vertex/window_eval_vertex.rs @@ -1,33 +1,54 @@ -use std::{cell::RefCell, collections::HashMap, marker::PhantomData, rc::Rc}; - use crate::{ core::{ - state::{compute_state::ComputeState, StateType, accumulator_id::AccId}, time::IntoTime, vertex_ref::LocalVertexRef, Direction, - Prop, agg::Accumulator, + entities::VID, + state::{accumulator_id::AccId, agg::Accumulator, compute_state::ComputeState, StateType}, + utils::time::IntoTime, + Direction, }, db::{ - path::{Operations, PathFromVertex}, - view_api::{GraphViewOps, TimeOps, VertexViewOps, VertexListOps}, + api::{ + properties::Properties, + view::{ + internal::{EdgeFilter, EdgeFilterOps}, + GraphViewOps, TimeOps, VertexListOps, VertexViewOps, + }, + }, + graph::{ + path::{Operations, PathFromVertex}, + vertex::VertexView, + views::window_graph::WindowedGraph, + }, + task::{ + edge::window_eval_edge::WindowEvalEdgeView, task_state::Local2, + vertex::eval_vertex_state::EVState, + }, }, }; +use std::{cell::RefCell, marker::PhantomData, rc::Rc}; -use super::{eval_vertex_state::EVState, task_state::Local2, window_eval_edge::WindowEvalEdgeView}; +pub(crate) fn edge_filter( + graph: &G, + t_start: i64, + t_end: i64, +) -> Option { + graph.window(t_start, t_end).edge_filter().cloned() +} pub struct WindowEvalVertex<'a, G: GraphViewOps, CS: ComputeState, S: 'static> { ss: usize, - vertex: LocalVertexRef, + vertex: VID, pub(crate) graph: &'a G, - local_state: Option<&'a mut S>, + _local_state: Option<&'a mut S>, local_state_prev: &'a Local2<'a, S>, vertex_state: Rc>>, t_start: i64, t_end: i64, + edge_filter: Option>, } impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> WindowEvalVertex<'a, G, CS, S> { - fn pid(&self) -> usize { - self.vertex.pid + self.vertex.into() } pub fn update>( @@ -38,28 +59,30 @@ 
impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> WindowEvalVertex<'a, G, self.vertex_state .borrow_mut() .shard_mut() - .accumulate_into_pid(self.ss, self.id(), self.pid(), a, id); + .accumulate_into(self.ss, self.pid(), a, id); } pub(crate) fn new( ss: usize, - vertex: LocalVertexRef, + vertex: VID, graph: &'a G, local_state: Option<&'a mut S>, local_state_prev: &'a Local2<'a, S>, vertex_state: Rc>>, t_start: i64, t_end: i64, + edge_filter: Option>, ) -> Self { WindowEvalVertex { ss, vertex, graph, - local_state, + _local_state: local_state, local_state_prev, vertex_state, t_start, t_end, + edge_filter, } } } @@ -76,15 +99,19 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> TimeOps for WindowEvalVe } fn window(&self, t_start: T, t_end: T) -> Self::WindowedViewType { + let t_start = t_start.into_time().max(self.t_start); + let t_end = t_end.into_time().min(self.t_end); + let edge_filter = edge_filter(self.graph, t_start, t_end).map(Rc::new); WindowEvalVertex { ss: self.ss, - vertex: self.vertex.clone(), + vertex: self.vertex, graph: self.graph, - local_state: None, + _local_state: None, local_state_prev: self.local_state_prev, vertex_state: self.vertex_state.clone(), - t_start: t_start.into_time().max(self.t_start), - t_end: t_end.into_time().min(self.t_end), + t_start, + t_end, + edge_filter, } } } @@ -92,7 +119,7 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> TimeOps for WindowEvalVe impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> VertexViewOps for WindowEvalVertex<'a, G, CS, S> { - type Graph = G; + type Graph = WindowedGraph; type ValueType = T; type PathType<'b> = WindowEvalPathFromVertex<'a, G, CS, S> where Self: 'b; type EList = Box> + 'a>; @@ -115,107 +142,47 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> VertexViewOps .vertex_latest_time_window(self.vertex, self.t_start, self.t_end) } - fn property( - &self, - name: String, - include_static: bool, - ) -> Self::ValueType> { - let props = 
self.property_history(name.clone()); - match props.last() { - None => { - if include_static { - self.graph.static_vertex_prop(self.vertex, name) - } else { - None - } - } - Some((_, prop)) => Some(prop.clone()), - } - } - fn history(&self) -> Self::ValueType> { self.graph - .vertex_timestamps_window(self.vertex, self.t_start, self.t_end) - } - - fn property_history(&self, name: String) -> Self::ValueType> { - self.graph - .temporal_vertex_prop_vec_window(self.vertex, name, self.t_start, self.t_end) - } - - fn properties( - &self, - include_static: bool, - ) -> Self::ValueType> { - let mut props: HashMap = self - .property_histories() - .iter() - .map(|(key, values)| (key.clone(), values.last().unwrap().1.clone())) - .collect(); - - if include_static { - for prop_name in self.graph.static_vertex_prop_names(self.vertex) { - if let Some(prop) = self - .graph - .static_vertex_prop(self.vertex, prop_name.clone()) - { - props.insert(prop_name, prop); - } - } - } - props - } - - fn property_histories( - &self, - ) -> Self::ValueType>> { - self.graph - .temporal_vertex_props_window(self.vertex, self.t_start, self.t_end) - } - - fn property_names(&self, include_static: bool) -> Self::ValueType> { - let mut names: Vec = self.graph.temporal_vertex_prop_names(self.vertex); - if include_static { - names.extend(self.graph.static_vertex_prop_names(self.vertex)) - } - names - } - - fn has_property(&self, name: String, include_static: bool) -> Self::ValueType { - (!self.property_history(name.clone()).is_empty()) - || (include_static - && self - .graph - .static_vertex_prop_names(self.vertex) - .contains(&name)) - } - - fn has_static_property(&self, name: String) -> Self::ValueType { - self.graph - .static_vertex_prop_names(self.vertex) - .contains(&name) + .vertex_history_window(self.vertex, self.t_start..self.t_end) } - fn static_property(&self, name: String) -> Self::ValueType> { - self.graph.static_vertex_prop(self.vertex, name) + fn properties(&self) -> Self::ValueType>>> { + 
//FIXME: Need to implement this properly without cloning the graph + Properties::new(VertexView::new_internal( + WindowedGraph::new(self.graph.clone(), self.t_start, self.t_end), + self.vertex, + )) } fn degree(&self) -> Self::ValueType { let dir = Direction::BOTH; - self.graph - .degree_window(self.vertex, self.t_start, self.t_end, dir, None) + self.graph.degree( + self.vertex, + dir, + &self.graph.layer_ids(), + self.edge_filter.as_deref(), + ) } fn in_degree(&self) -> Self::ValueType { let dir = Direction::IN; - self.graph - .degree_window(self.vertex, self.t_start, self.t_end, dir, None) + self.graph.degree( + self.vertex, + dir, + &self.graph.layer_ids(), + self.edge_filter.as_deref(), + ) } fn out_degree(&self) -> Self::ValueType { let dir = Direction::OUT; - self.graph - .degree_window(self.vertex, self.t_start, self.t_end, dir, None) + self.graph.degree( + self.vertex, + dir, + &self.graph.layer_ids(), + self.edge_filter.as_deref(), + ) } fn edges(&self) -> Self::EList { @@ -225,10 +192,27 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> VertexViewOps let graph = self.graph; let t_start = self.t_start; let t_end = self.t_end; + let edge_filter = self.edge_filter.clone(); Box::new( self.graph - .vertex_edges_window(self.vertex, self.t_start, self.t_end, Direction::BOTH, None) - .map(move |e| WindowEvalEdgeView::new(ss, e, graph, local, vertex_state.clone(), t_start, t_end)), + .vertex_edges( + self.vertex, + Direction::BOTH, + self.graph.layer_ids(), + self.edge_filter.as_deref(), + ) + .map(move |e| { + WindowEvalEdgeView::new( + ss, + e, + graph, + local, + vertex_state.clone(), + t_start, + t_end, + edge_filter.clone(), + ) + }), ) } @@ -239,10 +223,27 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> VertexViewOps let graph = self.graph; let t_start = self.t_start; let t_end = self.t_end; + let edge_filter = self.edge_filter.clone(); Box::new( self.graph - .vertex_edges_window(self.vertex, self.t_start, self.t_end, Direction::IN, None) 
- .map(move |e| WindowEvalEdgeView::new(ss, e, graph, local, vertex_state.clone(), t_start, t_end)), + .vertex_edges( + self.vertex, + Direction::IN, + self.graph.layer_ids(), + self.edge_filter.as_deref(), + ) + .map(move |e| { + WindowEvalEdgeView::new( + ss, + e, + graph, + local, + vertex_state.clone(), + t_start, + t_end, + edge_filter.clone(), + ) + }), ) } @@ -253,10 +254,27 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> VertexViewOps let graph = self.graph; let t_start = self.t_start; let t_end = self.t_end; + let edge_filter = self.edge_filter.clone(); Box::new( self.graph - .vertex_edges_window(self.vertex, self.t_start, self.t_end, Direction::OUT, None) - .map(move |e| WindowEvalEdgeView::new(ss, e, graph, local, vertex_state.clone(), t_start, t_end)), + .vertex_edges( + self.vertex, + Direction::OUT, + self.graph.layer_ids(), + self.edge_filter.as_deref(), + ) + .map(move |e| { + WindowEvalEdgeView::new( + ss, + e, + graph, + local, + vertex_state.clone(), + t_start, + t_end, + edge_filter.clone(), + ) + }), ) } @@ -312,6 +330,7 @@ pub struct WindowEvalPathFromVertex<'a, G: GraphViewOps, CS: ComputeState, S> { _s: PhantomData, t_start: i64, t_end: i64, + edge_filter: Option>, } impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> WindowEvalPathFromVertex<'a, G, CS, S> { fn update_path(&self, path: PathFromVertex) -> Self { @@ -324,6 +343,7 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> WindowEvalPathFromVertex t_start: self.t_start, t_end: self.t_end, _s: PhantomData, + edge_filter: self.edge_filter.clone(), } } @@ -340,6 +360,7 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> WindowEvalPathFromVertex _s: PhantomData, t_start: vertex.t_start, t_end: vertex.t_end, + edge_filter: vertex.edge_filter.clone(), } } @@ -351,6 +372,7 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> WindowEvalPathFromVertex local_state_prev: &'a Local2<'a, S>, t_start: i64, t_end: i64, + edge_filter: Option>, ) -> Self { 
WindowEvalPathFromVertex { path, @@ -361,6 +383,7 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> WindowEvalPathFromVertex _s: PhantomData, t_start, t_end, + edge_filter, } } @@ -374,16 +397,26 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> WindowEvalPathFromVertex let local_state_prev = self.local_state_prev; let t_start = self.t_start; let t_end = self.t_end; - + let edge_filter = self.edge_filter.clone(); + let edge_filter_2 = edge_filter.clone(); + let layer_ids = g.layer_ids(); let iter = self .path .iter_refs() .flat_map(move |v_ref| { - let local_ref = g.localise_vertex_unchecked(v_ref); - g.vertex_edges_window(local_ref, t_start, t_end, dir, None) + g.vertex_edges(v_ref, dir, layer_ids.clone(), edge_filter_2.as_deref()) }) .map(move |e_ref| { - WindowEvalEdgeView::new(ss, e_ref, g, local_state_prev, vertex_state.clone(), t_start, t_end) + WindowEvalEdgeView::new( + ss, + e_ref, + g, + local_state_prev, + vertex_state.clone(), + t_start, + t_end, + edge_filter.clone(), + ) }); Box::new(iter) @@ -391,13 +424,12 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> WindowEvalPathFromVertex fn degree(&self, dir: Direction) -> Box + 'a> { let g = self.g; - let t_start = self.t_start; - let t_end = self.t_end; - - let iter = self.path.iter_refs().map(move |v_ref| { - let local_ref = g.localise_vertex_unchecked(v_ref); - g.degree_window(local_ref, t_start, t_end, dir, None) - }); + let edge_filter = self.edge_filter.clone(); + let layer_ids = g.layer_ids(); + let iter = self + .path + .iter_refs() + .map(move |v_ref| g.degree(v_ref, dir, &layer_ids, edge_filter.as_deref())); Box::new(iter) } @@ -417,14 +449,18 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> TimeOps } fn window(&self, t_start: T, t_end: T) -> Self::WindowedViewType { + let t_start = t_start.into_time().max(self.t_start); + let t_end = t_end.into_time().min(self.t_end); + let filter = edge_filter(self.g, t_start, t_end).map(Rc::new); 
WindowEvalPathFromVertex::new( self.path.clone(), self.ss, self.g, self.vertex_state.clone(), self.local_state_prev, - t_start.into_time().max(self.t_start), - t_end.into_time().min(self.t_end), + t_start, + t_end, + filter, ) } } @@ -432,7 +468,7 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> TimeOps impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> VertexViewOps for WindowEvalPathFromVertex<'a, G, CS, S> { - type Graph = G; + type Graph = WindowedGraph; type ValueType = Box + 'a>; @@ -456,105 +492,21 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> VertexViewOps self.path.latest_time() } - fn property( - &self, - name: String, - include_static: bool, - ) -> Self::ValueType> { - let g = self.g; - let t_start = self.t_start; - let t_end = self.t_end; - - let iter = self.path.iter_refs().map(move |v_ref| { - let local_ref = g.localise_vertex_unchecked(v_ref); - let props = g.temporal_vertex_prop_vec_window(local_ref, name.clone(), t_start, t_end); - match props.last() { - None => { - if include_static { - g.static_vertex_prop(local_ref, name.clone()) - } else { - None - } - } - Some((_, prop)) => Some(prop.clone()), - } - }); - Box::new(iter) - } - fn history(&self) -> Self::ValueType> { let g = self.g; let t_start = self.t_start; let t_end = self.t_end; - let iter = self.path.iter_refs().map(move |v_ref| { - let local_ref = g.localise_vertex_unchecked(v_ref); - g.vertex_timestamps_window(local_ref, t_start, t_end) - }); - - Box::new(iter) - } - - fn property_history(&self, name: String) -> Self::ValueType> { - let g = self.g; - let t_start = self.t_start; - let t_end = self.t_end; - - let iter = self.path.iter_refs().map(move |v_ref| { - let local_ref = g.localise_vertex_unchecked(v_ref); - g.temporal_vertex_prop_vec_window(local_ref, name.clone(), t_start, t_end) - }); - - Box::new(iter) - } - - fn properties( - &self, - include_static: bool, - ) -> Self::ValueType> { - self.path.properties(include_static) - } - - fn property_histories( 
- &self, - ) -> Self::ValueType>> { - let g = self.g; - let t_start = self.t_start; - let t_end = self.t_end; - - let iter = self.path.iter_refs().map(move |v_ref| { - let local_ref = g.localise_vertex_unchecked(v_ref); - g.temporal_vertex_props_window(local_ref, t_start, t_end) - }); - - Box::new(iter) - } - - fn property_names(&self, include_static: bool) -> Self::ValueType> { - self.path.property_names(include_static) - } - - fn has_property(&self, name: String, include_static: bool) -> Self::ValueType { - let g = self.g; - let t_start = self.t_start; - let t_end = self.t_end; - let iter = self.path.iter_refs().map(move |v_ref| { - let local_ref = g.localise_vertex_unchecked(v_ref); - let props = g.temporal_vertex_prop_vec_window(local_ref, name.clone(), t_start, t_end); - - !props.is_empty() - || (include_static && g.static_vertex_prop_names(local_ref).contains(&name)) - }); + let iter = self + .path + .iter_refs() + .map(move |v_ref| g.vertex_history_window(v_ref, t_start..t_end)); Box::new(iter) } - fn has_static_property(&self, name: String) -> Self::ValueType { - self.path.has_static_property(name) - } - - fn static_property(&self, name: String) -> Self::ValueType> { - self.path.static_property(name) + fn properties(&self) -> Self::ValueType>> { + self.path.window(self.t_start, self.t_end).properties() } fn degree(&self) -> Self::ValueType { @@ -603,11 +555,10 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> VertexViewOps } } - impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> VertexListOps for Box> + 'a> { - type Graph = G; + type Graph = WindowedGraph; type Vertex = WindowEvalVertex<'a, G, CS, S>; type IterType = Box + 'a>; type EList = Box> + 'a>; @@ -629,6 +580,10 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> VertexListOps Box::new(self.map(move |v| v.window(t_start, t_end))) } + fn at(self, end: i64) -> Self::IterType<::WindowedViewType> { + Box::new(self.map(move |v| v.at(end))) + } + fn id(self) -> Self::IterType { 
Box::new(self.map(|v| v.id())) } @@ -637,42 +592,14 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> VertexListOps Box::new(self.map(|v| v.name())) } - fn property(self, name: String, include_static: bool) -> Self::IterType> { - Box::new(self.map(move |v| v.property(name.clone(), include_static))) - } - - fn property_history(self, name: String) -> Self::IterType> { - Box::new(self.map(move |v| v.property_history(name.clone()))) - } - - fn properties(self, include_static: bool) -> Self::IterType> { - Box::new(self.map(move |v| v.properties(include_static))) + fn properties(self) -> Self::IterType>> { + Box::new(self.map(move |v| v.properties())) } fn history(self) -> Self::IterType> { Box::new(self.map(|v| v.history())) } - fn property_histories(self) -> Self::IterType>> { - Box::new(self.map(|v| v.property_histories())) - } - - fn property_names(self, include_static: bool) -> Self::IterType> { - Box::new(self.map(move |v| v.property_names(include_static))) - } - - fn has_property(self, name: String, include_static: bool) -> Self::IterType { - Box::new(self.map(move |v| v.has_property(name.clone(), include_static))) - } - - fn has_static_property(self, name: String) -> Self::IterType { - Box::new(self.map(move |v| v.has_static_property(name.clone()))) - } - - fn static_property(self, name: String) -> Self::IterType> { - Box::new(self.map(move |v| v.static_property(name.clone()))) - } - fn degree(self) -> Self::IterType { Box::new(self.map(|v| v.degree())) } @@ -694,7 +621,7 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> VertexListOps } fn out_edges(self) -> Self::EList { - Box::new(self.flat_map(|v| v.out_edges()).map(|ev| WindowEvalEdgeView::from(ev))) + Box::new(self.flat_map(|v| v.out_edges())) } fn neighbours(self) -> Self { @@ -710,7 +637,6 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> VertexListOps } } - impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> IntoIterator for WindowEvalPathFromVertex<'a, G, CS, S> { @@ 
-728,13 +654,14 @@ impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> IntoIterator Box::new(path.iter_refs().map(move |v| { WindowEvalVertex::new( ss, - self.g.localise_vertex_unchecked(v), + v, g, None, - self.local_state_prev.clone(), + self.local_state_prev, vertex_state.clone(), t_start, t_end, + self.edge_filter.clone(), ) })) } diff --git a/raphtory/src/db/task/window_eval_edge.rs b/raphtory/src/db/task/window_eval_edge.rs deleted file mode 100644 index 1387812fe7..0000000000 --- a/raphtory/src/db/task/window_eval_edge.rs +++ /dev/null @@ -1,264 +0,0 @@ -use std::{cell::RefCell, iter, marker::PhantomData, rc::Rc, collections::HashMap}; - -use crate::{ - core::{edge_ref::EdgeRef, state::compute_state::ComputeState, Prop}, - db::view_api::{edge::EdgeViewInternalOps, EdgeListOps, EdgeViewOps, GraphViewOps}, -}; - -use super::{eval_vertex_state::EVState, task_state::Local2, window_eval_vertex::WindowEvalVertex}; - -pub struct WindowEvalEdgeView<'a, G: GraphViewOps, CS: ComputeState, S: 'static> { - ss: usize, - ev: EdgeRef, - g: &'a G, - vertex_state: Rc>>, - local_state_prev: &'a Local2<'a, S>, - t_start: i64, - t_end: i64, - _s: PhantomData, -} - -impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> WindowEvalEdgeView<'a, G, CS, S> { - pub(crate) fn new( - ss: usize, - ev: EdgeRef, - g: &'a G, - local_state_prev: &'a Local2<'a, S>, - vertex_state: Rc>>, - t_start: i64, - t_end: i64, - ) -> Self { - Self { - ss, - ev, - g, - vertex_state, - local_state_prev, - t_start, - t_end, - _s: PhantomData, - } - } - - pub fn history(&self) -> Vec { - self.graph() - .edge_timestamps(self.eref(), Some(self.t_start..self.t_end)) - } -} -impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> - EdgeViewInternalOps> for WindowEvalEdgeView<'a, G, CS, S> -{ - fn graph(&self) -> G { - self.g.clone() - } - - fn eref(&self) -> EdgeRef { - self.ev.clone() - } - - fn new_vertex(&self, v: crate::core::vertex_ref::VertexRef) -> WindowEvalVertex<'a, G, CS, S> { - 
WindowEvalVertex::new( - self.ss, - self.g.localise_vertex_unchecked(v), - self.g, - None, - self.local_state_prev, - self.vertex_state.clone(), - self.t_start, - self.t_end, - ) - } - - fn new_edge(&self, e: EdgeRef) -> Self { - WindowEvalEdgeView::new( - self.ss, - e, - self.g, - self.local_state_prev, - self.vertex_state.clone(), - self.t_start, - self.t_end, - ) - } -} - -impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> EdgeViewOps - for WindowEvalEdgeView<'a, G, CS, S> -{ - type Graph = G; - - type Vertex = WindowEvalVertex<'a, G, CS, S>; - - type EList = Box + 'a>; - - fn explode(&self) -> Self::EList { - let e = self.ev.clone(); - let t_start = self.t_start; - let t_end = self.t_end; - let ss = self.ss; - let g = self.g; - let vertex_state = self.vertex_state.clone(); - let local_state_prev = self.local_state_prev; - - match self.ev.time() { - Some(_) => Box::new(iter::once(self.new_edge(e))), - None => { - let ts = self.g.edge_timestamps(self.ev, Some(t_start..t_end)); - Box::new(ts.into_iter().map(move |t| { - WindowEvalEdgeView::new( - ss, - e.at(t), - g, - local_state_prev, - vertex_state.clone(), - t_start, - t_end, - ) - })) - } - } - } - - fn history(&self) -> Vec { - self.graph() - .edge_timestamps(self.eref(), Some(self.t_start..self.t_end)) - } - - fn property_history(&self, name: String) -> Vec<(i64, Prop)> { - match self.eref().time() { - None => self.graph().temporal_edge_props_vec_window( - self.eref(), - name, - self.t_start, - self.t_end, - ), - Some(t) => self.graph().temporal_edge_props_vec_window( - self.eref(), - name, - t, - t.saturating_add(1), - ), - } - } - - fn property_histories(&self) -> HashMap> { - // match on the self.edge.time option property and run two function s - // one for static and one for temporal - match self.eref().time() { - None => self.graph().temporal_edge_props_window(self.eref(), self.t_start, self.t_end), - Some(t) => self - .graph() - .temporal_edge_props_window(self.eref(), t, t.saturating_add(1)), - } 
- } - - /// Check if edge is active at a given time point - fn active(&self, t: i64) -> bool { - match self.eref().time() { - Some(tt) => tt == t, - None => (self.t_start..self.t_end).contains(&t) && self.graph().has_edge_ref_window( - self.eref().src(), - self.eref().dst(), - t, - t.saturating_add(1), - self.eref().layer(), - ), - } - } - - /// Gets the first time an edge was seen - fn earliest_time(&self) -> Option { - self.eref().time().or_else(|| { - self.graph() - .edge_timestamps(self.eref(), Some(self.t_start..self.t_end)) - .first() - .copied() - }) - } - - /// Gets the latest time an edge was updated - fn latest_time(&self) -> Option { - self.eref().time().or_else(|| { - self.graph() - .edge_timestamps(self.eref(), Some(self.t_start..self.t_end)) - .last() - .copied() - }) - } -} - -impl<'a, G: GraphViewOps, CS: ComputeState, S: 'static> EdgeListOps - for Box> + 'a> -{ - type Graph = G; - type Vertex = WindowEvalVertex<'a, G, CS, S>; - type Edge = WindowEvalEdgeView<'a, G, CS, S>; - type ValueType = T; - type VList = Box + 'a>; - type IterType = Box + 'a>; - - fn id(self) -> Self::IterType<(u64, u64)> { - Box::new(self.map(|e| e.id())) - } - - fn has_property(self, name: String, include_static: bool) -> Self::IterType { - Box::new(self.map(move |e| e.has_property(name.clone(), include_static))) - } - - fn property( - self, - name: String, - include_static: bool, - ) -> Self::IterType> { - Box::new(self.map(move |e| e.property(name.clone(), include_static))) - } - - fn properties( - self, - include_static: bool, - ) -> Self::IterType> { - Box::new(self.map(move |e| e.properties(include_static))) - } - - fn property_names(self, include_static: bool) -> Self::IterType> { - Box::new(self.map(move |e| e.property_names(include_static))) - } - - fn has_static_property(self, name: String) -> Self::IterType { - Box::new(self.map(move |e| e.has_static_property(name.clone()))) - } - - fn static_property(self, name: String) -> Self::IterType> { - 
Box::new(self.map(move |it| it.static_property(name.clone()))) - } - - fn property_history(self, name: String) -> Self::IterType> { - Box::new(self.map(move |it| it.property_history(name.clone()))) - } - - fn property_histories( - self, - ) -> Self::IterType>> { - Box::new(self.map(|it| it.property_histories())) - } - - fn src(self) -> Self::VList { - Box::new(self.map(|e| e.src())) - } - - fn dst(self) -> Self::VList { - Box::new(self.map(|e| e.dst())) - } - - fn explode(self) -> Self::IterType { - Box::new(self.flat_map(move |it| it.explode())) - } - - fn earliest_time(self) -> Self::IterType> { - Box::new(self.map(|e| e.earliest_time())) - } - - fn latest_time(self) -> Self::IterType> { - Box::new(self.map(|e| e.latest_time())) - } -} diff --git a/raphtory/src/db/doc_strings.rs b/raphtory/src/db/utils/doc_strings.rs similarity index 69% rename from raphtory/src/db/doc_strings.rs rename to raphtory/src/db/utils/doc_strings.rs index 9578ac6599..139b5b41d3 100644 --- a/raphtory/src/db/doc_strings.rs +++ b/raphtory/src/db/utils/doc_strings.rs @@ -10,16 +10,16 @@ Returns: } #[macro_export] -macro_rules! layer_doc_string { +macro_rules! layers_doc_string { () => { " -Create a view including all the edges in the layer `name` +Create a view including all the edges in the layers `names` Arguments: - name (str) : the name of the layer + names (str) : the names of the layers to include Returns: - a view including all the edges in the layer `name`" + a view including all the edges in the layers `names`" }; } diff --git a/raphtory/src/db/utils/mod.rs b/raphtory/src/db/utils/mod.rs new file mode 100644 index 0000000000..aefeca739a --- /dev/null +++ b/raphtory/src/db/utils/mod.rs @@ -0,0 +1 @@ +pub mod doc_strings; diff --git a/raphtory/src/db/vertex.rs b/raphtory/src/db/vertex.rs deleted file mode 100644 index c378c33781..0000000000 --- a/raphtory/src/db/vertex.rs +++ /dev/null @@ -1,474 +0,0 @@ -//! Defines the `Vertex` struct, which represents a vertex in the graph. 
- -use crate::core::time::IntoTime; -use crate::core::vertex_ref::{LocalVertexRef, VertexRef}; -use crate::core::{Direction, Prop}; -use crate::db::edge::{EdgeList, EdgeView}; -use crate::db::graph_layer::LayeredGraph; -use crate::db::graph_window::WindowedGraph; -use crate::db::path::{Operations, PathFromVertex}; -use crate::db::view_api::layer::LayerOps; -use crate::db::view_api::vertex::VertexViewOps; -use crate::db::view_api::{BoxedIter, GraphViewOps, TimeOps, VertexListOps}; -use std::collections::HashMap; - -#[derive(Debug, Clone)] -pub struct VertexView { - pub graph: G, - pub vertex: LocalVertexRef, -} - -impl From> for VertexRef { - fn from(value: VertexView) -> Self { - VertexRef::Local(value.vertex) - } -} - -impl From<&VertexView> for VertexRef { - fn from(value: &VertexView) -> Self { - VertexRef::Local(value.vertex) - } -} - -impl VertexView { - /// Creates a new `VertexView` wrapping a vertex reference and a graph, localising any remote vertices to the correct shard. - pub(crate) fn new(graph: G, vertex: VertexRef) -> VertexView { - match vertex { - VertexRef::Local(local) => Self::new_local(graph, local), - _ => { - let v = graph.localise_vertex_unchecked(vertex); - VertexView { graph, vertex: v } - } - } - } - - /// Creates a new `VertexView` wrapping a local vertex reference and a graph - pub(crate) fn new_local(graph: G, vertex: LocalVertexRef) -> VertexView { - VertexView { graph, vertex } - } -} - -/// View of a Vertex in a Graph -impl VertexViewOps for VertexView { - type Graph = G; - type ValueType = T; - type PathType<'a> = PathFromVertex where Self: 'a; - type EList = BoxedIter>; - - fn id(&self) -> u64 { - self.graph.vertex_id(self.vertex) - } - - fn name(&self) -> String { - self.graph.vertex_name(self.vertex) - } - - fn earliest_time(&self) -> Option { - self.graph.vertex_earliest_time(self.vertex) - } - - fn latest_time(&self) -> Option { - self.graph.vertex_latest_time(self.vertex) - } - - fn property(&self, name: String, 
include_static: bool) -> Option { - let props = self.property_history(name.clone()); - match props.last() { - None => { - if include_static { - self.graph.static_vertex_prop(self.vertex, name) - } else { - None - } - } - Some((_, prop)) => Some(prop.clone()), - } - } - - fn history(&self) -> Vec { - self.graph.vertex_timestamps(self.vertex) - } - - fn property_history(&self, name: String) -> Vec<(i64, Prop)> { - self.graph.temporal_vertex_prop_vec(self.vertex, name) - } - - fn properties(&self, include_static: bool) -> HashMap { - let mut props: HashMap = self - .property_histories() - .iter() - .map(|(key, values)| (key.clone(), values.last().unwrap().1.clone())) - .collect(); - - if include_static { - for prop_name in self.graph.static_vertex_prop_names(self.vertex) { - if let Some(prop) = self - .graph - .static_vertex_prop(self.vertex, prop_name.clone()) - { - props.insert(prop_name, prop); - } - } - } - props - } - - fn property_histories(&self) -> HashMap> { - self.graph.temporal_vertex_props(self.vertex) - } - - fn property_names(&self, include_static: bool) -> Vec { - let mut names: Vec = self.graph.temporal_vertex_prop_names(self.vertex); - if include_static { - names.extend(self.graph.static_vertex_prop_names(self.vertex)) - } - names - } - - fn has_property(&self, name: String, include_static: bool) -> bool { - (!self.property_history(name.clone()).is_empty()) - || (include_static - && self - .graph - .static_vertex_prop_names(self.vertex) - .contains(&name)) - } - - fn has_static_property(&self, name: String) -> bool { - self.graph - .static_vertex_prop_names(self.vertex) - .contains(&name) - } - - fn static_property(&self, name: String) -> Option { - self.graph.static_vertex_prop(self.vertex, name) - } - - fn degree(&self) -> usize { - let dir = Direction::BOTH; - self.graph.degree(self.vertex, dir, None) - } - - fn in_degree(&self) -> usize { - let dir = Direction::IN; - self.graph.degree(self.vertex, dir, None) - } - - fn out_degree(&self) -> usize { 
- let dir = Direction::OUT; - self.graph.degree(self.vertex, dir, None) - } - - fn edges(&self) -> EdgeList { - let g = self.graph.clone(); - let dir = Direction::BOTH; - Box::new( - g.vertex_edges(self.vertex, dir, None) - .map(move |e| EdgeView::new(g.clone(), e)), - ) - } - - fn in_edges(&self) -> EdgeList { - let g = self.graph.clone(); - let dir = Direction::IN; - Box::new( - g.vertex_edges(self.vertex, dir, None) - .map(move |e| EdgeView::new(g.clone(), e)), - ) - } - - fn out_edges(&self) -> EdgeList { - let g = self.graph.clone(); - let dir = Direction::OUT; - Box::new( - g.vertex_edges(self.vertex, dir, None) - .map(move |e| EdgeView::new(g.clone(), e)), - ) - } - - fn neighbours(&self) -> PathFromVertex { - let g = self.graph.clone(); - let dir = Direction::BOTH; - PathFromVertex::new(g, self, Operations::Neighbours { dir }) - } - - fn in_neighbours(&self) -> PathFromVertex { - let g = self.graph.clone(); - let dir = Direction::IN; - PathFromVertex::new(g, self, Operations::Neighbours { dir }) - } - - fn out_neighbours(&self) -> PathFromVertex { - let g = self.graph.clone(); - let dir = Direction::OUT; - PathFromVertex::new(g, self, Operations::Neighbours { dir }) - } -} - -impl TimeOps for VertexView { - type WindowedViewType = VertexView>; - - fn start(&self) -> Option { - self.graph.start() - } - - fn end(&self) -> Option { - self.graph.end() - } - - fn window(&self, t_start: T, t_end: T) -> Self::WindowedViewType { - VertexView { - graph: self.graph.window(t_start, t_end), - vertex: self.vertex, - } - } -} - -impl LayerOps for VertexView { - type LayeredViewType = VertexView>; - - fn default_layer(&self) -> Self::LayeredViewType { - VertexView { - graph: self.graph.default_layer(), - vertex: self.vertex, - } - } - - fn layer(&self, name: &str) -> Option { - Some(VertexView { - graph: self.graph.layer(name)?, - vertex: self.vertex, - }) - } -} - -/// Implementation of the VertexListOps trait for an iterator of VertexView objects. 
-/// -impl VertexListOps for Box> + Send> { - type Graph = G; - type Vertex = VertexView; - type IterType = Box + Send>; - type EList = Box> + Send>; - type ValueType = T; - - fn earliest_time(self) -> BoxedIter> { - Box::new(self.map(|v| v.start())) - } - - fn latest_time(self) -> BoxedIter> { - Box::new(self.map(|v| v.end().map(|t| t - 1))) - } - - fn window(self, t_start: i64, t_end: i64) -> BoxedIter>> { - Box::new(self.map(move |v| v.window(t_start, t_end))) - } - - fn id(self) -> BoxedIter { - Box::new(self.map(|v| v.id())) - } - - fn name(self) -> BoxedIter { - Box::new(self.map(|v| v.name())) - } - - fn property(self, name: String, include_static: bool) -> BoxedIter> { - Box::new(self.map(move |v| v.property(name.clone(), include_static))) - } - - fn property_history(self, name: String) -> BoxedIter> { - Box::new(self.map(move |v| v.property_history(name.clone()))) - } - - fn properties(self, include_static: bool) -> BoxedIter> { - Box::new(self.map(move |v| v.properties(include_static))) - } - - fn history(self) -> BoxedIter> { - Box::new(self.map(|v| v.history())) - } - - fn property_histories(self) -> BoxedIter>> { - Box::new(self.map(|v| v.property_histories())) - } - - fn property_names(self, include_static: bool) -> BoxedIter> { - Box::new(self.map(move |v| v.property_names(include_static))) - } - - fn has_property(self, name: String, include_static: bool) -> BoxedIter { - Box::new(self.map(move |v| v.has_property(name.clone(), include_static))) - } - - fn has_static_property(self, name: String) -> BoxedIter { - Box::new(self.map(move |v| v.has_static_property(name.clone()))) - } - - fn static_property(self, name: String) -> BoxedIter> { - Box::new(self.map(move |v| v.static_property(name.clone()))) - } - - fn degree(self) -> BoxedIter { - Box::new(self.map(|v| v.degree())) - } - - fn in_degree(self) -> BoxedIter { - Box::new(self.map(|v| v.in_degree())) - } - - fn out_degree(self) -> BoxedIter { - Box::new(self.map(|v| v.out_degree())) - } - - fn 
edges(self) -> Self::EList { - Box::new(self.flat_map(|v| v.edges())) - } - - fn in_edges(self) -> Self::EList { - Box::new(self.flat_map(|v| v.in_edges())) - } - - fn out_edges(self) -> Self::EList { - Box::new(self.flat_map(|v| v.out_edges())) - } - - fn neighbours(self) -> Self { - Box::new(self.flat_map(|v| v.neighbours())) - } - - fn in_neighbours(self) -> Self { - Box::new(self.flat_map(|v| v.in_neighbours())) - } - - fn out_neighbours(self) -> Self { - Box::new(self.flat_map(|v| v.out_neighbours())) - } -} - -impl VertexListOps for BoxedIter>> { - type Graph = G; - type Vertex = VertexView; - type IterType = BoxedIter>; - type EList = BoxedIter>>; - type ValueType = BoxedIter; - - fn earliest_time(self) -> BoxedIter>> { - Box::new(self.map(|it| it.earliest_time())) - } - - fn latest_time(self) -> BoxedIter>> { - Box::new(self.map(|it| it.latest_time())) - } - - fn window( - self, - t_start: i64, - t_end: i64, - ) -> BoxedIter>>> { - Box::new(self.map(move |it| it.window(t_start, t_end))) - } - - fn id(self) -> BoxedIter> { - Box::new(self.map(|it| it.id())) - } - - fn name(self) -> BoxedIter> { - Box::new(self.map(|it| it.name())) - } - - fn property( - self, - name: String, - include_static: bool, - ) -> BoxedIter>> { - Box::new(self.map(move |it| it.property(name.clone(), include_static))) - } - - fn property_history(self, name: String) -> BoxedIter>> { - Box::new(self.map(move |it| it.property_history(name.clone()))) - } - - fn properties(self, include_static: bool) -> BoxedIter>> { - Box::new(self.map(move |it| it.properties(include_static))) - } - - fn history(self) -> BoxedIter>> { - Box::new(self.map(move |it| it.history())) - } - - fn property_histories(self) -> BoxedIter>>> { - Box::new(self.map(|it| it.property_histories())) - } - - fn property_names(self, include_static: bool) -> BoxedIter>> { - Box::new(self.map(move |it| it.property_names(include_static))) - } - - fn has_property(self, name: String, include_static: bool) -> BoxedIter> { - 
Box::new(self.map(move |it| it.has_property(name.clone(), include_static))) - } - - fn has_static_property(self, name: String) -> BoxedIter> { - Box::new(self.map(move |it| it.has_static_property(name.clone()))) - } - - fn static_property(self, name: String) -> BoxedIter>> { - Box::new(self.map(move |it| it.static_property(name.clone()))) - } - - fn degree(self) -> BoxedIter> { - Box::new(self.map(|it| it.degree())) - } - - fn in_degree(self) -> BoxedIter> { - Box::new(self.map(|it| it.in_degree())) - } - - fn out_degree(self) -> BoxedIter> { - Box::new(self.map(|it| it.out_degree())) - } - - fn edges(self) -> Self::EList { - Box::new(self.map(|it| it.edges())) - } - - fn in_edges(self) -> Self::EList { - Box::new(self.map(|it| it.in_edges())) - } - - fn out_edges(self) -> Self::EList { - Box::new(self.map(|it| it.out_edges())) - } - - fn neighbours(self) -> Self { - Box::new(self.map(|it| it.neighbours())) - } - - fn in_neighbours(self) -> Self { - Box::new(self.map(|it| it.in_neighbours())) - } - - fn out_neighbours(self) -> Self { - Box::new(self.map(|it| it.out_neighbours())) - } -} - -#[cfg(test)] -mod vertex_test { - use crate::db::graph::Graph; - use crate::db::view_api::*; - - #[test] - fn test_earliest_time() { - let g = Graph::new(4); - g.add_vertex(0, 1, &vec![]).unwrap(); - g.add_vertex(1, 1, &vec![]).unwrap(); - g.add_vertex(2, 1, &vec![]).unwrap(); - let mut view = g.at(1); - assert_eq!(view.vertex(1).expect("v").earliest_time().unwrap(), 0); - assert_eq!(view.vertex(1).expect("v").latest_time().unwrap(), 1); - - view = g.at(3); - assert_eq!(view.vertex(1).expect("v").earliest_time().unwrap(), 0); - assert_eq!(view.vertex(1).expect("v").latest_time().unwrap(), 2); - } -} diff --git a/raphtory/src/db/view_api/edge.rs b/raphtory/src/db/view_api/edge.rs deleted file mode 100644 index 054c32a1e8..0000000000 --- a/raphtory/src/db/view_api/edge.rs +++ /dev/null @@ -1,230 +0,0 @@ -use crate::core::edge_ref::EdgeRef; -use crate::core::vertex_ref::VertexRef; 
-use crate::core::Prop; -use crate::db::view_api::internal::GraphViewInternalOps; -use crate::db::view_api::{GraphViewOps, VertexListOps, VertexViewOps}; -use std::collections::HashMap; - -pub trait EdgeViewInternalOps> { - fn graph(&self) -> G; - - fn eref(&self) -> EdgeRef; - - fn new_vertex(&self, v: VertexRef) -> V; - - fn new_edge(&self, e: EdgeRef) -> Self; -} - -pub trait EdgeViewOps: EdgeViewInternalOps { - type Graph: GraphViewOps; - type Vertex: VertexViewOps; - type EList: EdgeListOps; - - fn property(&self, name: String, include_static: bool) -> Option { - let props = self.property_history(name.clone()); - match props.last() { - None => { - if include_static { - self.graph().static_edge_prop(self.eref(), name) - } else { - None - } - } - Some((_, prop)) => Some(prop.clone()), - } - } - - fn property_history(&self, name: String) -> Vec<(i64, Prop)> { - match self.eref().time() { - None => self.graph().temporal_edge_props_vec(self.eref(), name), - Some(t) => self.graph().temporal_edge_props_vec_window( - self.eref(), - name, - t, - t.saturating_add(1), - ), - } - } - - fn history(&self) -> Vec { - self.graph().edge_timestamps(self.eref(), None) - } - - fn properties(&self, include_static: bool) -> HashMap { - let mut props: HashMap = self - .property_histories() - .iter() - .map(|(key, values)| (key.clone(), values.last().unwrap().1.clone())) - .collect(); - - if include_static { - for prop_name in self.graph().static_edge_prop_names(self.eref()) { - if let Some(prop) = self - .graph() - .static_edge_prop(self.eref(), prop_name.clone()) - { - props.insert(prop_name, prop); - } - } - } - props - } - - fn property_histories(&self) -> HashMap> { - // match on the self.edge.time option property and run two function s - // one for static and one for temporal - match self.eref().time() { - None => self.graph().temporal_edge_props(self.eref()), - Some(t) => self - .graph() - .temporal_edge_props_window(self.eref(), t, t.saturating_add(1)), - } - } - - fn 
property_names(&self, include_static: bool) -> Vec { - let mut names: Vec = self.graph().temporal_edge_prop_names(self.eref()); - if include_static { - names.extend(self.graph().static_edge_prop_names(self.eref())) - } - names - } - - fn has_property(&self, name: String, include_static: bool) -> bool { - (!self.property_history(name.clone()).is_empty()) - || (include_static - && self - .graph() - .static_edge_prop_names(self.eref()) - .contains(&name)) - } - - fn has_static_property(&self, name: String) -> bool { - self.graph() - .static_edge_prop_names(self.eref()) - .contains(&name) - } - - fn static_property(&self, name: String) -> Option { - self.graph().static_edge_prop(self.eref(), name) - } - - /// Returns the source vertex of the edge. - fn src(&self) -> Self::Vertex { - let vertex = self.eref().src(); - self.new_vertex(vertex) - } - - /// Returns the destination vertex of the edge. - fn dst(&self) -> Self::Vertex { - let vertex = self.eref().dst(); - self.new_vertex(vertex) - } - - /// Check if edge is active at a given time point - fn active(&self, t: i64) -> bool { - match self.eref().time() { - Some(tt) => tt == t, - None => self.graph().has_edge_ref_window( - self.eref().src(), - self.eref().dst(), - t, - t.saturating_add(1), - self.eref().layer(), - ), - } - } - - fn id( - &self, - ) -> ( - ::ValueType, - ::ValueType, - ) { - (self.src().id(), self.dst().id()) - } - - /// Explodes an edge and returns all instances it had been updated as seperate edges - fn explode(&self) -> Self::EList; - - /// Gets the first time an edge was seen - fn earliest_time(&self) -> Option { - self.eref().time().or_else(|| { - self.graph() - .edge_timestamps(self.eref(), None) - .first() - .copied() - }) - } - - /// Gets the latest time an edge was updated - fn latest_time(&self) -> Option { - self.eref().time().or_else(|| { - self.graph() - .edge_timestamps(self.eref(), None) - .last() - .copied() - }) - } - - /// Gets the time stamp of the edge if it is exploded - fn 
time(&self) -> Option { - self.eref().time() - } - - /// Gets the name of the layer this edge belongs to - fn layer_name(&self) -> String { - if self.eref().layer() == 0 { - "default layer".to_string() - } else { - self.graph().get_layer_name_by_id(self.eref().layer()) - } - } -} - -/// This trait defines the operations that can be -/// performed on a list of edges in a temporal graph view. -pub trait EdgeListOps: - IntoIterator, IntoIter = Self::IterType> + Sized -{ - type Graph: GraphViewOps; - type Vertex: VertexViewOps; - type Edge: EdgeViewOps; - type ValueType; - - /// the type of list of vertices - type VList: VertexListOps; - - /// the type of iterator - type IterType: Iterator>; - - fn has_property(self, name: String, include_static: bool) -> Self::IterType; - - fn property(self, name: String, include_static: bool) -> Self::IterType>; - fn properties(self, include_static: bool) -> Self::IterType>; - fn property_names(self, include_static: bool) -> Self::IterType>; - - fn has_static_property(self, name: String) -> Self::IterType; - fn static_property(self, name: String) -> Self::IterType>; - - /// gets a property of an edge with the given name - /// includes the timestamp of the property - fn property_history(self, name: String) -> Self::IterType>; - fn property_histories(self) -> Self::IterType>>; - - /// gets the source vertices of the edges in the list - fn src(self) -> Self::VList; - - /// gets the destination vertices of the edges in the list - fn dst(self) -> Self::VList; - - fn id(self) -> Self::IterType<(u64, u64)>; - - /// returns a list of exploded edges that include an edge at each point in time - fn explode(self) -> Self::IterType; - - /// Get the timestamp for the earliest activity of the edge - fn earliest_time(self) -> Self::IterType>; - - /// Get the timestamp for the latest activity of the edge - fn latest_time(self) -> Self::IterType>; -} diff --git a/raphtory/src/db/view_api/graph.rs b/raphtory/src/db/view_api/graph.rs deleted file mode 
100644 index 11c41920be..0000000000 --- a/raphtory/src/db/view_api/graph.rs +++ /dev/null @@ -1,176 +0,0 @@ -use itertools::Itertools; -use rustc_hash::FxHashSet; - -use crate::core::time::IntoTime; -use crate::core::vertex_ref::{LocalVertexRef, VertexRef}; -use crate::db::edge::EdgeView; -use crate::db::graph_layer::LayeredGraph; -use crate::db::graph_window::WindowedGraph; -use crate::db::subgraph_vertex::VertexSubgraph; -use crate::db::vertex::VertexView; -use crate::db::vertices::Vertices; -use crate::db::view_api::internal::GraphViewInternalOps; -use crate::db::view_api::layer::LayerOps; -use crate::db::view_api::time::TimeOps; -use crate::db::view_api::VertexViewOps; - -/// This trait GraphViewOps defines operations for accessing -/// information about a graph. The trait has associated types -/// that are used to define the type of the vertices, edges -/// and the corresponding iterators. -pub trait GraphViewOps: Send + Sync + Sized + GraphViewInternalOps + 'static + Clone { - fn subgraph, V: Into>( - &self, - vertices: I, - ) -> VertexSubgraph; - fn get_unique_layers(&self) -> Vec; - /// Timestamp of earliest activity in the graph - fn earliest_time(&self) -> Option; - /// Timestamp of latest activity in the graph - fn latest_time(&self) -> Option; - /// Return the number of vertices in the graph. - fn num_vertices(&self) -> usize; - - /// Check if the graph is empty. - fn is_empty(&self) -> bool { - self.num_vertices() == 0 - } - - /// Return the number of edges in the graph. - fn num_edges(&self) -> usize; - - /// Check if the graph contains a vertex `v`. - fn has_vertex>(&self, v: T) -> bool; - - /// Check if the graph contains an edge given a pair of vertices `(src, dst)`. - fn has_edge>(&self, src: T, dst: T, layer: Option<&str>) -> bool; - - /// Get a vertex `v`. - fn vertex>(&self, v: T) -> Option>; - - /// Return a View of the vertices in the Graph - fn vertices(&self) -> Vertices; - - /// Get an edge `(src, dst)`. 
- fn edge>( - &self, - src: T, - dst: T, - layer: Option<&str>, - ) -> Option>; - - /// Return an iterator over all edges in the graph. - fn edges(&self) -> Box> + Send>; -} - -impl GraphViewOps for G { - fn subgraph, V: Into>( - &self, - vertices: I, - ) -> VertexSubgraph { - let vertices: FxHashSet = vertices - .into_iter() - .flat_map(|v| self.local_vertex(v.into())) - .collect(); - VertexSubgraph::new(self.clone(), vertices) - } - - fn get_unique_layers(&self) -> Vec { - self.get_unique_layers_internal() - .into_iter() - .filter(|id| *id != 0) // the default layer has no name - .map(|id| self.get_layer_name_by_id(id)) - .collect_vec() - } - - fn earliest_time(&self) -> Option { - self.earliest_time_global() - } - - fn latest_time(&self) -> Option { - self.latest_time_global() - } - - fn num_vertices(&self) -> usize { - self.vertices_len() - } - - fn num_edges(&self) -> usize { - self.edges_len(None) - } - - fn has_vertex>(&self, v: T) -> bool { - self.has_vertex_ref(v.into()) - } - - fn has_edge>(&self, src: T, dst: T, layer: Option<&str>) -> bool { - match self.get_layer(layer) { - Some(layer_id) => self.has_edge_ref(src.into(), dst.into(), layer_id), - None => false, - } - } - - fn vertex>(&self, v: T) -> Option> { - let v = v.into(); - self.local_vertex(v) - .map(|v| VertexView::new_local(self.clone(), v)) - } - - fn vertices(&self) -> Vertices { - let graph = self.clone(); - Vertices::new(graph) - } - - fn edge>( - &self, - src: T, - dst: T, - layer: Option<&str>, - ) -> Option> { - let layer_id = match layer { - Some(_) => self.get_layer(layer)?, - None => { - let layers = self.get_unique_layers_internal(); - match layers[..] 
{ - [layer_id] => layer_id, // if only one layer we search the edge there - _ => 0, // if more than one, we point to the default one - } - } - }; - self.edge_ref(src.into(), dst.into(), layer_id) - .map(|e| EdgeView::new(self.clone(), e)) - } - - fn edges(&self) -> Box> + Send> { - Box::new(self.vertices().iter().flat_map(|v| v.out_edges())) - } -} - -impl TimeOps for G { - type WindowedViewType = WindowedGraph; - - fn start(&self) -> Option { - self.view_start() - } - - fn end(&self) -> Option { - self.view_end() - } - - fn window(&self, t_start: T, t_end: T) -> WindowedGraph { - WindowedGraph::new(self.clone(), t_start, t_end) - } -} - -impl LayerOps for G { - type LayeredViewType = LayeredGraph; - - fn default_layer(&self) -> Self::LayeredViewType { - LayeredGraph::new(self.clone(), 0) - } - - fn layer(&self, name: &str) -> Option { - let id = self.get_layer(Some(name))?; - Some(LayeredGraph::new(self.clone(), id)) - } -} diff --git a/raphtory/src/db/view_api/internal.rs b/raphtory/src/db/view_api/internal.rs deleted file mode 100644 index b484bba887..0000000000 --- a/raphtory/src/db/view_api/internal.rs +++ /dev/null @@ -1,1014 +0,0 @@ -use crate::core::edge_ref::EdgeRef; -use crate::core::vertex_ref::{LocalVertexRef, VertexRef}; -use crate::core::{Direction, Prop}; -use std::collections::HashMap; -use std::ops::Range; - -/// The GraphViewInternalOps trait provides a set of methods to query a directed graph -/// represented by the raphtory_core::tgraph::TGraph struct. -pub trait GraphViewInternalOps { - /// Gets the local reference for a remote vertex and keeps local references unchanged. Assumes vertex exists! - fn localise_vertex_unchecked(&self, v: VertexRef) -> LocalVertexRef { - match v { - VertexRef::Local(v) => v, - VertexRef::Remote(g_id) => self.vertex_ref(g_id).expect("Vertex should already exists"), - } - } - - /// Check if a vertex exists locally and returns local reference. 
- fn local_vertex(&self, v: VertexRef) -> Option; - - /// Check if a vertex exists locally in the window and returns local reference. - fn local_vertex_window(&self, v: VertexRef, t_start: i64, t_end: i64) - -> Option; - - fn get_unique_layers_internal(&self) -> Vec; - - fn get_layer_name_by_id(&self, layer_id: usize) -> String; - - /// Get the layer id for the given layer name - fn get_layer(&self, key: Option<&str>) -> Option; - - /// Returns the default start time for perspectives over the view - fn view_start(&self) -> Option; - - /// Returns the default end time for perspectives over the view - fn view_end(&self) -> Option; - - /// Returns the timestamp for the earliest activity - fn earliest_time_global(&self) -> Option; - - /// Returns the timestamp for the earliest activity in the window - fn earliest_time_window(&self, t_start: i64, t_end: i64) -> Option; - - /// Returns the timestamp for the latest activity - fn latest_time_global(&self) -> Option; - - /// Returns the timestamp for the latest activity in the window - fn latest_time_window(&self, t_start: i64, t_end: i64) -> Option; - - /// Returns the total number of vertices in the graph. - fn vertices_len(&self) -> usize; - - /// Returns the number of vertices in the graph that were created between - /// the start (t_start) and end (t_end) timestamps (inclusive). - /// # Arguments - /// - /// * `t_start` - The start time of the window (inclusive). - /// * `t_end` - The end time of the window (exclusive). - fn vertices_len_window(&self, t_start: i64, t_end: i64) -> usize; - - /// Returns the total number of edges in the graph. - fn edges_len(&self, layer: Option) -> usize; - - /// Returns the number of edges in the graph that were created between the - /// start (t_start) and end (t_end) timestamps (inclusive). - /// # Arguments - /// - /// * `t_start` - The start time of the window (inclusive). - /// * `t_end` - The end time of the window (exclusive). 
- fn edges_len_window(&self, t_start: i64, t_end: i64, layer: Option) -> usize; - - /// Returns true if the graph contains an edge between the source vertex - /// (src) and the destination vertex (dst). - /// # Arguments - /// - /// * `src` - The source vertex of the edge. - /// * `dst` - The destination vertex of the edge. - fn has_edge_ref(&self, src: VertexRef, dst: VertexRef, layer: usize) -> bool; - - /// Returns true if the graph contains an edge between the source vertex (src) and the - /// destination vertex (dst) created between the start (t_start) and end (t_end) timestamps - /// (inclusive). - /// # Arguments - /// - /// * `t_start` - The start time of the window (inclusive). - /// * `t_end` - The end time of the window (exclusive). - /// * `src` - The source vertex of the edge. - /// * `dst` - The destination vertex of the edge. - fn has_edge_ref_window( - &self, - src: VertexRef, - dst: VertexRef, - t_start: i64, - t_end: i64, - layer: usize, - ) -> bool; - - /// Returns true if the graph contains the specified vertex (v). - /// # Arguments - /// - /// * `v` - VertexRef of the vertex to check. - fn has_vertex_ref(&self, v: VertexRef) -> bool; - - /// Returns true if the graph contains the specified vertex (v) created between the - /// start (t_start) and end (t_end) timestamps (inclusive). - /// # Arguments - /// - /// * `v` - VertexRef of the vertex to check. - /// * `t_start` - The start time of the window (inclusive). - /// * `t_end` - The end time of the window (exclusive). - fn has_vertex_ref_window(&self, v: VertexRef, t_start: i64, t_end: i64) -> bool; - - /// Returns the number of edges that point towards or from the specified vertex - /// (v) based on the direction (d). - /// # Arguments - /// - /// * `v` - LocalVertexRef of the vertex to check. - /// * `d` - Direction of the edges to count. 
- fn degree(&self, v: LocalVertexRef, d: Direction, layer: Option) -> usize; - - /// Returns the number of edges that point towards or from the specified vertex (v) - /// created between the start (t_start) and end (t_end) timestamps (inclusive) based - /// on the direction (d). - /// # Arguments - /// - /// * `v` - LocalVertexRef of the vertex to check. - /// * `t_start` - The start time of the window (inclusive). - /// * `t_end` - The end time of the window (exclusive). - fn degree_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - d: Direction, - layer: Option, - ) -> usize; - - /// Returns the LocalVertexRef that corresponds to the specified vertex ID (v). - /// Returns None if the vertex ID is not present in the graph. - /// # Arguments - /// - /// * `v` - The vertex ID to lookup. - fn vertex_ref(&self, v: u64) -> Option; - - /// Returns the global ID for a vertex - fn vertex_id(&self, v: LocalVertexRef) -> u64; - - /// Returns the string name for a vertex - fn vertex_name(&self, v: LocalVertexRef) -> String { - match self.static_vertex_prop(v, "_id".to_string()) { - None => self.vertex_id(v).to_string(), - Some(prop) => prop.to_string(), - } - } - - /// Returns the LocalVertexRef that corresponds to the specified vertex ID (v) created - /// between the start (t_start) and end (t_end) timestamps (inclusive). - /// Returns None if the vertex ID is not present in the graph. - /// # Arguments - /// - /// * `v` - The vertex ID to lookup. - /// * `t_start` - The start time of the window (inclusive). - /// * `t_end` - The end time of the window (exclusive). - /// - /// # Returns - /// * `Option` - The LocalVertexRef of the vertex if it exists in the graph. 
- fn vertex_ref_window(&self, v: u64, t_start: i64, t_end: i64) -> Option; - - /// Return the earliest time for a vertex - fn vertex_earliest_time(&self, v: LocalVertexRef) -> Option; - - /// Return the earliest time for a vertex in a window - fn vertex_earliest_time_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - ) -> Option; - - /// Return the latest time for a vertex - fn vertex_latest_time(&self, v: LocalVertexRef) -> Option; - - /// Return the latest time for a vertex in a window - fn vertex_latest_time_window(&self, v: LocalVertexRef, t_start: i64, t_end: i64) - -> Option; - - /// Returns all the vertex references in the graph. - /// # Returns - /// * `Box + Send>` - An iterator over all the vertex - /// references in the graph. - fn vertex_refs(&self) -> Box + Send>; - - /// Returns all the vertex references in the graph created between the start (t_start) and - /// end (t_end) timestamps (inclusive). - /// # Arguments - /// - /// * `t_start` - The start time of the window (inclusive). - /// * `t_end` - The end time of the window (exclusive). - /// - /// # Returns - /// * `Box + Send>` - An iterator over all the vertexes - fn vertex_refs_window( - &self, - t_start: i64, - t_end: i64, - ) -> Box + Send>; - - fn vertex_refs_shard(&self, shard: usize) -> Box + Send>; - - /// Returns all the vertex references in the graph that are in the specified shard. - /// Between the start (t_start) and end (t_end) - /// - /// # Arguments - /// shard - The shard to return the vertex references for. - /// t_start - The start time of the window (inclusive). - /// t_end - The end time of the window (exclusive). - /// - /// # Returns - /// * `Box + Send>` - An iterator over all the vertexes - fn vertex_refs_window_shard( - &self, - shard: usize, - t_start: i64, - t_end: i64, - ) -> Box + Send>; - - /// Returns the edge reference that corresponds to the specified src and dst vertex - /// # Arguments - /// - /// * `src` - The source vertex. 
- /// * `dst` - The destination vertex. - /// - /// # Returns - /// - /// * `Option` - The edge reference if it exists. - fn edge_ref(&self, src: VertexRef, dst: VertexRef, layer: usize) -> Option; - - /// Returns the edge reference that corresponds to the specified src and dst vertex - /// created between the start (t_start) and end (t_end) timestamps (exclusive). - /// - /// # Arguments - /// - /// * `src` - The source vertex. - /// * `dst` - The destination vertex. - /// * `t_start` - The start time of the window (inclusive). - /// * `t_end` - The end time of the window (exclusive). - /// - /// # Returns - /// - /// * `Option` - The edge reference if it exists. - fn edge_ref_window( - &self, - src: VertexRef, - dst: VertexRef, - t_start: i64, - t_end: i64, - layer: usize, - ) -> Option; - - /// Returns all the edge references in the graph. - /// - /// # Returns - /// - /// * `Box + Send>` - An iterator over all the edge references. - fn edge_refs(&self, layer: Option) -> Box + Send>; - - /// Returns all the edge references in the graph created between the start (t_start) and - /// end (t_end) timestamps (inclusive). - /// - /// # Arguments - /// - /// * `t_start` - The start time of the window (inclusive). - /// * `t_end` - The end time of the window (exclusive). - /// # Returns - /// - /// * `Box + Send>` - An iterator over all the edge references. - fn edge_refs_window( - &self, - t_start: i64, - t_end: i64, - layer: Option, - ) -> Box + Send>; - - /// Returns an iterator over the edges connected to a given vertex in a given direction. - /// - /// # Arguments - /// - /// * `v` - A reference to the vertex for which the edges are being queried. - /// * `d` - The direction in which to search for edges. - /// * `layer` - The optional layer to consider - /// - /// # Returns - /// - /// Box + Send> - A boxed iterator that yields references to - /// the edges connected to the vertex. 
- fn vertex_edges( - &self, - v: LocalVertexRef, - d: Direction, - layer: Option, - ) -> Box + Send>; - - /// Returns an iterator over the exploded edges connected to a given vertex in a given direction. - /// - /// # Arguments - /// - /// * `v` - A reference to the vertex for which the edges are being queried. - /// * `d` - The direction in which to search for edges. - /// - /// # Returns - /// - /// Box + Send> - A boxed iterator that yields references to - /// the edges connected to the vertex. - fn vertex_edges_t( - &self, - v: LocalVertexRef, - d: Direction, - layer: Option, - ) -> Box + Send>; - - /// Returns an iterator over the edges connected to a given vertex within a - /// specified time window in a given direction. - /// - /// # Arguments - /// - /// * `v` - A reference to the vertex for which the edges are being queried. - /// * `t_start` - The start time of the window (inclusive). - /// * `t_end` - The end time of the window (exclusive). - /// * `d` - The direction in which to search for edges. - /// - /// # Returns - /// - /// Box + Send> - A boxed iterator that yields references - /// to the edges connected to the vertex within the specified time window. - fn vertex_edges_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - d: Direction, - layer: Option, - ) -> Box + Send>; - - /// Returns an iterator over the edges connected to a given vertex within - /// a specified time window in a given direction but exploded. - /// - /// # Arguments - /// - /// * `v` - A reference to the vertex for which the edges are being queried. - /// * `t_start` - The start time of the window (inclusive). - /// * `t_end` - The end time of the window (exclusive). - /// * `d` - The direction in which to search for edges. - /// - /// # Returns - /// - /// A boxed iterator that yields references to the edges connected to the vertex - /// within the specified time window but exploded. 
- fn vertex_edges_window_t( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - d: Direction, - layer: Option, - ) -> Box + Send>; - - /// Returns an iterator over the neighbors of a given vertex in a given direction. - /// - /// # Arguments - /// - /// * `v` - A reference to the vertex for which the neighbors are being queried. - /// * `d` - The direction in which to search for neighbors. - /// - /// # Returns - /// - /// A boxed iterator that yields references to the neighboring vertices. - fn neighbours( - &self, - v: LocalVertexRef, - d: Direction, - layer: Option, - ) -> Box + Send>; - - /// Returns an iterator over the neighbors of a given vertex within a specified time window in a given direction. - /// - /// # Arguments - /// - /// * `v` - A reference to the vertex for which the neighbors are being queried. - /// * `t_start` - The start time of the window (inclusive). - /// * `t_end` - The end time of the window (exclusive). - /// * `d` - The direction in which to search for neighbors. - /// - /// # Returns - /// - /// A boxed iterator that yields references to the neighboring vertices within the specified time window. - fn neighbours_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - d: Direction, - layer: Option, - ) -> Box + Send>; - - /// Gets a static property of a given vertex given the name and vertex reference. - /// - /// # Arguments - /// - /// * `v` - A reference to the vertex for which the property is being queried. - /// * `name` - The name of the property. - /// - /// # Returns - /// - /// Option - The property value if it exists. - fn static_vertex_prop(&self, v: LocalVertexRef, name: String) -> Option; - - /// Gets the keys of static properties of a given vertex - /// - /// # Arguments - /// - /// * `v` - A reference to the vertex for which the property is being queried. - /// - /// # Returns - /// - /// Vec - The keys of the static properties. 
- fn static_vertex_prop_names(&self, v: LocalVertexRef) -> Vec; - - /// Returns a vector of all names of temporal properties within the given vertex - /// - /// # Arguments - /// - /// * `v` - A reference to the vertex for which to retrieve the names. - /// - /// # Returns - /// - /// A vector of strings representing the names of the temporal properties - fn temporal_vertex_prop_names(&self, v: LocalVertexRef) -> Vec; - - /// Returns a vector of all temporal values of the vertex property with the given name for the - /// given vertex - /// - /// # Arguments - /// - /// * `v` - A reference to the vertex for which to retrieve the temporal property vector. - /// * `name` - The name of the property to retrieve. - /// - /// # Returns - /// - /// A vector of tuples representing the temporal values of the property for the given vertex - /// that fall within the specified time window, where the first element of each tuple is the timestamp - /// and the second element is the property value. - fn temporal_vertex_prop_vec(&self, v: LocalVertexRef, name: String) -> Vec<(i64, Prop)>; - - /// Returns a vector of all temporal values of the vertex - /// - /// # Arguments - /// - /// * `v` - A reference to the vertex for which to retrieve the timestamp. - /// - /// # Returns - /// - /// A vector of timestamps representing the temporal values for the given vertex. - fn vertex_timestamps(&self, v: LocalVertexRef) -> Vec; - - /// Returns a vector of all temporal values of the vertex for a given window. - /// - /// # Arguments - /// - /// * `v` - A reference to the vertex for which to retrieve the timestamp. - /// * `t_start` - The start time of the window. - /// * `t_end` - The end time of the window. - /// - /// # Returns - /// - /// A vector of timestamps representing the temporal values for the given vertex in a given window. 
- fn vertex_timestamps_window(&self, v: LocalVertexRef, t_start: i64, t_end: i64) -> Vec; - - /// Returns a vector of all temporal values of the vertex property with the given name for the given vertex - /// that fall within the specified time window. - /// - /// # Arguments - /// - /// * `v` - A reference to the vertex for which to retrieve the temporal property vector. - /// * `name` - The name of the property to retrieve. - /// * `t_start` - The start time of the window to consider. - /// * `t_end` - The end time of the window to consider. - /// - /// # Returns - /// - /// A vector of tuples representing the temporal values of the property for the given vertex - /// that fall within the specified time window, where the first element of each tuple is the timestamp - /// and the second element is the property value. - fn temporal_vertex_prop_vec_window( - &self, - v: LocalVertexRef, - name: String, - t_start: i64, - t_end: i64, - ) -> Vec<(i64, Prop)>; - - /// Returns a map of all temporal values of the vertex properties for the given vertex. - /// The keys of the map are the names of the properties, and the values are vectors of tuples - /// - /// # Arguments - /// - /// - `v` - A reference to the vertex for which to retrieve the temporal property vector. - /// - /// # Returns - /// - A map of all temporal values of the vertex properties for the given vertex. - fn temporal_vertex_props(&self, v: LocalVertexRef) -> HashMap>; - - /// Returns a map of all temporal values of the vertex properties for the given vertex - /// that fall within the specified time window. - /// - /// # Arguments - /// - /// - `v` - A reference to the vertex for which to retrieve the temporal property vector. - /// - `t_start` - The start time of the window to consider (inclusive). - /// - `t_end` - The end time of the window to consider (exclusive). 
- /// - /// # Returns - /// - A map of all temporal values of the vertex properties for the given vertex - fn temporal_vertex_props_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - ) -> HashMap>; - - /// Returns a vector of all temporal values of the edge property with the given name for the - /// given edge reference. - /// - /// # Arguments - /// - /// * `e` - An `EdgeRef` reference to the edge of interest. - /// * `name` - A `String` containing the name of the temporal property. - /// - /// # Returns - /// - /// A property if it exists - fn static_edge_prop(&self, e: EdgeRef, name: String) -> Option; - - /// Returns a vector of keys for the static properties of the given edge reference. - /// - /// # Arguments - /// - /// * `e` - An `EdgeRef` reference to the edge of interest. - /// - /// # Returns - /// - /// * A `Vec` of `String` containing the keys for the static properties of the given edge. - fn static_edge_prop_names(&self, e: EdgeRef) -> Vec; - - /// Returns a vector of keys for the temporal properties of the given edge reference. - /// - /// # Arguments - /// - /// * `e` - An `EdgeRef` reference to the edge of interest. - /// - /// # Returns - /// - /// * A `Vec` of `String` containing the keys for the temporal properties of the given edge. - fn temporal_edge_prop_names(&self, e: EdgeRef) -> Vec; - - /// Returns a vector of tuples containing the values of the temporal property with the given name - /// for the given edge reference. - /// - /// # Arguments - /// - /// * `e` - An `EdgeRef` reference to the edge of interest. - /// * `name` - A `String` containing the name of the temporal property. - /// - /// # Returns - /// - /// * A `Vec` of tuples containing the values of the temporal property with the given name for the given edge. 
- fn temporal_edge_props_vec(&self, e: EdgeRef, name: String) -> Vec<(i64, Prop)>; - - /// Returns a vector of tuples containing the values of the temporal property with the given name - /// for the given edge reference within the specified time window. - /// - /// # Arguments - /// - /// * `e` - An `EdgeRef` reference to the edge of interest. - /// * `name` - A `String` containing the name of the temporal property. - /// * `t_start` - An `i64` containing the start time of the time window (inclusive). - /// * `t_end` - An `i64` containing the end time of the time window (exclusive). - /// - /// # Returns - /// - /// * A `Vec` of tuples containing the values of the temporal property with the given name for the given edge - /// within the specified time window. - /// - fn temporal_edge_props_vec_window( - &self, - e: EdgeRef, - name: String, - t_start: i64, - t_end: i64, - ) -> Vec<(i64, Prop)>; - - fn edge_timestamps(&self, e: EdgeRef, window: Option>) -> Vec; - - /// Returns a hash map containing all the temporal properties of the given edge reference, - /// where each key is the name of a temporal property and each value is a vector of tuples containing - /// the property value and the time it was recorded. - /// - /// # Arguments - /// - /// * `e` - An `EdgeRef` reference to the edge. - /// - /// # Returns - /// - /// * A `HashMap` containing all the temporal properties of the given edge, where each key is the name of a - /// temporal property and each value is a vector of tuples containing the property value and the time it was recorded. - /// - fn temporal_edge_props(&self, e: EdgeRef) -> HashMap>; - - /// Returns a hash map containing all the temporal properties of the given edge reference within the specified - /// time window, where each key is the name of a temporal property and each value is a vector of tuples containing - /// the property value and the time it was recorded. - /// - /// # Arguments - /// - /// * `e` - An `EdgeRef` reference to the edge. 
- /// * `t_start` - An `i64` containing the start time of the time window (inclusive). - /// * `t_end` - An `i64` containing the end time of the time window (exclusive). - /// - /// # Returns - /// - /// * A `HashMap` containing all the temporal properties of the given edge within the specified time window, - /// where each key is the name of a temporal property and each value is a vector of tuples containing the property - /// value and the time it was recorded. - /// - fn temporal_edge_props_window( - &self, - e: EdgeRef, - t_start: i64, - t_end: i64, - ) -> HashMap>; - - fn num_shards(&self) -> usize; -} - -pub trait WrappedGraph { - type Internal: GraphViewInternalOps + Send + Sync + 'static + ?Sized; - - fn as_graph(&self) -> &Self::Internal; -} - -/// Helper trait for various graphs that just delegate to the internal graph -/// -impl GraphViewInternalOps for G -where - G: WrappedGraph, -{ - fn local_vertex(&self, v: VertexRef) -> Option { - self.as_graph().local_vertex(v) - } - - fn local_vertex_window( - &self, - v: VertexRef, - t_start: i64, - t_end: i64, - ) -> Option { - self.as_graph().local_vertex_window(v, t_start, t_end) - } - - fn get_unique_layers_internal(&self) -> Vec { - self.as_graph().get_unique_layers_internal() - } - - fn get_layer_name_by_id(&self, layer_id: usize) -> String { - self.as_graph().get_layer_name_by_id(layer_id) - } - - fn get_layer(&self, key: Option<&str>) -> Option { - self.as_graph().get_layer(key) - } - - fn view_start(&self) -> Option { - self.as_graph().view_start() - } - - fn view_end(&self) -> Option { - self.as_graph().view_end() - } - - fn earliest_time_global(&self) -> Option { - self.as_graph().earliest_time_global() - } - - fn earliest_time_window(&self, t_start: i64, t_end: i64) -> Option { - self.as_graph().earliest_time_window(t_start, t_end) - } - - fn latest_time_global(&self) -> Option { - self.as_graph().latest_time_global() - } - - fn latest_time_window(&self, t_start: i64, t_end: i64) -> Option { - 
self.as_graph().latest_time_window(t_start, t_end) - } - - fn vertices_len(&self) -> usize { - self.as_graph().vertices_len() - } - - fn vertices_len_window(&self, t_start: i64, t_end: i64) -> usize { - self.as_graph().vertices_len_window(t_start, t_end) - } - - fn edges_len(&self, layer: Option) -> usize { - self.as_graph().edges_len(layer) - } - - fn edges_len_window(&self, t_start: i64, t_end: i64, layer: Option) -> usize { - self.as_graph().edges_len_window(t_start, t_end, layer) - } - - fn has_edge_ref(&self, src: VertexRef, dst: VertexRef, layer: usize) -> bool { - self.as_graph().has_edge_ref(src, dst, layer) - } - - fn has_edge_ref_window( - &self, - src: VertexRef, - dst: VertexRef, - t_start: i64, - t_end: i64, - layer: usize, - ) -> bool { - self.as_graph() - .has_edge_ref_window(src, dst, t_start, t_end, layer) - } - - fn has_vertex_ref(&self, v: VertexRef) -> bool { - self.as_graph().has_vertex_ref(v) - } - - fn has_vertex_ref_window(&self, v: VertexRef, t_start: i64, t_end: i64) -> bool { - self.as_graph().has_vertex_ref_window(v, t_start, t_end) - } - - fn degree(&self, v: LocalVertexRef, d: Direction, layer: Option) -> usize { - self.as_graph().degree(v, d, layer) - } - - fn degree_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - d: Direction, - layer: Option, - ) -> usize { - self.as_graph().degree_window(v, t_start, t_end, d, layer) - } - - fn vertex_ref(&self, v: u64) -> Option { - self.as_graph().vertex_ref(v) - } - - fn vertex_id(&self, v: LocalVertexRef) -> u64 { - self.as_graph().vertex_id(v) - } - - fn vertex_ref_window(&self, v: u64, t_start: i64, t_end: i64) -> Option { - self.as_graph().vertex_ref_window(v, t_start, t_end) - } - - fn vertex_earliest_time(&self, v: LocalVertexRef) -> Option { - self.as_graph().vertex_earliest_time(v) - } - - fn vertex_earliest_time_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - ) -> Option { - self.as_graph() - .vertex_earliest_time_window(v, t_start, t_end) - } 
- - fn vertex_latest_time(&self, v: LocalVertexRef) -> Option { - self.as_graph().vertex_latest_time(v) - } - - fn vertex_latest_time_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - ) -> Option { - self.as_graph().vertex_latest_time_window(v, t_start, t_end) - } - - fn vertex_refs(&self) -> Box + Send> { - self.as_graph().vertex_refs() - } - - fn vertex_refs_window( - &self, - t_start: i64, - t_end: i64, - ) -> Box + Send> { - self.as_graph().vertex_refs_window(t_start, t_end) - } - - fn vertex_refs_shard(&self, shard: usize) -> Box + Send> { - self.as_graph().vertex_refs_shard(shard) - } - - fn vertex_refs_window_shard( - &self, - shard: usize, - t_start: i64, - t_end: i64, - ) -> Box + Send> { - self.as_graph() - .vertex_refs_window_shard(shard, t_start, t_end) - } - - fn edge_ref(&self, src: VertexRef, dst: VertexRef, layer: usize) -> Option { - self.as_graph().edge_ref(src, dst, layer) - } - - fn edge_ref_window( - &self, - src: VertexRef, - dst: VertexRef, - t_start: i64, - t_end: i64, - layer: usize, - ) -> Option { - self.as_graph() - .edge_ref_window(src, dst, t_start, t_end, layer) - } - - fn edge_refs(&self, layer: Option) -> Box + Send> { - self.as_graph().edge_refs(layer) - } - - fn edge_refs_window( - &self, - t_start: i64, - t_end: i64, - layer: Option, - ) -> Box + Send> { - self.as_graph().edge_refs_window(t_start, t_end, layer) - } - - fn vertex_edges( - &self, - v: LocalVertexRef, - d: Direction, - layer: Option, - ) -> Box + Send> { - self.as_graph().vertex_edges(v, d, layer) - } - - fn vertex_edges_t( - &self, - v: LocalVertexRef, - d: Direction, - layer: Option, - ) -> Box + Send> { - self.as_graph().vertex_edges_t(v, d, layer) - } - - fn vertex_edges_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - d: Direction, - layer: Option, - ) -> Box + Send> { - self.as_graph() - .vertex_edges_window(v, t_start, t_end, d, layer) - } - - fn vertex_edges_window_t( - &self, - v: LocalVertexRef, - t_start: i64, - 
t_end: i64, - d: Direction, - layer: Option, - ) -> Box + Send> { - self.as_graph() - .vertex_edges_window_t(v, t_start, t_end, d, layer) - } - - fn neighbours( - &self, - v: LocalVertexRef, - d: Direction, - layer: Option, - ) -> Box + Send> { - self.as_graph().neighbours(v, d, layer) - } - - fn neighbours_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - d: Direction, - layer: Option, - ) -> Box + Send> { - self.as_graph() - .neighbours_window(v, t_start, t_end, d, layer) - } - - fn static_vertex_prop(&self, v: LocalVertexRef, name: String) -> Option { - self.as_graph().static_vertex_prop(v, name) - } - - fn static_vertex_prop_names(&self, v: LocalVertexRef) -> Vec { - self.as_graph().static_vertex_prop_names(v) - } - - fn temporal_vertex_prop_names(&self, v: LocalVertexRef) -> Vec { - self.as_graph().temporal_vertex_prop_names(v) - } - - fn temporal_vertex_prop_vec(&self, v: LocalVertexRef, name: String) -> Vec<(i64, Prop)> { - self.as_graph().temporal_vertex_prop_vec(v, name) - } - - fn vertex_timestamps(&self, v: LocalVertexRef) -> Vec { - self.as_graph().vertex_timestamps(v) - } - - fn vertex_timestamps_window(&self, v: LocalVertexRef, t_start: i64, t_end: i64) -> Vec { - self.as_graph().vertex_timestamps_window(v, t_start, t_end) - } - - fn temporal_vertex_prop_vec_window( - &self, - v: LocalVertexRef, - name: String, - t_start: i64, - t_end: i64, - ) -> Vec<(i64, Prop)> { - self.as_graph() - .temporal_vertex_prop_vec_window(v, name, t_start, t_end) - } - - fn temporal_vertex_props(&self, v: LocalVertexRef) -> HashMap> { - self.as_graph().temporal_vertex_props(v) - } - - fn temporal_vertex_props_window( - &self, - v: LocalVertexRef, - t_start: i64, - t_end: i64, - ) -> HashMap> { - self.as_graph() - .temporal_vertex_props_window(v, t_start, t_end) - } - - fn static_edge_prop(&self, e: EdgeRef, name: String) -> Option { - self.as_graph().static_edge_prop(e, name) - } - - fn static_edge_prop_names(&self, e: EdgeRef) -> Vec { - 
self.as_graph().static_edge_prop_names(e) - } - - fn temporal_edge_prop_names(&self, e: EdgeRef) -> Vec { - self.as_graph().temporal_edge_prop_names(e) - } - - fn temporal_edge_props_vec(&self, e: EdgeRef, name: String) -> Vec<(i64, Prop)> { - self.as_graph().temporal_edge_props_vec(e, name) - } - - fn temporal_edge_props_vec_window( - &self, - e: EdgeRef, - name: String, - t_start: i64, - t_end: i64, - ) -> Vec<(i64, Prop)> { - self.as_graph() - .temporal_edge_props_vec_window(e, name, t_start, t_end) - } - - fn edge_timestamps(&self, e: EdgeRef, window: Option>) -> Vec { - self.as_graph().edge_timestamps(e, window) - } - - fn temporal_edge_props(&self, e: EdgeRef) -> HashMap> { - self.as_graph().temporal_edge_props(e) - } - - fn temporal_edge_props_window( - &self, - e: EdgeRef, - t_start: i64, - t_end: i64, - ) -> HashMap> { - self.as_graph() - .temporal_edge_props_window(e, t_start, t_end) - } - - fn num_shards(&self) -> usize { - self.as_graph().num_shards() - } -} diff --git a/raphtory/src/db/view_api/layer.rs b/raphtory/src/db/view_api/layer.rs deleted file mode 100644 index 409af1e58d..0000000000 --- a/raphtory/src/db/view_api/layer.rs +++ /dev/null @@ -1,10 +0,0 @@ -/// Trait defining layer operations -pub trait LayerOps { - type LayeredViewType; - - /// Return a graph containing only the default edge layer - fn default_layer(&self) -> Self::LayeredViewType; - - /// Return a graph containing the layer `name` - fn layer(&self, name: &str) -> Option; -} diff --git a/raphtory/src/db/view_api/mod.rs b/raphtory/src/db/view_api/mod.rs deleted file mode 100644 index 7a61e4976c..0000000000 --- a/raphtory/src/db/view_api/mod.rs +++ /dev/null @@ -1,17 +0,0 @@ -//! Defines the `ViewApi` trait, which represents the API for querying a view of the graph. 
- -pub mod edge; -pub mod graph; -pub mod internal; -pub mod layer; -pub mod time; -pub mod vertex; - -pub use edge::EdgeListOps; -pub use edge::EdgeViewOps; -pub use graph::GraphViewOps; -pub use time::TimeOps; -pub use vertex::VertexListOps; -pub use vertex::VertexViewOps; - -pub type BoxedIter = Box + Send>; diff --git a/raphtory-io/src/graph_loader/example/company_house.rs b/raphtory/src/graph_loader/example/company_house.rs similarity index 55% rename from raphtory-io/src/graph_loader/example/company_house.rs rename to raphtory/src/graph_loader/example/company_house.rs index 9e39a2e82d..5473b94260 100644 --- a/raphtory-io/src/graph_loader/example/company_house.rs +++ b/raphtory/src/graph_loader/example/company_house.rs @@ -1,12 +1,7 @@ -use crate::graph_loader::source::csv_loader::CsvLoader; +use crate::{graph_loader::source::csv_loader::CsvLoader, prelude::*}; use chrono::NaiveDateTime; -use raphtory::core::Prop; -use raphtory::db::graph::Graph; -use raphtory::db::view_api::internal::GraphViewInternalOps; -use raphtory::db::view_api::{GraphViewOps, VertexViewOps}; use serde::Deserialize; -use std::path::PathBuf; -use std::{fs, time::Instant}; +use std::{fs, path::PathBuf, time::Instant}; #[derive(Deserialize, std::fmt::Debug)] pub struct CompanyHouse { @@ -14,10 +9,10 @@ pub struct CompanyHouse { pincode: String, company: String, owner: String, - illegal_hmo: Option + illegal_hmo: Option, } -pub fn company_house_graph(path: Option, num_shards: usize) -> Graph { +pub fn company_house_graph(path: Option) -> Graph { let default_data_dir: PathBuf = PathBuf::from("/tmp/company-house"); let data_dir = match path { @@ -43,11 +38,10 @@ pub fn company_house_graph(path: Option, num_shards: usize) -> Graph { .ok()?; println!( - "Loaded graph with {} shards from encoded data files {} with {} vertices, {} edges which took {} seconds", - g.num_shards(), + "Loaded graph from encoded data files {} with {} vertices, {} edges which took {} seconds", 
encoded_data_dir.to_str().unwrap(), - g.num_vertices(), - g.num_edges(), + g.count_vertices(), + g.count_edges(), now.elapsed().as_secs() ); @@ -58,7 +52,7 @@ pub fn company_house_graph(path: Option, num_shards: usize) -> Graph { } let g = restore_from_bincode(&encoded_data_dir).unwrap_or_else(|| { - let g = Graph::new(num_shards); + let g = Graph::new(); let now = Instant::now(); let ts = 1; @@ -67,7 +61,7 @@ pub fn company_house_graph(path: Option, num_shards: usize) -> Graph { .set_delimiter(",") .load_into_graph(&g, |company_house: CompanyHouse, g: &Graph| { let pincode = &company_house.pincode; - let address = company_house.address + ", " + pincode; + let address = format!("{}, {pincode}", company_house.address); let company = company_house.company; let owner = company_house.owner; // let illegal_flag : Option = match company_house.illegal_hmo { @@ -82,81 +76,71 @@ pub fn company_house_graph(path: Option, num_shards: usize) -> Graph { g.add_vertex( NaiveDateTime::from_timestamp_opt(ts, 0).unwrap(), owner.clone(), - &vec![], - ).expect("Failed to add vertex"); - - g.add_vertex_properties(owner.clone(), &vec![ - ("type".into(), Prop::Str("owner".into())) - ]) - .expect("Failed to add vertex static property"); + NO_PROPS, + ) + .expect("Failed to add vertex") + .add_constant_properties([("type", "owner")]) + .expect("Failed to add vertex static property"); - g.add_vertex( NaiveDateTime::from_timestamp_opt(ts, 0).unwrap(), company.clone(), - &vec![], - ).expect("Failed to add vertex"); - - g.add_vertex_properties(company.clone(), &vec![ - ("type".into(), Prop::Str("company".into())), - ("flag".into(), Prop::Str(company_house.illegal_hmo.clone().unwrap_or("None".into()))) - ]) - .expect("Failed to add vertex static property"); + NO_PROPS, + ) + .expect("Failed to add vertex") + .add_constant_properties([ + ("type", "company".into_prop()), + ( + "flag", + (company_house.illegal_hmo.clone().unwrap_or("None".into())).into_prop(), + ), + ]) + .expect("Failed to add 
vertex static property"); g.add_vertex( NaiveDateTime::from_timestamp_opt(ts, 0).unwrap(), address.clone(), - &vec![], - ).expect("Failed to add vertex"); - - g.add_vertex_properties(address.clone(), &vec![ - ("type".into(), Prop::Str("address".into())), - ("flag".into(), Prop::Str(company_house.illegal_hmo.clone().unwrap_or("None".into()))) - ]) - .expect("Failed to add vertex static property"); + NO_PROPS, + ) + .expect("Failed to add vertex") + .add_constant_properties([ + ("type", "address".into_prop()), + ( + "flag", + (company_house.illegal_hmo.clone().unwrap_or("None".into())).into_prop(), + ), + ]) + .expect("Failed to add vertex static property"); g.add_edge( NaiveDateTime::from_timestamp_opt(ts, 0).unwrap(), owner.clone(), company.clone(), - &vec![], + NO_PROPS, Some(pincode), ) - .expect("Failed to add edge"); - - g.add_edge_properties( - owner, - company.clone(), - &vec![("rel".into(), Prop::Str("owns".into()))], - Some(pincode), - ) - .expect("Failed to add edge static property"); + .expect("Failed to add edge") + .add_constant_properties([("rel", "owns")], Some(pincode)) + .expect("Failed to add edge static property"); g.add_edge( NaiveDateTime::from_timestamp_opt(ts, 0).unwrap(), company.clone(), address.clone(), - &vec![], - None, - ) - .expect("Failed to add edge"); - - g.add_edge_properties( - company, - address, - &vec![("rel".into(), Prop::Str("owns".into()))], + NO_PROPS, None, ) - .expect("Failed to add edge static property"); + .expect("Failed to add edge") + .add_constant_properties([("rel", "owns")], None) + .expect("Failed to add edge static property"); }) .expect("Failed to load graph from CSV data files"); println!( - "Loaded graph with {} shards from CSV data files {} with {} vertices, {} edges which took {} seconds", - g.num_shards(), + "Loaded graph from CSV data files {} with {} vertices, {} edges which took {} seconds", encoded_data_dir.to_str().unwrap(), - g.num_vertices(), - g.num_edges(), + g.count_vertices(), + g.count_edges(), 
now.elapsed().as_secs() ); @@ -172,15 +156,12 @@ pub fn company_house_graph(path: Option, num_shards: usize) -> Graph { #[cfg(test)] mod company_house_graph_test { use super::*; - use raphtory::db::view_api::{TimeOps, VertexViewOps}; + use crate::db::api::view::{TimeOps, VertexViewOps}; #[test] #[ignore] fn test_ch_load() { - let g = company_house_graph( - None, - 1, - ); + let g = company_house_graph(None); assert_eq!(g.start().unwrap(), 1000); assert_eq!(g.end().unwrap(), 1001); g.window(1000, 1001) diff --git a/raphtory-io/src/graph_loader/example/lotr_graph.rs b/raphtory/src/graph_loader/example/lotr_graph.rs similarity index 75% rename from raphtory-io/src/graph_loader/example/lotr_graph.rs rename to raphtory/src/graph_loader/example/lotr_graph.rs index e33c3d3701..20ff674e49 100644 --- a/raphtory-io/src/graph_loader/example/lotr_graph.rs +++ b/raphtory/src/graph_loader/example/lotr_graph.rs @@ -13,20 +13,18 @@ //! //! Example: //! ```rust -//! use raphtory_io::graph_loader::example::lotr_graph::lotr_graph; -//! use raphtory::db::graph::Graph; -//! use raphtory::db::view_api::*; +//! use raphtory::graph_loader::example::lotr_graph::lotr_graph; +//! use raphtory::prelude::*; //! -//! let graph = lotr_graph(1); +//! let graph = lotr_graph(); //! -//! println!("The graph has {:?} vertices", graph.num_vertices()); -//! println!("The graph has {:?} edges", graph.num_edges()); +//! println!("The graph has {:?} vertices", graph.count_vertices()); +//! println!("The graph has {:?} edges", graph.count_edges()); //! 
``` -use raphtory::db::graph::Graph; - -use crate::graph_loader::fetch_file; - -use crate::graph_loader::source::csv_loader::CsvLoader; +use crate::{ + graph_loader::{fetch_file, source::csv_loader::CsvLoader}, + prelude::*, +}; use serde::Deserialize; use std::path::PathBuf; @@ -60,9 +58,9 @@ pub fn lotr_file() -> Result> { /// /// # Returns /// - A Graph containing the LOTR dataset -pub fn lotr_graph(shards: usize) -> Graph { +pub fn lotr_graph() -> Graph { let graph = { - let g = Graph::new(shards); + let g = Graph::new(); CsvLoader::new(lotr_file().unwrap()) .load_into_graph(&g, |lotr: Lotr, g: &Graph| { @@ -70,13 +68,13 @@ pub fn lotr_graph(shards: usize) -> Graph { let dst_id = lotr.dst_id; let time = lotr.time; - g.add_vertex(time, src_id.clone(), &vec![]) + g.add_vertex(time, src_id.clone(), NO_PROPS) .map_err(|err| println!("{:?}", err)) .ok(); - g.add_vertex(time, dst_id.clone(), &vec![]) + g.add_vertex(time, dst_id.clone(), NO_PROPS) .map_err(|err| println!("{:?}", err)) .ok(); - g.add_edge(time, src_id.clone(), dst_id.clone(), &vec![], None) + g.add_edge(time, src_id.clone(), dst_id.clone(), NO_PROPS, None) .expect("Error: Unable to add edge"); }) .expect("Failed to load graph from CSV data files"); diff --git a/raphtory-io/src/graph_loader/example/mod.rs b/raphtory/src/graph_loader/example/mod.rs similarity index 100% rename from raphtory-io/src/graph_loader/example/mod.rs rename to raphtory/src/graph_loader/example/mod.rs diff --git a/raphtory-io/src/graph_loader/example/neo4j_examples.rs b/raphtory/src/graph_loader/example/neo4j_examples.rs similarity index 62% rename from raphtory-io/src/graph_loader/example/neo4j_examples.rs rename to raphtory/src/graph_loader/example/neo4j_examples.rs index 467ae1e426..6bf70d13cf 100644 --- a/raphtory-io/src/graph_loader/example/neo4j_examples.rs +++ b/raphtory/src/graph_loader/example/neo4j_examples.rs @@ -1,7 +1,9 @@ -use crate::graph_loader::source::neo4j_loader::Neo4JConnection; +use crate::{ + 
db::{api::mutation::AdditionOps, graph::graph as rap}, + graph_loader::source::neo4j_loader::Neo4JConnection, + prelude::{IntoProp, NO_PROPS}, +}; use neo4rs::*; -use raphtory::core::Prop; -use raphtory::db::graph as rap; fn load_movies(row: Row, graph: &rap::Graph) { let film: Node = row.get("film").unwrap(); @@ -17,32 +19,24 @@ fn load_movies(row: Row, graph: &rap::Graph) { let relation_type = relation.typ(); graph - .add_vertex(actor_born, actor_name.clone(), &vec![]) + .add_vertex(actor_born, actor_name.clone(), NO_PROPS) + .unwrap() + .add_constant_properties([("type", "actor")]) .unwrap(); graph - .add_vertex_properties( - actor_name.clone(), - &vec![("type".into(), Prop::Str("actor".into()))], - ) - .unwrap(); - graph - .add_vertex(film_release, film_title.clone(), &vec![]) - .unwrap(); - graph - .add_vertex_properties( - film_title.clone(), - &vec![ - ("type".into(), Prop::Str("film".into())), - ("tagline".into(), Prop::Str(film_tagline)), - ], - ) + .add_vertex(film_release, film_title.clone(), NO_PROPS) + .unwrap() + .add_constant_properties([ + ("type", "film".into_prop()), + ("tagline", film_tagline.into_prop()), + ]) .unwrap(); graph .add_edge( film_release, actor_name, film_title, - &vec![], + NO_PROPS, Some(relation_type.as_str()), ) .unwrap(); @@ -53,9 +47,8 @@ pub async fn neo4j_movie_graph( username: String, password: String, database: String, - shards: usize, ) -> rap::Graph { - let g = rap::Graph::new(shards); + let g = rap::Graph::new(); let neo = Neo4JConnection::new(uri, username, password, database) .await .unwrap(); diff --git a/raphtory-io/src/graph_loader/example/reddit_hyperlinks.rs b/raphtory/src/graph_loader/example/reddit_hyperlinks.rs similarity index 81% rename from raphtory-io/src/graph_loader/example/reddit_hyperlinks.rs rename to raphtory/src/graph_loader/example/reddit_hyperlinks.rs index 597bed9392..e9c18f7395 100644 --- a/raphtory-io/src/graph_loader/example/reddit_hyperlinks.rs +++ 
b/raphtory/src/graph_loader/example/reddit_hyperlinks.rs @@ -29,25 +29,23 @@ //! //! Example: //! ```no_run -//! use raphtory_io::graph_loader::example::reddit_hyperlinks::reddit_graph; -//! use raphtory::db::graph::Graph; -//! use raphtory::db::view_api::*; +//! use raphtory::graph_loader::example::reddit_hyperlinks::reddit_graph; +//! use raphtory::prelude::*; //! -//! let graph = reddit_graph(1, 120, false); +//! let graph = reddit_graph(120, false); //! -//! println!("The graph has {:?} vertices", graph.num_vertices()); -//! println!("The graph has {:?} edges", graph.num_edges()); +//! println!("The graph has {:?} vertices", graph.count_vertices()); +//! println!("The graph has {:?} edges", graph.count_edges()); //! ``` -use crate::graph_loader::fetch_file; +use crate::{core::Prop, db::api::mutation::AdditionOps, graph_loader::fetch_file, prelude::*}; use chrono::*; use itertools::Itertools; -use raphtory::core::Prop; -use raphtory::db::graph::Graph; -use std::fs::File; -use std::io::{self, BufRead}; -use std::path::Path; -use std::path::PathBuf; +use std::{ + fs::File, + io::{self, BufRead}, + path::{Path, PathBuf}, +}; /// Download the dataset and return the path to the file /// # Arguments @@ -68,7 +66,7 @@ pub fn reddit_file( _ => fetch_file( "reddit-title.tsv", true, - "http://snap.stanford.edu/data/soc-redditHyperlinks-title.tsv", + "http://web.archive.org/web/20201107005944/http://snap.stanford.edu/data/soc-redditHyperlinks-title.tsv", timeout, ), } @@ -87,15 +85,14 @@ where /// /// # Arguments /// -/// * `shards` - The number of shards to use for the graph /// * `timeout` - The timeout in seconds for downloading the dataset /// /// # Returns /// /// * `Graph` - The graph containing the Reddit hyperlinks dataset -pub fn reddit_graph(shards: usize, timeout: u64, test_file: bool) -> Graph { +pub fn reddit_graph(timeout: u64, test_file: bool) -> Graph { let graph = { - let g = Graph::new(shards); + let g = Graph::new(); if let Ok(path) = 
reddit_file(timeout, Some(test_file)) { if let Ok(lines) = read_lines(path.as_path()) { @@ -114,9 +111,9 @@ pub fn reddit_graph(shards: usize, timeout: u64, test_file: bool) -> Graph { .split(',') .map(|s| s.parse::().unwrap()) .collect(); - let edge_properties = &vec![ + let edge_properties = [ ("post_label".to_string(), Prop::I32(post_label)), - ("post_id".to_string(), Prop::Str(post_id)), + ("post_id".to_string(), Prop::str(post_id)), ("word_count".to_string(), Prop::F64(post_properties[7])), ("long_words".to_string(), Prop::F64(post_properties[9])), ("sentences".to_string(), Prop::F64(post_properties[13])), @@ -134,10 +131,10 @@ pub fn reddit_graph(shards: usize, timeout: u64, test_file: bool) -> Graph { Prop::F64(post_properties[20]), ), ]; - g.add_vertex(time, *src_id, &vec![]) + g.add_vertex(time, *src_id, NO_PROPS) .map_err(|err| println!("{:?}", err)) .ok(); - g.add_vertex(time, *dst_id, &vec![]) + g.add_vertex(time, *dst_id, NO_PROPS) .map_err(|err| println!("{:?}", err)) .ok(); g.add_edge(time, *src_id, *dst_id, edge_properties, None) @@ -158,8 +155,10 @@ pub fn reddit_graph(shards: usize, timeout: u64, test_file: bool) -> Graph { #[cfg(test)] mod reddit_test { - use crate::graph_loader::example::reddit_hyperlinks::{reddit_file, reddit_graph}; - use raphtory::db::view_api::GraphViewOps; + use crate::{ + db::api::view::*, + graph_loader::example::reddit_hyperlinks::{reddit_file, reddit_graph}, + }; #[test] fn check_data() { @@ -169,8 +168,8 @@ mod reddit_test { #[test] fn check_graph() { - let graph = reddit_graph(1, 100, true); - assert_eq!(graph.num_vertices(), 16); - assert_eq!(graph.num_edges(), 9); + let graph = reddit_graph(100, true); + assert_eq!(graph.count_vertices(), 16); + assert_eq!(graph.count_edges(), 9); } } diff --git a/raphtory-io/src/graph_loader/example/stable_coins.rs b/raphtory/src/graph_loader/example/stable_coins.rs similarity index 74% rename from raphtory-io/src/graph_loader/example/stable_coins.rs rename to 
raphtory/src/graph_loader/example/stable_coins.rs index 920de9250b..4dc3d7c547 100644 --- a/raphtory-io/src/graph_loader/example/stable_coins.rs +++ b/raphtory/src/graph_loader/example/stable_coins.rs @@ -1,19 +1,13 @@ -use crate::graph_loader::source::csv_loader::CsvLoader; +use crate::{ + graph_loader::{fetch_file, source::csv_loader::CsvLoader, unzip_file}, + prelude::*, +}; use chrono::NaiveDateTime; -use raphtory::core::Prop; -use raphtory::db::graph::Graph; -use raphtory::db::view_api::internal::GraphViewInternalOps; -use raphtory::db::view_api::GraphViewOps; -use serde::Deserialize; -use std::collections::HashMap; -use std::fs::File; -use std::io::{copy, Cursor}; -use std::path::{Path, PathBuf}; -use std::time::Duration; -use std::{fs, time::Instant}; use regex::Regex; -use crate::graph_loader::{fetch_file, unzip_file}; +use serde::Deserialize; +use std::{collections::HashMap, fs, path::PathBuf, time::Instant}; +#[allow(dead_code)] #[derive(Deserialize, std::fmt::Debug)] pub struct StableCoin { block_number: String, @@ -25,7 +19,7 @@ pub struct StableCoin { value: f64, } -pub fn stable_coin_graph(path: Option, subset:bool, num_shards: usize) -> Graph { +pub fn stable_coin_graph(path: Option, subset: bool) -> Graph { let data_dir = match path { Some(path) => PathBuf::from(path), None => PathBuf::from("/tmp/stablecoin"), @@ -33,7 +27,7 @@ pub fn stable_coin_graph(path: Option, subset:bool, num_shards: usize) - if !data_dir.join("token_transfers.csv").exists() { let dir_str = data_dir.to_str().unwrap(); - let zip_path =data_dir.join("ERC20-stablecoins.zip"); + let zip_path = data_dir.join("ERC20-stablecoins.zip"); let zip_str = zip_path.to_str().unwrap(); fs::create_dir_all(dir_str).expect(&format!("Failed to create directory {}", dir_str)); fetch_file(zip_str,false,"https://snap.stanford.edu/data/ERC20-stablecoins.zip",600000).expect("Failed to fetch stable coin data: https://snap.stanford.edu/data/ERC20-stablecoins.zip"); @@ -53,11 +47,10 @@ pub fn 
stable_coin_graph(path: Option, subset:bool, num_shards: usize) - .ok()?; println!( - "Loaded graph with {} shards from encoded data files {} with {} vertices, {} edges which took {} seconds", - g.num_shards(), + "Loaded graph from encoded data files {} with {} vertices, {} edges which took {} seconds", encoded_data_dir.to_str().unwrap(), - g.num_vertices(), - g.num_edges(), + g.count_vertices(), + g.count_edges(), now.elapsed().as_secs() ); @@ -69,7 +62,7 @@ pub fn stable_coin_graph(path: Option, subset:bool, num_shards: usize) - let encoded_data_dir = data_dir.join("graphdb.bincode"); let g = restore_from_bincode(&encoded_data_dir).unwrap_or_else(|| { - let g = Graph::new(num_shards); + let g = Graph::new(); let now = Instant::now(); let contract_addr_labels = HashMap::from([ @@ -83,10 +76,8 @@ pub fn stable_coin_graph(path: Option, subset:bool, num_shards: usize) - let re = if subset { Regex::new(r"token_transfers.csv").unwrap() - } - else{ + } else { Regex::new(r"token_transfers(_V\d+\.\d+\.\d+)?\.csv").unwrap() - }; CsvLoader::new(data_dir) .with_filter(re) @@ -99,7 +90,7 @@ pub fn stable_coin_graph(path: Option, subset:bool, num_shards: usize) - NaiveDateTime::from_timestamp_opt(stablecoin.time_stamp, 0).unwrap(), stablecoin.from_address, stablecoin.to_address, - &vec![("value".into(), Prop::F64(stablecoin.value.into()))], + [("value", stablecoin.value)], Some(label), ) .expect("Failed to add edge"); @@ -107,11 +98,10 @@ pub fn stable_coin_graph(path: Option, subset:bool, num_shards: usize) - .expect("Failed to load graph from CSV data files"); println!( - "Loaded graph with {} shards from CSV data files {} with {} vertices, {} edges which took {} seconds", - g.num_shards(), + "Loaded graph from CSV data files {} with {} vertices, {} edges which took {} seconds", encoded_data_dir.to_str().unwrap(), - g.num_vertices(), - g.num_edges(), + g.count_vertices(), + g.count_edges(), now.elapsed().as_secs() ); diff --git 
a/raphtory-io/src/graph_loader/example/sx_superuser_graph.rs b/raphtory/src/graph_loader/example/sx_superuser_graph.rs similarity index 76% rename from raphtory-io/src/graph_loader/example/sx_superuser_graph.rs rename to raphtory/src/graph_loader/example/sx_superuser_graph.rs index b163353ace..0b293857d7 100644 --- a/raphtory-io/src/graph_loader/example/sx_superuser_graph.rs +++ b/raphtory/src/graph_loader/example/sx_superuser_graph.rs @@ -36,19 +36,19 @@ //! //! Example: //! ```no_run -//! use raphtory_io::graph_loader::example::sx_superuser_graph::sx_superuser_graph; -//! use raphtory::db::graph::Graph; -//! use raphtory::db::view_api::*; +//! use raphtory::graph_loader::example::sx_superuser_graph::sx_superuser_graph; +//! use raphtory::prelude::*; //! -//! let graph = sx_superuser_graph(1).unwrap(); +//! let graph = sx_superuser_graph().unwrap(); //! -//! println!("The graph has {:?} vertices", graph.num_vertices()); -//! println!("The graph has {:?} edges", graph.num_edges()); +//! println!("The graph has {:?} vertices", graph.count_vertices()); +//! println!("The graph has {:?} edges", graph.count_edges()); //! ``` -use raphtory::db::graph::Graph; - -use crate::graph_loader::{fetch_file, source::csv_loader::CsvLoader}; +use crate::{ + graph_loader::{fetch_file, source::csv_loader::CsvLoader}, + prelude::*, +}; use serde::Deserialize; use std::path::PathBuf; @@ -68,7 +68,7 @@ pub fn sx_superuser_file() -> Result> { fetch_file( "sx-superuser.txt.gz", true, - "https://snap.stanford.edu/data/sx-superuser.txt.gz", + "http://web.archive.org/web/20230309171639/https://snap.stanford.edu/data/sx-superuser.txt.gz", 600, ) } @@ -82,12 +82,12 @@ pub fn sx_superuser_file() -> Result> { /// # Returns /// /// - A Result containing the graph or an error -pub fn sx_superuser_graph(shards: usize) -> Result> { - let graph = Graph::new(shards); +pub fn sx_superuser_graph() -> Result> { + let graph = Graph::new(); CsvLoader::new(sx_superuser_file()?) 
.set_delimiter(" ") .load_into_graph(&graph, |edge: TEdge, g: &Graph| { - g.add_edge(edge.time, edge.src_id, edge.dst_id, &vec![], None) + g.add_edge(edge.time, edge.src_id, edge.dst_id, NO_PROPS, None) .expect("Error: Unable to add edge"); })?; @@ -99,13 +99,15 @@ mod sx_superuser_test { use crate::graph_loader::example::sx_superuser_graph::{sx_superuser_file, sx_superuser_graph}; #[test] + #[ignore] // don't hit SNAP by default fn test_download_works() { let file = sx_superuser_file().unwrap(); assert!(file.is_file()) } #[test] + #[ignore] // don't hit SNAP by default FIXME: add a truncated test file for this one? fn test_graph_loading_works() { - sx_superuser_graph(2).unwrap(); + sx_superuser_graph().unwrap(); } } diff --git a/raphtory-io/src/graph_loader/mod.rs b/raphtory/src/graph_loader/mod.rs similarity index 64% rename from raphtory-io/src/graph_loader/mod.rs rename to raphtory/src/graph_loader/mod.rs index 737a9f7796..fd0a4b6a74 100644 --- a/raphtory-io/src/graph_loader/mod.rs +++ b/raphtory/src/graph_loader/mod.rs @@ -1,11 +1,87 @@ -//! `GraphLoader` trait and provides some default implementations for loading a graph. +//! Module for loading graphs into raphtory from various sources, like csv, neo4j, etc. +//! +//! Provides the `GraphLoader` trait and some default implementations for loading a graph. //! This base class is used to load in-built graphs such as the LOTR, reddit and StackOverflow. //! It also provides a method to download a CSV file. //! -//! # Example +//! # Examples +//! +//! Load a pre-built graph +//! ```rust +//! use raphtory::algorithms::degree::average_degree; +//! use raphtory::prelude::*; +//! use raphtory::graph_loader::example::lotr_graph::lotr_graph; +//! +//! let graph = lotr_graph(); +//! +//! // Get the in-degree, out-degree of Gandalf +//! // The graph.vertex option returns a result of an option, +//! // so we need to unwrap the result and the option or +//! // we can use this if let instead +//! 
if let Some(gandalf) = graph.vertex("Gandalf") { +//! println!("Gandalf in degree: {:?}", gandalf.in_degree()); +//! println!("Gandalf out degree: {:?}", gandalf.out_degree()); +//! } +//! +//! // Run an average degree algorithm on the graph +//! println!("Average degree: {:?}", average_degree(&graph)); +//! ``` +//! +//! Load a graph from csv +//! +//! ```no_run +//! use std::time::Instant; +//! use serde::Deserialize; +//! use raphtory::graph_loader::source::csv_loader::CsvLoader; +//! use raphtory::prelude::*; +//! +//! let data_dir = "/tmp/lotr.csv"; +//! +//! #[derive(Deserialize, std::fmt::Debug)] +//! pub struct Lotr { +//! src_id: String, +//! dst_id: String, +//! time: i64, +//! } +//! +//! let g = Graph::new(); +//! let now = Instant::now(); +//! +//! CsvLoader::new(data_dir) +//! .load_into_graph(&g, |lotr: Lotr, g: &Graph| { +//! g.add_vertex( +//! lotr.time, +//! lotr.src_id.clone(), +//! [("type", Prop::str("Character"))], +//! ) +//! .expect("Failed to add vertex"); +//! +//! g.add_vertex( +//! lotr.time, +//! lotr.dst_id.clone(), +//! [("type", Prop::str("Character"))], +//! ) +//! .expect("Failed to add vertex"); +//! +//! g.add_edge( +//! lotr.time, +//! lotr.src_id.clone(), +//! lotr.dst_id.clone(), +//! [( +//! "type", +//! Prop::str("Character Co-occurrence"), +//! )], +//! None, +//! ) +//! .expect("Failed to add edge"); +//! }) +//! .expect("Failed to load graph from CSV data files"); +//! ``` +//! +//! download a file without creating the graph //! //! ```rust -//! use raphtory_io::graph_loader::fetch_file; +//! use raphtory::graph_loader::fetch_file; //! //! let path = fetch_file( //! "lotr.csv", @@ -17,38 +93,36 @@ //! // check if a file exists at the path //! assert!(path.is_ok()); //! ``` -//! 
-use std::env; -use std::fs::File; -use std::io::{copy, Cursor}; -use std::path::{Path, PathBuf}; -use std::time::Duration; -use std::io::prelude::*; -use zip::read::{ZipArchive, ZipFile}; -use std::fs::*; +use std::{ + env, + fs::{File, *}, + io::{copy, Cursor}, + path::{Path, PathBuf}, + time::Duration, +}; +use zip::read::ZipArchive; pub mod example; pub mod source; pub fn fetch_file( name: &str, - tmp_save:bool, + tmp_save: bool, url: &str, timeout: u64, ) -> Result> { let filepath = if tmp_save { let tmp_dir = env::temp_dir(); tmp_dir.join(name) - } - else { + } else { PathBuf::from(name) }; if !filepath.exists() { let client = reqwest::blocking::Client::builder() .timeout(Duration::from_secs(timeout)) .build()?; - let response = client.get(url).send()?; + let response = client.get(url).send()?.error_for_status()?; let mut content = Cursor::new(response.bytes()?); if !filepath.exists() { let mut file = File::create(&filepath)?; @@ -58,7 +132,6 @@ pub fn fetch_file( Ok(filepath) } - fn unzip_file(zip_file_path: &str, destination_path: &str) -> std::io::Result<()> { let file = File::open(zip_file_path)?; let mut archive = ZipArchive::new(file)?; @@ -73,7 +146,7 @@ fn unzip_file(zip_file_path: &str, destination_path: &str) -> std::io::Result<() } else { if let Some(parent) = Path::new(&dest_path).parent() { if !parent.exists() { - create_dir_all(&parent)?; + create_dir_all(&parent)?; } } let mut output_file = File::create(&dest_path)?; @@ -84,23 +157,10 @@ fn unzip_file(zip_file_path: &str, destination_path: &str) -> std::io::Result<() Ok(()) } - - - #[cfg(test)] mod graph_loader_test { + use crate::{core::utils::hashing, graph_loader::fetch_file, prelude::*}; use csv::StringRecord; - use raphtory::{ - core::{utils, Prop}, - db::{ - graph::Graph, - view_api::{GraphViewOps, TimeOps, VertexViewOps}, - }, - }; - - use crate::graph_loader::{fetch_file, unzip_file}; - use crate::graph_loader::example::stable_coins::stable_coin_graph; - #[test] fn test_fetch_file() { 
@@ -115,13 +175,13 @@ mod graph_loader_test { #[test] fn test_lotr_load_graph() { - let g = crate::graph_loader::example::lotr_graph::lotr_graph(4); - assert_eq!(g.num_edges(), 701); + let g = crate::graph_loader::example::lotr_graph::lotr_graph(); + assert_eq!(g.count_edges(), 701); } #[test] fn test_graph_at() { - let g = crate::graph_loader::example::lotr_graph::lotr_graph(1); + let g = crate::graph_loader::example::lotr_graph::lotr_graph(); let g_at_empty = g.at(1); let g_at_start = g.at(7059); @@ -129,16 +189,16 @@ mod graph_loader_test { let g_at_max = g.at(i64::MAX); let g_at_min = g.at(i64::MIN); - assert_eq!(g_at_empty.num_vertices(), 0); - assert_eq!(g_at_start.num_vertices(), 70); - assert_eq!(g_at_another.num_vertices(), 123); - assert_eq!(g_at_max.num_vertices(), 139); - assert_eq!(g_at_min.num_vertices(), 0); + assert_eq!(g_at_empty.count_vertices(), 0); + assert_eq!(g_at_start.count_vertices(), 70); + assert_eq!(g_at_another.count_vertices(), 123); + assert_eq!(g_at_max.count_vertices(), 139); + assert_eq!(g_at_min.count_vertices(), 0); } #[test] fn db_lotr() { - let g = Graph::new(4); + let g = Graph::new(); let data_dir = crate::graph_loader::example::lotr_graph::lotr_file() .expect("Failed to get lotr.csv file"); @@ -153,29 +213,18 @@ mod graph_loader_test { if let Ok(mut reader) = csv::Reader::from_path(data_dir) { for rec in reader.records().flatten() { if let Some((src, dst, t)) = parse_record(&rec) { - let src_id = utils::calculate_hash(&src); - let dst_id = utils::calculate_hash(&dst); + let src_id = hashing::calculate_hash(&src); + let dst_id = hashing::calculate_hash(&dst); - g.add_vertex( - t, - src_id, - &vec![("name".to_string(), Prop::Str("Character".to_string()))], - ) - .unwrap(); - g.add_vertex( - t, - dst_id, - &vec![("name".to_string(), Prop::Str("Character".to_string()))], - ) - .unwrap(); + g.add_vertex(t, src_id, [("name", Prop::str("Character"))]) + .unwrap(); + g.add_vertex(t, dst_id, [("name", Prop::str("Character"))]) + 
.unwrap(); g.add_edge( t, src_id, dst_id, - &vec![( - "name".to_string(), - Prop::Str("Character Co-occurrence".to_string()), - )], + [("name", Prop::str("Character Co-occurrence"))], None, ) .unwrap(); @@ -183,16 +232,16 @@ mod graph_loader_test { } } - let gandalf = utils::calculate_hash(&"Gandalf"); + let gandalf = hashing::calculate_hash(&"Gandalf"); assert!(g.has_vertex(gandalf)); assert!(g.has_vertex("Gandalf")) } #[test] fn test_all_degrees_window() { - let g = crate::graph_loader::example::lotr_graph::lotr_graph(4); + let g = crate::graph_loader::example::lotr_graph::lotr_graph(); - assert_eq!(g.num_edges(), 701); + assert_eq!(g.count_edges(), 701); assert_eq!(g.vertex("Gandalf").unwrap().degree(), 49); assert_eq!( g.vertex("Gandalf").unwrap().window(1356, 24792).degree(), @@ -215,9 +264,9 @@ mod graph_loader_test { #[test] fn test_all_neighbours_window() { - let g = crate::graph_loader::example::lotr_graph::lotr_graph(4); + let g = crate::graph_loader::example::lotr_graph::lotr_graph(); - assert_eq!(g.num_edges(), 701); + assert_eq!(g.count_edges(), 701); assert_eq!(g.vertex("Gandalf").unwrap().neighbours().iter().count(), 49); for v in g @@ -268,9 +317,9 @@ mod graph_loader_test { #[test] fn test_all_edges_window() { - let g = crate::graph_loader::example::lotr_graph::lotr_graph(4); + let g = crate::graph_loader::example::lotr_graph::lotr_graph(); - assert_eq!(g.num_edges(), 701); + assert_eq!(g.count_edges(), 701); assert_eq!(g.vertex("Gandalf").unwrap().edges().count(), 59); assert_eq!( g.vertex("Gandalf") diff --git a/raphtory-io/src/graph_loader/source/csv_loader.rs b/raphtory/src/graph_loader/source/csv_loader.rs similarity index 73% rename from raphtory-io/src/graph_loader/source/csv_loader.rs rename to raphtory/src/graph_loader/source/csv_loader.rs index 2ec34639f1..615eda1134 100644 --- a/raphtory-io/src/graph_loader/source/csv_loader.rs +++ b/raphtory/src/graph_loader/source/csv_loader.rs @@ -4,13 +4,12 @@ //! ```no_run //! 
use std::path::{Path, PathBuf}; //! use regex::Regex; -//! use raphtory::core::Prop; -//! use raphtory::core::utils::calculate_hash; -//! use raphtory_io::graph_loader::source::csv_loader::CsvLoader; -//! use raphtory::db::graph::Graph; -//! use raphtory_io::graph_loader::example::lotr_graph::Lotr; +//! use raphtory::core::utils::hashing::calculate_hash; +//! use raphtory::graph_loader::source::csv_loader::CsvLoader; +//! use raphtory::graph_loader::example::lotr_graph::Lotr; +//! use raphtory::prelude::*; //! -//! let g = Graph::new(2); +//! let g = Graph::new(); //! let csv_path: PathBuf = [env!("CARGO_MANIFEST_DIR"), "../../resource/"] //! .iter() //! .collect(); @@ -33,14 +32,14 @@ //! g.add_vertex( //! time, //! src_id, -//! &vec![("name".to_string(), Prop::Str("Character".to_string()))], +//! [("name", Prop::str("Character"))], //! ) //! .map_err(|err| println!("{:?}", err)) //! .ok(); //! g.add_vertex( //! time, //! dst_id, -//! &vec![("name".to_string(), Prop::Str("Character".to_string()))], +//! [("name", Prop::str("Character"))], //! ) //! .map_err(|err| println!("{:?}", err)) //! .ok(); @@ -48,9 +47,9 @@ //! time, //! src_id, //! dst_id, -//! &vec![( -//! "name".to_string(), -//! Prop::Str("Character Co-occurrence".to_string()), +//! [( +//! "name", +//! Prop::str("Character Co-occurrence"), //! )], //! None, //! ).expect("Failed to add edge"); @@ -61,18 +60,22 @@ /// Module for loading CSV files into a graph. 
use bzip2::read::BzDecoder; +use csv::StringRecord; use flate2; // 1.0 use flate2::read::GzDecoder; use rayon::prelude::*; use regex::Regex; use serde::de::DeserializeOwned; -use std::collections::VecDeque; -use std::error::Error; -use std::fmt::{Debug, Display, Formatter}; -use std::fs::File; -use std::io::BufReader; -use std::path::{Path, PathBuf}; -use std::{fs, io}; +use std::{ + collections::VecDeque, + error::Error, + fmt::{Debug, Display, Formatter}, + fs, + fs::File, + io, + io::BufReader, + path::{Path, PathBuf}, +}; #[derive(Debug)] pub enum CsvErr { @@ -123,6 +126,8 @@ pub struct CsvLoader { header: bool, /// The delimiter character used in the CSV file. delimiter: u8, + /// print the name of the file being loaded + print_file_name: bool, } impl CsvLoader { @@ -136,7 +141,7 @@ impl CsvLoader { /// /// ```no_run /// - /// use raphtory_io::graph_loader::source::csv_loader::CsvLoader; + /// use raphtory::graph_loader::source::csv_loader::CsvLoader; /// let loader = CsvLoader::new("/path/to/csv_file.csv"); /// ``` pub fn new>(p: P) -> Self { @@ -145,6 +150,7 @@ impl CsvLoader { regex_filter: None, header: false, delimiter: b',', + print_file_name: false, } } @@ -157,7 +163,7 @@ impl CsvLoader { /// # Example /// /// ```no_run - /// use raphtory_io::graph_loader::source::csv_loader::CsvLoader; + /// use raphtory::graph_loader::source::csv_loader::CsvLoader; /// let loader = CsvLoader::new("/path/to/csv_file.csv").set_header(true); /// ``` pub fn set_header(mut self, h: bool) -> Self { @@ -165,6 +171,22 @@ impl CsvLoader { self } + /// If set to true, prints the name of each file as it is loaded + /// + /// # Arguments + /// + /// * `p` - A boolean value indicating whether to print the name of each file as it is loaded. 
+ /// + /// # Example + /// ```no_run + /// use raphtory::graph_loader::source::csv_loader::CsvLoader; + /// let loader = CsvLoader::new("/path/to/csv_file.csv").set_print_file_name(true); + /// ``` + pub fn set_print_file_name(mut self, p: bool) -> Self { + self.print_file_name = p; + self + } + /// Sets the delimiter character used in the CSV file. /// /// # Arguments @@ -174,7 +196,7 @@ impl CsvLoader { /// # Example /// /// ```no_run - /// use raphtory_io::graph_loader::source::csv_loader::CsvLoader; + /// use raphtory::graph_loader::source::csv_loader::CsvLoader; /// let loader = CsvLoader::new("/path/to/csv_file.csv").set_delimiter("|"); /// ``` pub fn set_delimiter(mut self, d: &str) -> Self { @@ -192,7 +214,7 @@ impl CsvLoader { /// /// ```no_run /// use regex::Regex; - /// use raphtory_io::graph_loader::source::csv_loader::CsvLoader; + /// use raphtory::graph_loader::source::csv_loader::CsvLoader; /// /// let loader = CsvLoader::new("/path/to/csv_files") /// .with_filter(Regex::new(r"file_name_pattern").unwrap()); @@ -268,14 +290,12 @@ impl CsvLoader { while let Some(ref path) = queue.pop_back() { match fs::read_dir(path) { Ok(entries) => { - for entry in entries { - if let Ok(f_path) = entry { - let p = f_path.path(); - if Self::is_dir(&p)? { - queue.push_back(p.clone()) - } else { - self.accept_file(f_path.path(), &mut paths); - } + for f_path in entries.flatten() { + let p = f_path.path(); + if Self::is_dir(&p)? { + queue.push_back(p.clone()) + } else { + self.accept_file(f_path.path(), &mut paths); } } } @@ -321,6 +341,34 @@ impl CsvLoader { Ok(()) } + /// Load data from all CSV files in the directory into a graph. + /// + /// # Arguments + /// + /// * `g` - A reference to the graph object where the data should be loaded. + /// * `loader` - A closure that takes a deserialized record and the graph object as arguments and adds the record to the graph. 
+ /// + /// # Returns + /// + /// A Result containing an empty Ok value if the data is loaded successfully. + /// + /// # Errors + /// + /// An error of type CsvErr is returned if an I/O error occurs while reading the files or parsing the CSV data. + /// + pub fn load_rec_into_graph(&self, g: &G, loader: F) -> Result<(), CsvErr> + where + F: Fn(StringRecord, &G) + Send + Sync, + G: Sync, + { + //FIXME: loader function should return a result for reporting parsing errors + let paths = self.files_vec()?; + paths + .par_iter() + .try_for_each(move |path| self.load_file_into_graph_record(path, g, &loader))?; + Ok(()) + } + /// Loads a CSV file into a graph using the specified loader function. /// /// # Arguments @@ -344,7 +392,9 @@ impl CsvLoader { F: Fn(REC, &G), { let file_path: PathBuf = path.into(); - + if self.print_file_name { + println!("Loading file: {:?}", file_path); + } let mut csv_reader = self.csv_reader(file_path)?; let records_iter = csv_reader.deserialize::(); @@ -357,6 +407,26 @@ impl CsvLoader { Ok(()) } + fn load_file_into_graph_record + Debug, G>( + &self, + path: P, + g: &G, + loader: &F, + ) -> Result<(), CsvErr> + where + F: Fn(StringRecord, &G), + { + let file_path: PathBuf = path.into(); + + let mut csv_reader = self.csv_reader(file_path)?; + for rec in csv_reader.records() { + let record = rec?; + loader(record, g) + } + + Ok(()) + } + /// Returns a `csv::Reader` for the specified file path, automatically detecting and handling gzip and bzip compression. 
/// /// # Arguments @@ -402,10 +472,11 @@ impl CsvLoader { #[cfg(test)] mod csv_loader_test { - use crate::graph_loader::source::csv_loader::CsvLoader; - use raphtory::core::utils::calculate_hash; - use raphtory::core::Prop; - use raphtory::db::graph::Graph; + use crate::{ + core::utils::hashing::calculate_hash, graph_loader::source::csv_loader::CsvLoader, + prelude::*, + }; + use csv::StringRecord; use regex::Regex; use serde::Deserialize; use std::path::{Path, PathBuf}; @@ -449,28 +520,51 @@ mod csv_loader_test { let dst_id = calculate_hash(&lotr.dst_id); let time = lotr.time; - g.add_vertex( + g.add_vertex(time, src_id, [("name", Prop::str("Character"))]) + .map_err(|err| println!("{:?}", err)) + .ok(); + g.add_vertex(time, dst_id, [("name", Prop::str("Character"))]) + .map_err(|err| println!("{:?}", err)) + .ok(); + g.add_edge( time, src_id, - &vec![("name".to_string(), Prop::Str("Character".to_string()))], - ) - .map_err(|err| println!("{:?}", err)) - .ok(); - g.add_vertex( - time, dst_id, - &vec![("name".to_string(), Prop::Str("Character".to_string()))], + [("name", Prop::str("Character Co-occurrence"))], + None, ) - .map_err(|err| println!("{:?}", err)) - .ok(); + .unwrap(); + }) + .expect("Csv did not parse."); + } + + fn lotr_test_rec(g: Graph, csv_loader: CsvLoader, has_header: bool, delimiter: &str, r: Regex) { + csv_loader + .set_header(has_header) + .set_delimiter(delimiter) + .with_filter(r) + .load_rec_into_graph(&g, |lotr: StringRecord, g: &Graph| { + let src_id = lotr + .get(0) + .map(|s| calculate_hash(&(s.to_owned()))) + .unwrap(); + let dst_id = lotr + .get(1) + .map(|s| calculate_hash(&(s.to_owned()))) + .unwrap(); + let time = lotr.get(2).map(|s| s.parse::().unwrap()).unwrap(); + + g.add_vertex(time, src_id, [("name", Prop::str("Character"))]) + .map_err(|err| println!("{:?}", err)) + .ok(); + g.add_vertex(time, dst_id, [("name", Prop::str("Character"))]) + .map_err(|err| println!("{:?}", err)) + .ok(); g.add_edge( time, src_id, dst_id, - 
&vec![( - "name".to_string(), - Prop::Str("Character Co-occurrence".to_string()), - )], + [("name", Prop::str("Character Co-occurrence"))], None, ) .unwrap(); @@ -480,7 +574,7 @@ mod csv_loader_test { #[test] fn test_headers_flag_and_delimiter() { - let g = Graph::new(2); + let g = Graph::new(); // todo: move file path to data module let csv_path: PathBuf = [env!("CARGO_MANIFEST_DIR"), "../resource/"] .iter() @@ -492,12 +586,16 @@ mod csv_loader_test { let r = Regex::new(r".+(lotr.csv)").unwrap(); let delimiter = ","; lotr_test(g, csv_loader, has_header, delimiter, r); + let g = Graph::new(); + let csv_loader = CsvLoader::new(Path::new(&csv_path)); + let r = Regex::new(r".+(lotr.csv)").unwrap(); + lotr_test_rec(g, csv_loader, has_header, delimiter, r); } #[test] #[should_panic] fn test_wrong_header_flag_file_with_header() { - let g = Graph::new(2); + let g = Graph::new(); // todo: move file path to data module let csv_path: PathBuf = [env!("CARGO_MANIFEST_DIR"), "../../resource/"] .iter() @@ -512,7 +610,7 @@ mod csv_loader_test { #[test] #[should_panic] fn test_flag_has_header_but_file_has_no_header() { - let g = Graph::new(2); + let g = Graph::new(); // todo: move file path to data module let csv_path: PathBuf = [env!("CARGO_MANIFEST_DIR"), "../../resource/"] .iter() @@ -527,7 +625,7 @@ mod csv_loader_test { #[test] #[should_panic] fn test_wrong_header_names() { - let g = Graph::new(2); + let g = Graph::new(); // todo: move file path to data module let csv_path: PathBuf = [env!("CARGO_MANIFEST_DIR"), "../../resource/"] .iter() @@ -542,7 +640,7 @@ mod csv_loader_test { #[test] #[should_panic] fn test_wrong_delimiter() { - let g = Graph::new(2); + let g = Graph::new(); // todo: move file path to data module let csv_path: PathBuf = [env!("CARGO_MANIFEST_DIR"), "../../resource/"] .iter() diff --git a/raphtory-io/src/graph_loader/source/json_loader.rs b/raphtory/src/graph_loader/source/json_loader.rs similarity index 59% rename from 
raphtory-io/src/graph_loader/source/json_loader.rs rename to raphtory/src/graph_loader/source/json_loader.rs index 64609b53ae..4162445b5b 100644 --- a/raphtory-io/src/graph_loader/source/json_loader.rs +++ b/raphtory/src/graph_loader/source/json_loader.rs @@ -1,9 +1,21 @@ -use std::{io, path::{PathBuf, Path}, collections::VecDeque, fs, error::Error, fmt::{Display, Formatter}}; - -use raphtory::core::tgraph_shard::errors::GraphError; +use crate::core::utils::errors::GraphError; +use bzip2::read::BzDecoder; +use flate2; // 1.0 +use flate2::read::GzDecoder; +use rayon::prelude::*; use regex::Regex; use serde::de::DeserializeOwned; -use rayon::prelude::*; +use serde_json::{de::IoRead, Deserializer}; +use std::{ + collections::VecDeque, + error::Error, + fmt::{Display, Formatter}, + fs, + fs::File, + io, + io::BufReader, + path::{Path, PathBuf}, +}; #[derive(Debug)] pub enum JsonErr { @@ -12,7 +24,7 @@ pub enum JsonErr { /// A CSV parsing error that occurred while parsing the CSV data. JsonError(serde_json::Error), /// A GraphError that occurred while loading the CSV data into the graph. - GraphError(GraphError) + GraphError(GraphError), } impl From for JsonErr { @@ -60,18 +72,31 @@ pub struct JsonLinesLoader { /// Optional regex filter to select specific CSV files by name. regex_filter: Option, _a: std::marker::PhantomData, + /// print the name of the file being loaded + print_file_name: bool, } -impl JsonLinesLoader { +impl JsonLinesLoader { /// Creates a new CSV loader with the given path. pub fn new(path: PathBuf, regex_filter: Option) -> Self { Self { path, regex_filter, _a: std::marker::PhantomData, + print_file_name: false, } } + /// If set to true, prints the name of each file as it is loaded + /// + /// # Arguments + /// + /// * `p` - A boolean value indicating whether to print the name of each file as it is loaded. + /// + pub fn set_print_file_name(mut self, p: bool) -> Self { + self.print_file_name = p; + self + } /// Check if the provided path is a directory or not. 
/// @@ -139,14 +164,12 @@ impl JsonLinesLoade while let Some(ref path) = queue.pop_back() { match fs::read_dir(path) { Ok(entries) => { - for entry in entries { - if let Ok(f_path) = entry { - let p = f_path.path(); - if Self::is_dir(&p)? { - queue.push_back(p.clone()) - } else { - self.accept_file(f_path.path(), &mut paths); - } + for f_path in entries.flatten() { + let p = f_path.path(); + if Self::is_dir(&p)? { + queue.push_back(p.clone()) + } else { + self.accept_file(f_path.path(), &mut paths); } } } @@ -181,7 +204,7 @@ impl JsonLinesLoade pub fn load_into_graph(&self, g: &G, loader: F) -> Result<(), JsonErr> where REC: DeserializeOwned + std::fmt::Debug, - F: Fn(REC, &G)->Result<(), GraphError> + Send + Sync, + F: Fn(REC, &G) -> Result<(), GraphError> + Send + Sync, G: Sync, { //FIXME: loader function should return a result for reporting parsing errors @@ -192,6 +215,37 @@ impl JsonLinesLoade Ok(()) } + fn json_reader( + &self, + file_path: PathBuf, + ) -> Result>>>, JsonErr> { + let is_gziped = file_path + .file_name() + .and_then(|name| name.to_str()) + .filter(|name| name.ends_with(".gz")) + .is_some(); + + let is_bziped = file_path + .file_name() + .and_then(|name| name.to_str()) + .filter(|name| name.ends_with(".bz2")) + .is_some(); + + let f = File::open(&file_path)?; + + if is_gziped { + Ok(Deserializer::from_reader(BufReader::new(Box::new( + GzDecoder::new(f), + )))) + } else if is_bziped { + Ok(Deserializer::from_reader(BufReader::new(Box::new( + BzDecoder::new(f), + )))) + } else { + Ok(Deserializer::from_reader(BufReader::new(Box::new(f)))) + } + } + /// Loads a JSON file into a graph using the specified loader function. 
/// /// # Arguments @@ -214,17 +268,19 @@ impl JsonLinesLoade F: Fn(REC, &G) -> Result<(), GraphError>, { let file_path: PathBuf = path.into(); + if self.print_file_name { + println!("Loading file: {:?}", file_path); + } + + let json_reader = self.json_reader(file_path)?; - let json_reader = serde_json::Deserializer::from_reader(std::io::BufReader::new( - std::fs::File::open(file_path)?, - )); let records_iter = json_reader.into_iter::(); //TODO this needs better error handling for files without perfect data for rec in records_iter { if let Ok(record) = rec { loader(record, g)? - } else{ + } else { println!("Error parsing record: {:?}", rec); } } @@ -232,3 +288,66 @@ impl JsonLinesLoade Ok(()) } } + +#[cfg(test)] +mod tests { + use super::*; + use crate::prelude::*; + use bzip2::{write::BzEncoder, Compression as BzCompression}; + use flate2::{write::GzEncoder, Compression}; + use serde::Deserialize; + use std::{fs::File, io::Write}; + use tempfile::tempdir; + + #[derive(Debug, Deserialize)] + struct TestRecord { + name: String, + time: i64, + } + + fn test_json_rec(g: Graph, loader: JsonLinesLoader) { + loader + .load_into_graph(&g, |testrec: TestRecord, g: &Graph| { + let _ = g.add_vertex(testrec.time.clone(), testrec.name.clone(), NO_PROPS); + Ok(()) + }) + .expect("Unable to add vertex to graph"); + assert_eq!(g.count_vertices(), 3); + assert_eq!(g.count_edges(), 0); + let mut names = g.vertices().into_iter().name().collect::>(); + names.sort(); + assert_eq!(names, vec!["test", "testbz", "testgz"]); + } + + #[test] + fn test_load_into_graph() { + let dir = tempdir().unwrap(); + let plain_file = dir.path().join("test.json"); + let gzip_file = dir.path().join("test.json.gz"); + let bzip_file = dir.path().join("test.json.bz2"); + + // Create plain json file + File::create(&plain_file) + .unwrap() + .write_all(b"{\"name\": \"test\", \"time\": 1}\n") + .expect("unable to make plain file"); + + // Create gzip compressed json file + let f = 
File::create(&gzip_file).unwrap(); + let mut gz = GzEncoder::new(f, Compression::fast()); + gz.write_all(b"{\"name\": \"testgz\", \"time\": 2}\n") + .expect("unable to write to gz file"); + gz.finish().expect("Unable to write GZ file"); + + // Create bzip2 compressed json file + let f = File::create(&bzip_file).unwrap(); + let mut bz = BzEncoder::new(f, BzCompression::fast()); + bz.write_all(b"{\"name\": \"testbz\", \"time\": 3}\n") + .expect("unable to write to bz file"); + bz.finish().expect("Unable to write BZ file"); + + let g = Graph::new(); + let loader = JsonLinesLoader::::new(dir.path().to_path_buf(), None); + test_json_rec(g, loader); + } +} diff --git a/raphtory-io/src/graph_loader/source/mod.rs b/raphtory/src/graph_loader/source/mod.rs similarity index 73% rename from raphtory-io/src/graph_loader/source/mod.rs rename to raphtory/src/graph_loader/source/mod.rs index 150475e422..ea9fc4dc61 100644 --- a/raphtory-io/src/graph_loader/source/mod.rs +++ b/raphtory/src/graph_loader/source/mod.rs @@ -1,4 +1,3 @@ pub mod csv_loader; pub mod json_loader; pub mod neo4j_loader; -pub mod polars_loader; diff --git a/raphtory-io/src/graph_loader/source/neo4j_loader.rs b/raphtory/src/graph_loader/source/neo4j_loader.rs similarity index 78% rename from raphtory-io/src/graph_loader/source/neo4j_loader.rs rename to raphtory/src/graph_loader/source/neo4j_loader.rs index 406659e0df..f8646117e5 100644 --- a/raphtory-io/src/graph_loader/source/neo4j_loader.rs +++ b/raphtory/src/graph_loader/source/neo4j_loader.rs @@ -1,5 +1,5 @@ +use crate::db::graph::graph as rap; use neo4rs::*; -use raphtory::db::graph as rap; /// A struct that defines the Neo4J loader with configurable options. 
pub struct Neo4JConnection { // The created graph object given the arguments @@ -13,7 +13,7 @@ impl Neo4JConnection { password: String, database: String, ) -> Result { - let config = config() + let config = ConfigBuilder::default() .uri(uri.as_str()) .user(username.as_str()) .password(password.as_str()) @@ -24,11 +24,11 @@ impl Neo4JConnection { } pub async fn run(&self, query: Query) -> Result<()> { - Ok(self.neo_graph.run(query).await?) + self.neo_graph.run(query).await } pub async fn execute(&self, query: Query) -> Result { - Ok(self.neo_graph.execute(query).await?) + self.neo_graph.execute(query).await } pub async fn load_query_into_graph( @@ -48,11 +48,15 @@ impl Neo4JConnection { #[cfg(test)] mod neo_loader_test { - use crate::graph_loader::source::neo4j_loader::Neo4JConnection; + use crate::{ + db::{ + api::{mutation::AdditionOps, view::GraphViewOps}, + graph::graph as rap, + }, + graph_loader::source::neo4j_loader::Neo4JConnection, + prelude::{IntoProp, NO_PROPS}, + }; use neo4rs::*; - use raphtory::core::Prop; - use raphtory::db::graph as rap; - use raphtory::db::view_api::GraphViewOps; fn load_movies(row: Row, graph: &rap::Graph) { let film: Node = row.get("film").unwrap(); @@ -68,32 +72,24 @@ mod neo_loader_test { let relation_type = relation.typ(); graph - .add_vertex(actor_born, actor_name.clone(), &vec![]) + .add_vertex(actor_born, actor_name.clone(), NO_PROPS) + .unwrap() + .add_constant_properties([("type", "actor")]) .unwrap(); graph - .add_vertex_properties( - actor_name.clone(), - &vec![("type".into(), Prop::Str("actor".into()))], - ) - .unwrap(); - graph - .add_vertex(film_release, film_title.clone(), &vec![]) - .unwrap(); - graph - .add_vertex_properties( - film_title.clone(), - &vec![ - ("type".into(), Prop::Str("film".into())), - ("tagline".into(), Prop::Str(film_tagline)), - ], - ) + .add_vertex(film_release, film_title.clone(), NO_PROPS) + .unwrap() + .add_constant_properties([ + ("type", "film".into_prop()), + ("tagline", 
film_tagline.into_prop()), + ]) .unwrap(); graph .add_edge( film_release, actor_name, film_title, - &vec![], + NO_PROPS, Some(relation_type.as_str()), ) .unwrap(); @@ -110,7 +106,7 @@ mod neo_loader_test { ) .await .unwrap(); - let doc_graph = rap::Graph::new(1); + let doc_graph = rap::Graph::new(); neo.load_query_into_graph( &doc_graph, diff --git a/raphtory/src/graphgen/preferential_attachment.rs b/raphtory/src/graphgen/preferential_attachment.rs index 5a528d9b55..f1164ffdf8 100644 --- a/raphtory/src/graphgen/preferential_attachment.rs +++ b/raphtory/src/graphgen/preferential_attachment.rs @@ -5,15 +5,20 @@ //! # Examples //! //! ``` -//! use raphtory::db::graph::Graph; +//! use raphtory::prelude::*; //! use raphtory::graphgen::preferential_attachment::ba_preferential_attachment; //! -//! let graph = Graph::new(2); +//! let graph = Graph::new(); //! ba_preferential_attachment(&graph, 1000, 10); //! ``` -use crate::db::graph::Graph; -use crate::db::view_api::*; +use crate::{ + db::{ + api::{mutation::AdditionOps, view::*}, + graph::graph::Graph, + }, + prelude::NO_PROPS, +}; use rand::prelude::*; use std::collections::HashSet; @@ -37,10 +42,10 @@ use std::collections::HashSet; /// # Examples /// /// ``` -/// use raphtory::db::graph::Graph; +/// use raphtory::prelude::*; /// use raphtory::graphgen::preferential_attachment::ba_preferential_attachment; /// -/// let graph = Graph::new(2); +/// let graph = Graph::new(); /// ba_preferential_attachment(&graph, 1000, 10); /// ``` pub fn ba_preferential_attachment(graph: &Graph, vertices_to_add: usize, edges_per_step: usize) { @@ -60,17 +65,17 @@ pub fn ba_preferential_attachment(graph: &Graph, vertices_to_add: usize, edges_p while ids.len() < edges_per_step { max_id += 1; graph - .add_vertex(latest_time, max_id, &vec![]) + .add_vertex(latest_time, max_id, NO_PROPS) .map_err(|err| println!("{:?}", err)) .ok(); degrees.push(0); ids.push(max_id); } - if graph.num_edges() < edges_per_step { + if graph.count_edges() < 
edges_per_step { for pos in 1..ids.len() { graph - .add_edge(latest_time, ids[pos], ids[pos - 1], &vec![], None) + .add_edge(latest_time, ids[pos], ids[pos - 1], NO_PROPS, None) .expect("Not able to add edge"); edge_count += 2; degrees[pos] += 1; @@ -102,7 +107,7 @@ pub fn ba_preferential_attachment(graph: &Graph, vertices_to_add: usize, edges_p let dst = ids[pos]; degrees[pos] += 1; graph - .add_edge(latest_time, max_id, dst, &vec![], None) + .add_edge(latest_time, max_id, dst, NO_PROPS, None) .expect("Not able to add edge"); } ids.push(max_id); @@ -118,33 +123,33 @@ mod preferential_attachment_tests { use crate::graphgen::random_attachment::random_attachment; #[test] fn blank_graph() { - let graph = Graph::new(2); + let graph = Graph::new(); ba_preferential_attachment(&graph, 1000, 10); - assert_eq!(graph.num_edges(), 10009); - assert_eq!(graph.num_vertices(), 1010); + assert_eq!(graph.count_edges(), 10009); + assert_eq!(graph.count_vertices(), 1010); } #[test] fn only_nodes() { - let graph = Graph::new(2); + let graph = Graph::new(); for i in 0..10 { graph - .add_vertex(i, i as u64, &vec![]) + .add_vertex(i, i as u64, NO_PROPS) .map_err(|err| println!("{:?}", err)) .ok(); } ba_preferential_attachment(&graph, 1000, 5); - assert_eq!(graph.num_edges(), 5009); - assert_eq!(graph.num_vertices(), 1010); + assert_eq!(graph.count_edges(), 5009); + assert_eq!(graph.count_vertices(), 1010); } #[test] fn prior_graph() { - let graph = Graph::new(2); + let graph = Graph::new(); random_attachment(&graph, 1000, 3); ba_preferential_attachment(&graph, 500, 4); - assert_eq!(graph.num_edges(), 5000); - assert_eq!(graph.num_vertices(), 1503); + assert_eq!(graph.count_edges(), 5000); + assert_eq!(graph.count_vertices(), 1503); } } diff --git a/raphtory/src/graphgen/random_attachment.rs b/raphtory/src/graphgen/random_attachment.rs index 8e7e074ad4..c458ac355d 100644 --- a/raphtory/src/graphgen/random_attachment.rs +++ b/raphtory/src/graphgen/random_attachment.rs @@ -7,14 +7,19 @@ //! 
# Examples //! //! ``` -//! use raphtory::db::graph::Graph; +//! use raphtory::prelude::*; //! use raphtory::graphgen::random_attachment::random_attachment; -//! let graph = Graph::new(2); +//! let graph = Graph::new(); //! random_attachment(&graph, 1000, 10); //! ``` -use crate::db::graph::Graph; -use crate::db::view_api::*; +use crate::{ + db::{ + api::{mutation::AdditionOps, view::*}, + graph::graph::Graph, + }, + prelude::NO_PROPS, +}; use rand::seq::SliceRandom; /// Given a graph this function will add a user defined number of vertices, each with a @@ -34,9 +39,9 @@ use rand::seq::SliceRandom; /// # Examples /// /// ``` -/// use raphtory::db::graph::Graph; +/// use raphtory::prelude::*; /// use raphtory::graphgen::random_attachment::random_attachment; -/// let graph = Graph::new(2); +/// let graph = Graph::new(); /// random_attachment(&graph, 1000, 10); /// ``` pub fn random_attachment(graph: &Graph, vertices_to_add: usize, edges_per_step: usize) { @@ -49,7 +54,7 @@ pub fn random_attachment(graph: &Graph, vertices_to_add: usize, edges_per_step: max_id += 1; latest_time += 1; graph - .add_vertex(latest_time, max_id, &vec![]) + .add_vertex(latest_time, max_id, NO_PROPS) .map_err(|err| println!("{:?}", err)) .ok(); ids.push(max_id); @@ -61,7 +66,7 @@ pub fn random_attachment(graph: &Graph, vertices_to_add: usize, edges_per_step: latest_time += 1; edges.for_each(|neighbour| { graph - .add_edge(latest_time, max_id, *neighbour, &vec![], None) + .add_edge(latest_time, max_id, *neighbour, NO_PROPS, None) .expect("Not able to add edge"); }); ids.push(max_id); @@ -74,33 +79,33 @@ mod random_graph_test { use crate::graphgen::preferential_attachment::ba_preferential_attachment; #[test] fn blank_graph() { - let graph = Graph::new(2); + let graph = Graph::new(); random_attachment(&graph, 100, 20); - assert_eq!(graph.num_edges(), 2000); - assert_eq!(graph.num_vertices(), 120); + assert_eq!(graph.count_edges(), 2000); + assert_eq!(graph.count_vertices(), 120); } #[test] fn 
only_nodes() { - let graph = Graph::new(2); + let graph = Graph::new(); for i in 0..10 { graph - .add_vertex(i, i as u64, &vec![]) + .add_vertex(i, i as u64, NO_PROPS) .map_err(|err| println!("{:?}", err)) .ok(); } random_attachment(&graph, 1000, 5); - assert_eq!(graph.num_edges(), 5000); - assert_eq!(graph.num_vertices(), 1010); + assert_eq!(graph.count_edges(), 5000); + assert_eq!(graph.count_vertices(), 1010); } #[test] fn prior_graph() { - let graph = Graph::new(2); + let graph = Graph::new(); ba_preferential_attachment(&graph, 300, 7); random_attachment(&graph, 4000, 12); - assert_eq!(graph.num_edges(), 50106); - assert_eq!(graph.num_vertices(), 4307); + assert_eq!(graph.count_edges(), 50106); + assert_eq!(graph.count_vertices(), 4307); } } diff --git a/raphtory/src/lib.rs b/raphtory/src/lib.rs index 688915dc8c..9e53a8eac3 100644 --- a/raphtory/src/lib.rs +++ b/raphtory/src/lib.rs @@ -23,65 +23,42 @@ //! - **Fast** - raphtory is fast, and can process large amounts of data in a short amount of time. //! - **Open Source** - raphtory is open source, and is available on Github under a GPL-3.0 license. //! -//! ### Shards -//! -//! The sub module `Core` contains the underlying implementation of the graph. -//! Users interact with the graph via the `DB` submodule. -//! -//! The sub module `DB` is the overarching manager for the graph. A GraphDB instance can have N number of shards. -//! These shards (also called TemporalGraphParts) store fragments of a graph. -//! Each shard contains a part of a graph, similar to how data is partitioned. -//! -//! When an edge or node is added to the graph, GraphDB will search for an appropriate -//! place inside a shard to place these. -//! -//! For example, if your graph has 4 shards, altogether they make up the entire temporal graph. -//! Vertices and Edges will be spread across the varying shards. -//! -//! Shards are used for performance and distribution reasons. Having multiple shards running in -//! 
parallel increases the overall speed. In a matter of seconds, you are able to see your -//! results from your temporal graph analysis. Furthermore, you can run your analysis across -//! multiple machines (e.g. one shard per machine). -//! //! ## Example //! //! Create your own graph below //! ``` -//! use raphtory::db::graph::Graph; -//! use raphtory::core::Direction; -//! use raphtory::core::Prop; -//! use raphtory::db::view_api::*; +//! use raphtory::prelude::*; //! //! // Create your GraphDB object and state the number of shards you would like, here we have 2 -//! let graph = Graph::new(2); +//! let graph = Graph::new(); //! //! // Add vertex and edges to your graph with the respective properties //! graph.add_vertex( //! 1, //! "Gandalf", -//! &vec![("type".to_string(), Prop::Str("Character".to_string()))], -//! ); +//! [("type", Prop::str("Character"))], +//! ).unwrap(); //! //! graph.add_vertex( //! 2, //! "Frodo", -//! &vec![("type".to_string(), Prop::Str("Character".to_string()))], -//! ); +//! [("type", Prop::str("Character"))], +//! ).unwrap(); //! //! graph.add_edge( //! 3, //! "Gandalf", //! "Frodo", -//! &vec![( -//! "meeting".to_string(), -//! Prop::Str("Character Co-occurrence".to_string()), +//! [( +//! "meeting", +//! Prop::str("Character Co-occurrence"), //! )], //! None, -//! ); +//! ).unwrap(); //! //! // Get the in-degree, out-degree and degree of Gandalf -//! println!("Number of vertices {:?}", graph.num_vertices()); -//! println!("Number of Edges {:?}", graph.num_edges()); +//! println!("Number of vertices {:?}", graph.count_vertices()); +//! println!("Number of Edges {:?}", graph.count_edges()); //! ``` //! //! 
## Supported Operating Systems @@ -112,3 +89,32 @@ pub mod algorithms; pub mod core; pub mod db; pub mod graphgen; + +#[cfg(feature = "python")] +pub mod python; + +#[cfg(feature = "io")] +pub mod graph_loader; + +#[cfg(feature = "search")] +pub mod search; + +#[cfg(feature = "vectors")] +pub mod vectors; + +pub mod prelude { + pub const NO_PROPS: [(&str, Prop); 0] = []; + pub use crate::{ + core::{IntoProp, Prop, PropUnwrap}, + db::{ + api::{ + mutation::{AdditionOps, DeletionOps, PropertyAdditionOps}, + view::{ + EdgeListOps, EdgeViewOps, GraphViewOps, Layer, LayerOps, TimeOps, + VertexListOps, VertexViewOps, + }, + }, + graph::graph::Graph, + }, + }; +} diff --git a/raphtory/src/python/graph/algorithm_result.rs b/raphtory/src/python/graph/algorithm_result.rs new file mode 100644 index 0000000000..dcf67888dc --- /dev/null +++ b/raphtory/src/python/graph/algorithm_result.rs @@ -0,0 +1,177 @@ +use ordered_float::OrderedFloat; +use pyo3::prelude::*; + +/// Create a macro for py_algorithm_result +macro_rules! py_algorithm_result { + ($name:ident, $rustKey:ty, $rustValue:ty, $rustSortValue:ty) => { + #[pyclass] + pub struct $name( + $crate::algorithms::algorithm_result::AlgorithmResult< + $rustKey, + $rustValue, + $rustSortValue, + >, + ); + + impl pyo3::IntoPy + for $crate::algorithms::algorithm_result::AlgorithmResult< + $rustKey, + $rustValue, + $rustSortValue, + > + { + fn into_py(self, py: Python<'_>) -> pyo3::PyObject { + $name(self).into_py(py) + } + } + }; + + ($name:ident, $rustKey:ty, $rustValue:ty) => { + py_algorithm_result!($name, $rustKey, $rustValue, $rustValue); + }; +} + +#[macro_export] +macro_rules! py_algorithm_result_base { + ($name:ident, $rustKey:ty, $rustValue:ty) => { + #[pymethods] + impl $name { + /// Returns a copy of the entire `result` hashmap. + fn get_all(&self) -> std::collections::HashMap<$rustKey, $rustValue> { + self.0.get_all().clone() + } + + /// Returns the value corresponding to the provided key in the `result` hashmap. 
+ /// + /// # Arguments + /// + /// * `key`: The key of type `H` for which the value is to be retrieved. + fn get(&self, key: $rustKey) -> Option<$rustValue> { + self.0.get(&key).cloned() + } + + /// Creates a dataframe from the result + /// + /// # Returns + /// + /// A `pandas.DataFrame` containing the result + pub fn to_df(&self) -> PyResult { + let hashmap = &self.0.result; + let mut keys = Vec::new(); + let mut values = Vec::new(); + Python::with_gil(|py| { + for (key, value) in hashmap.iter() { + keys.push(key.to_object(py)); + values.push(value.to_object(py)); + } + let dict = pyo3::types::PyDict::new(py); + dict.set_item("Key", pyo3::types::PyList::new(py, keys.as_slice()))?; + dict.set_item("Value", pyo3::types::PyList::new(py, values.as_slice()))?; + let pandas = pyo3::types::PyModule::import(py, "pandas")?; + let df: &PyAny = pandas.getattr("DataFrame")?.call1((dict,))?; + Ok(df.to_object(py)) + }) + } + } + }; +} + +#[macro_export] +macro_rules! py_algorithm_result_partial_ord { + ($name:ident, $rustKey:ty, $rustValue:ty) => { + #[pymethods] + impl $name { + /// Sorts the `AlgorithmResult` by its values in ascending or descending order. + /// + /// # Arguments + /// + /// * `reverse`: If `true`, sorts the result in descending order; otherwise, sorts in ascending order. + /// + /// # Returns + /// + /// A sorted vector of tuples containing keys of type `H` and values of type `Y`. + #[pyo3(signature = (reverse=true))] + fn sort_by_value(&self, reverse: bool) -> Vec<($rustKey, $rustValue)> { + self.0.sort_by_value(reverse) + } + + /// Sorts the `AlgorithmResult` by its keys in ascending or descending order. + /// + /// # Arguments + /// + /// * `reverse`: If `true`, sorts the result in descending order; otherwise, sorts in ascending order. + /// + /// # Returns + /// + /// A sorted vector of tuples containing keys of type `H` and values of type `Y`. 
+ #[pyo3(signature = (reverse=true))] + fn sort_by_key(&self, reverse: bool) -> Vec<($rustKey, $rustValue)> { + self.0.sort_by_key(reverse) + } + + /// Retrieves the top-k elements from the `AlgorithmResult` based on its values. + /// + /// # Arguments + /// + /// * `k`: The number of elements to retrieve. + /// * `percentage`: If `true`, the `k` parameter is treated as a percentage of total elements. + /// * `reverse`: If `true`, retrieves the elements in descending order; otherwise, in ascending order. + /// + /// # Returns + /// + /// An `Option` containing a vector of tuples with keys of type `H` and values of type `Y`. + /// If `percentage` is `true`, the returned vector contains the top `k` percentage of elements. + /// If `percentage` is `false`, the returned vector contains the top `k` elements. + /// Returns `None` if the result is empty or if `k` is 0. + #[pyo3(signature = (k, percentage=false, reverse=true))] + fn top_k( + &self, + k: usize, + percentage: bool, + reverse: bool, + ) -> Vec<($rustKey, $rustValue)> { + self.0.top_k(k, percentage, reverse) + } + } + py_algorithm_result_base!($name, $rustKey, $rustValue); + }; +} + +#[macro_export] +macro_rules! py_algorithm_result_ord_hash_eq { + ($name:ident, $rustKey:ty, $rustValue:ty) => { + #[pymethods] + impl $name { + /// Groups the `AlgorithmResult` by its values. + /// + /// # Returns + /// + /// A `HashMap` where keys are unique values from the `AlgorithmResult` and values are vectors + /// containing keys of type `H` that share the same value. 
+ fn group_by(&self) -> std::collections::HashMap<$rustValue, Vec<$rustKey>> { + self.0.group_by() + } + } + py_algorithm_result_partial_ord!($name, $rustKey, $rustValue); + }; +} + +py_algorithm_result!(AlgorithmResultStrU64, String, u64); +py_algorithm_result_ord_hash_eq!(AlgorithmResultStrU64, String, u64); + +py_algorithm_result!( + AlgorithmResultStrTupleF32F32, + String, + (f32, f32), + (OrderedFloat, OrderedFloat) +); +py_algorithm_result_partial_ord!(AlgorithmResultStrTupleF32F32, String, (f32, f32)); + +py_algorithm_result!(AlgorithmResultStrVecI64Str, String, Vec<(i64, String)>); +py_algorithm_result_ord_hash_eq!(AlgorithmResultStrVecI64Str, String, Vec<(i64, String)>); + +py_algorithm_result!(AlgorithmResultU64VecUsize, u64, Vec); +py_algorithm_result_ord_hash_eq!(AlgorithmResultU64VecUsize, u64, Vec); + +py_algorithm_result!(AlgorithmResultStrF64, String, f64, OrderedFloat); +py_algorithm_result_partial_ord!(AlgorithmResultStrF64, String, f64); diff --git a/raphtory/src/python/graph/edge.rs b/raphtory/src/python/graph/edge.rs new file mode 100644 index 0000000000..1f2a4ca29f --- /dev/null +++ b/raphtory/src/python/graph/edge.rs @@ -0,0 +1,754 @@ +//! The edge module contains the PyEdge class, which is used to represent edges in the graph and +//! provides access to the edge's properties and vertices. +//! +//! The PyEdge class also provides access to the perspective APIs, which allow the user to view the +//! edge as it existed at a particular point in time, or as it existed over a particular time range. +//! 
+use crate::{ + core::{ + utils::{errors::GraphError, time::error::ParseTimeError}, + ArcStr, Direction, + }, + db::{ + api::{ + properties::Properties, + view::{ + internal::{DynamicGraph, Immutable, IntoDynamic, MaterializedGraph}, + BoxedIter, WindowSet, + }, + }, + graph::{ + edge::EdgeView, + views::{ + deletion_graph::GraphWithDeletions, layer_graph::LayeredGraph, + window_graph::WindowedGraph, + }, + }, + }, + prelude::*, + python::{ + graph::{ + properties::{PyNestedPropsIterable, PyPropsList}, + vertex::{PyNestedVertexIterable, PyVertex, PyVertexIterable}, + }, + types::{ + repr::{iterator_repr, Repr}, + wrappers::iterators::{ + NestedOptionI64Iterable, NestedU64U64Iterable, OptionI64Iterable, + }, + }, + utils::{PyGenericIterable, PyGenericIterator, PyInterval, PyTime}, + }, +}; +use chrono::NaiveDateTime; +use itertools::Itertools; +use pyo3::{prelude::*, pyclass::CompareOp}; +use std::{ + collections::{hash_map::DefaultHasher, HashMap}, + hash::{Hash, Hasher}, + ops::Deref, + sync::Arc, +}; + +/// PyEdge is a Python class that represents an edge in the graph. +/// An edge is a directed connection between two vertices. 
+#[pyclass(name = "Edge", subclass)] +pub struct PyEdge { + pub(crate) edge: EdgeView, +} + +#[pyclass(name="MutableEdge", extends=PyEdge)] +pub struct PyMutableEdge { + edge: EdgeView, +} + +impl From> for PyEdge { + fn from(value: EdgeView) -> Self { + Self { + edge: EdgeView { + graph: value.graph.clone().into_dynamic(), + edge: value.edge, + }, + } + } +} + +impl + GraphViewOps> From> for PyMutableEdge { + fn from(value: EdgeView) -> Self { + let edge = EdgeView { + edge: value.edge, + graph: value.graph.into(), + }; + + Self { edge } + } +} + +impl IntoPy for EdgeView { + fn into_py(self, py: Python<'_>) -> PyObject { + let py_version: PyEdge = self.into(); + py_version.into_py(py) + } +} + +impl IntoPy for EdgeView { + fn into_py(self, py: Python<'_>) -> PyObject { + let graph: MaterializedGraph = self.graph.into(); + let edge = self.edge; + let vertex = EdgeView { graph, edge }; + vertex.into_py(py) + } +} + +impl IntoPy for EdgeView { + fn into_py(self, py: Python<'_>) -> PyObject { + let graph: MaterializedGraph = self.graph.into(); + let edge = self.edge; + let vertex = EdgeView { graph, edge }; + vertex.into_py(py) + } +} + +impl IntoPy for EdgeView { + fn into_py(self, py: Python<'_>) -> PyObject { + Py::new(py, (PyMutableEdge::from(self.clone()), PyEdge::from(self))) + .unwrap() // I think this only fails if we are out of memory? Seems to be unavoidable! + .into_py(py) + } +} + +impl IntoPy for ArcStr { + fn into_py(self, py: Python<'_>) -> PyObject { + self.0.into_py(py) + } +} + +impl<'source> FromPyObject<'source> for ArcStr { + fn extract(ob: &'source PyAny) -> PyResult { + ob.extract::().map(|v| v.into()) + } +} + +/// PyEdge is a Python class that represents an edge in the graph. +/// An edge is a directed connection between two vertices. 
+#[pymethods] +impl PyEdge { + /// Rich comparison for Edge objects; only `==` and `!=` are supported, and both compare the edge ids + pub fn __richcmp__(&self, other: PyRef, op: CompareOp) -> Py { + let py = other.py(); + match op { + CompareOp::Eq => (self.edge.id() == other.id()).into_py(py), + CompareOp::Ne => (self.edge.id() != other.id()).into_py(py), + _ => py.NotImplemented(), + } + } + + /// Returns the hash of the edge, computed from the edge id only (properties are not hashed). + /// + /// Returns: + /// A hash of the edge. + pub fn __hash__(&self) -> u64 { + let mut s = DefaultHasher::new(); + self.edge.id().hash(&mut s); + s.finish() + } + + /// The id of the edge. + #[getter] + pub fn id(&self) -> (u64, u64) { + self.edge.id() + } + + pub fn __getitem__(&self, name: &str) -> Option { + self.edge.properties().get(name) + } + + /// Returns a list of timestamps of when the edge is added or a change to the edge is made. + /// + /// Returns: + /// A list of timestamps. + /// + pub fn history(&self) -> Vec { + self.edge.history() + } + + /// Returns a view of the properties of the edge. + #[getter] + pub fn properties(&self) -> Properties> { + self.edge.properties() + } + + /// Get the source vertex of the Edge. + /// + /// Returns: + /// The source vertex of the Edge. + #[getter] + fn src(&self) -> PyVertex { + self.edge.src().into() + } + + /// Get the destination vertex of the Edge. + /// + /// Returns: + /// The destination vertex of the Edge. + #[getter] + fn dst(&self) -> PyVertex { + self.edge.dst().into() + } + + //****** Perspective APIS ******// + + /// Get the start time of the Edge. + /// + /// Returns: + /// The start time of the Edge. + #[getter] + pub fn start(&self) -> Option { + self.edge.start() + } + + /// Get the start datetime of the Edge. + /// + /// Returns: + /// the start datetime of the Edge. + #[getter] + pub fn start_date_time(&self) -> Option { + let start_time = self.edge.start()?; + NaiveDateTime::from_timestamp_millis(start_time) + } + + /// Get the end time of the Edge. + /// + /// Returns: + /// The end time of the Edge.
+ #[getter] + pub fn end(&self) -> Option { + self.edge.end() + } + + /// Get the end datetime of the Edge. + /// + /// Returns: + /// The end datetime of the Edge + #[getter] + pub fn end_date_time(&self) -> Option { + let end_time = self.edge.end()?; + NaiveDateTime::from_timestamp_millis(end_time) + } + + /// Get a set of Edge windows for a given step size using an expanding window. + /// + /// Arguments: + /// step (int | str): The step size of the expanding window. + /// + /// Returns: + /// A set of windows containing edges that fall in the time period + #[pyo3(signature = (step))] + fn expanding( + &self, + step: PyInterval, + ) -> Result>, ParseTimeError> { + self.edge.expanding(step) + } + + /// Get a set of Edge windows for a given window size and (optional) step + /// using a rolling window. + /// A rolling window is a window that moves forward by `step` size at each iteration. + /// + /// Arguments: + /// window (int | str): The size of the window. + /// step (int | str): The step size of the rolling window (optional). + /// + /// Returns: + /// A set of windows containing edges that fall in the time period + fn rolling( + &self, + window: PyInterval, + step: Option, + ) -> Result>, ParseTimeError> { + self.edge.rolling(window, step) + } + + /// Get a new Edge with the properties of this Edge within the specified time window. + /// + /// Arguments: + /// t_start (int | str): The start time of the window (optional, defaults to `PyTime::MIN`). + /// t_end (int | str): The end time of the window (optional, defaults to `PyTime::MAX`). + /// + /// Returns: + /// A new Edge with the properties of this Edge within the specified time window. + #[pyo3(signature = (t_start = None, t_end = None))] + pub fn window( + &self, + t_start: Option, + t_end: Option, + ) -> EdgeView> { + self.edge + .window(t_start.unwrap_or(PyTime::MIN), t_end.unwrap_or(PyTime::MAX)) + } + + /// Get a new Edge with the properties of this Edge within the specified layers. + /// + /// Arguments: + /// layer_names ([str]): Layers to be included in the new edge.
+ /// + /// Returns: + /// A new Edge with the properties of this Edge within the specified layers; an error listing the available layers is raised if the requested layers are not available for the edge. + #[pyo3(signature = (layer_names))] + pub fn layers( + &self, + layer_names: Vec, + ) -> PyResult>> { + if let Some(edge) = self.edge.layer(layer_names.clone()) { + Ok(edge) + } else { + let available_layers: Vec<_> = self.edge.layer_names().collect(); + Err(PyErr::new::( + format!("Layers {layer_names:?} not available for edge, available layers: {available_layers:?}"), + )) + } + } + + /// Get a new Edge with the properties of this Edge at a specified time. + /// + /// Arguments: + /// end (int): The time to get the properties at. + /// + /// Returns: + /// A new Edge with the properties of this Edge at a specified time. + #[pyo3(signature = (end))] + pub fn at(&self, end: PyTime) -> EdgeView> { + self.edge.at(end) + } + + /// Explodes an Edge into a list of PyEdges. This is useful when you want to iterate over + /// the properties of an Edge at every single point in time. This will return a separate edge + /// each time a property has been changed. + /// + /// Returns: + /// A list of PyEdges + pub fn explode(&self) -> PyEdges { + let edge = self.edge.clone(); + (move || edge.explode()).into() + } + + /// Explodes an Edge into a list of PyEdges, one for each layer the edge is part of. This is useful when you want to iterate over + /// the properties of an Edge for every layer. + /// + /// Returns: + /// A list of PyEdges + pub fn explode_layers(&self) -> PyEdges { + let edge = self.edge.clone(); + (move || edge.explode_layers()).into() + } + + /// Gets the earliest time of an edge. + /// + /// Returns: + /// (int) The earliest time of an edge + #[getter] + pub fn earliest_time(&self) -> Option { + self.edge.earliest_time() + } + + /// Gets the earliest datetime of an edge. + /// + /// Returns: + /// the earliest datetime of an edge + #[getter] + pub fn earliest_date_time(&self) -> Option { + NaiveDateTime::from_timestamp_millis(self.edge.earliest_time()?)
+ } + + /// Gets the latest time of an edge. + /// + /// Returns: + /// (int) The latest time of an edge + #[getter] + pub fn latest_time(&self) -> Option { + self.edge.latest_time() + } + + /// Gets the latest datetime of an edge. + /// + /// Returns: + /// the latest datetime of an edge + #[getter] + pub fn latest_date_time(&self) -> Option { + let latest_time = self.edge.latest_time()?; + NaiveDateTime::from_timestamp_millis(latest_time) + } + + /// Gets the time of an exploded edge. + /// + /// Returns: + /// (int) The time of an exploded edge + #[getter] + pub fn time(&self) -> Option { + self.edge.time() + } + + /// Gets the names of the layers this edge belongs to + /// + /// Returns: + /// ([str]) The names of the layers + #[getter] + pub fn layer_names(&self) -> Vec { + self.edge.layer_names().collect() + } + + /// Gets the name of the layer this edge belongs to - assuming it only belongs to one layer + /// + /// Returns: + /// (str | None) The name of the layer + #[getter] + pub fn layer_name(&self) -> Option { + self.edge.layer_name().map(|v| v.clone()) + } + + /// Gets the datetime of an exploded edge. + /// + /// Returns: + /// (datetime) the datetime of an exploded edge + #[getter] + pub fn date_time(&self) -> Option { + let date_time = self.edge.time()?; + NaiveDateTime::from_timestamp_millis(date_time) + } + + /// Displays the Edge as a string.
+ pub fn __repr__(&self) -> String { + self.repr() + } +} + +impl Repr for PyEdge { + fn repr(&self) -> String { + self.edge.repr() + } +} + +impl Repr for EdgeView { + fn repr(&self) -> String { + let properties: String = self + .properties() + .iter() + .map(|(k, v)| format!("{}: {}", k.deref(), v)) + .join(", "); + + let source = self.src().name(); + let target = self.dst().name(); + let earliest_time = self.earliest_time().repr(); + let latest_time = self.latest_time().repr(); + if properties.is_empty() { + format!( + "Edge(source={}, target={}, earliest_time={}, latest_time={})", + source.trim_matches('"'), + target.trim_matches('"'), + earliest_time, + latest_time, + ) + } else { + format!( + "Edge(source={}, target={}, earliest_time={}, latest_time={}, properties={})", + source.trim_matches('"'), + target.trim_matches('"'), + earliest_time, + latest_time, + format!("{{{properties}}}") + ) + } + } +} + +impl Repr for PyMutableEdge { + fn repr(&self) -> String { + self.edge.repr() + } +} +#[pymethods] +impl PyMutableEdge { + fn add_updates( + &self, + t: PyTime, + properties: Option>, + layer: Option<&str>, + ) -> Result<(), GraphError> { + self.edge + .add_updates(t, properties.unwrap_or_default(), layer) + } + + fn add_constant_properties( + &self, + properties: HashMap, + layer: Option<&str>, + ) -> Result<(), GraphError> { + self.edge.add_constant_properties(properties, layer) + } + + fn __repr__(&self) -> String { + self.repr() + } +} + +/// A list of edges that can be iterated over. 
+#[pyclass(name = "Edges")] +pub struct PyEdges { + builder: Arc BoxedIter> + Send + Sync + 'static>, +} + +impl PyEdges { + /// Calls the stored builder to produce a fresh iterator over the edges for use in Rust + fn iter(&self) -> BoxedIter> { + (self.builder)() + } + + /// Returns the same iteration with every edge converted for use in Python + fn py_iter(&self) -> BoxedIter { + Box::new(self.iter().map(|e| e.into())) + } +} + +#[pymethods] +impl PyEdges { + fn __iter__(&self) -> PyGenericIterator { + self.py_iter().into() + } + + /// Returns all source vertices of the Edges as an iterable. + /// + /// Returns: + /// The source vertices of the Edges as an iterable. + #[getter] + fn src(&self) -> PyVertexIterable { + let builder = self.builder.clone(); + (move || builder().src()).into() + } + + /// Returns all destination vertices as an iterable + #[getter] + fn dst(&self) -> PyVertexIterable { + let builder = self.builder.clone(); + (move || builder().dst()).into() + } + + /// Returns all edges as a list + fn collect(&self) -> Vec { + self.py_iter().collect() + } + + /// Returns the number of edges + fn count(&self) -> usize { + self.py_iter().count() + } + + /// Explodes the edges into a list of edges. This is useful when you want to iterate over + /// the properties of an Edge at every single point in time. This will return a separate edge + /// each time a property has been changed. + fn explode(&self) -> PyEdges { + let builder = self.builder.clone(); + (move || { + let iter: BoxedIter> = + Box::new(builder().flat_map(|e| e.explode())); + iter + }) + .into() + } + + /// Explodes each edge into a list of edges, one for each layer the edge is part of. This is useful when you want to iterate over + /// the properties of an Edge for every layer. + fn explode_layers(&self) -> PyEdges { + let builder = self.builder.clone(); + (move || { + let iter: BoxedIter> = + Box::new(builder().flat_map(|e| e.explode_layers())); + iter + }) + .into() + } + + /// Returns the earliest time of the edges.
+ #[getter] + fn earliest_time(&self) -> OptionI64Iterable { + let edges: Arc< + dyn Fn() -> Box> + Send> + Send + Sync, + > = self.builder.clone(); + (move || edges().earliest_time()).into() + } + + /// Returns the latest time of the edges. + #[getter] + fn latest_time(&self) -> OptionI64Iterable { + let edges: Arc< + dyn Fn() -> Box> + Send> + Send + Sync, + > = self.builder.clone(); + (move || edges().latest_time()).into() + } + + /// Returns all properties of the edges + #[getter] + fn properties(&self) -> PyPropsList { + let builder = self.builder.clone(); + (move || builder().properties()).into() + } + + /// Returns all ids of the edges. + #[getter] + fn id(&self) -> PyGenericIterable { + let edges = self.builder.clone(); + (move || edges().id()).into() + } + + fn __repr__(&self) -> String { + self.repr() + } +} + +impl Repr for PyEdges { + fn repr(&self) -> String { + format!("Edges({})", iterator_repr(self.iter())) + } +} + +impl BoxedIter> + Send + Sync + 'static> From for PyEdges { + fn from(value: F) -> Self { + Self { + builder: Arc::new(value), + } + } +} + +py_nested_iterable!(PyNestedEdges, EdgeView); + +#[pymethods] +impl PyNestedEdges { + /// Returns all source vertices of the Edges as an iterable. + /// + /// Returns: + /// The source vertices of the Edges as an iterable. + #[getter] + fn src(&self) -> PyNestedVertexIterable { + let builder = self.builder.clone(); + (move || builder().src()).into() + } + + /// Returns all destination vertices as an iterable + #[getter] + fn dst(&self) -> PyNestedVertexIterable { + let builder = self.builder.clone(); + (move || builder().dst()).into() + } + + /// Returns the earliest time of the edges. + #[getter] + fn earliest_time(&self) -> NestedOptionI64Iterable { + let edges = self.builder.clone(); + (move || edges().earliest_time()).into() + } + + /// Returns the latest time of the edges.
+ #[getter] + fn latest_time(&self) -> NestedOptionI64Iterable { + let edges = self.builder.clone(); + (move || edges().latest_time()).into() + } + + // FIXME: needs a view that allows indexing into the properties + /// Returns all properties of the edges + #[getter] + fn properties(&self) -> PyNestedPropsIterable { + let builder = self.builder.clone(); + (move || builder().properties()).into() + } + + /// Returns all ids of the edges. + #[getter] + fn id(&self) -> NestedU64U64Iterable { + let edges = self.builder.clone(); + (move || edges().id()).into() + } + + /// Explode each edge, creating a separate edge instance for each edge event + fn explode(&self) -> PyNestedEdges { + let builder = self.builder.clone(); + (move || { + let iter: BoxedIter>> = Box::new(builder().map(|e| { + let inner_box: BoxedIter> = + Box::new(e.flat_map(|e| e.explode())); + inner_box + })); + iter + }) + .into() + } + + /// Explode each edge over layers, creating a separate edge instance for each layer the edge is part of + fn explode_layers(&self) -> PyNestedEdges { + let builder = self.builder.clone(); + (move || { + let iter: BoxedIter>> = Box::new(builder().map(|e| { + let inner_box: BoxedIter> = + Box::new(e.flat_map(|e| e.explode_layers())); + inner_box + })); + iter + }) + .into() + } +} + +#[pyclass] +#[derive(Clone)] +pub struct PyDirection { + inner: Direction, +} + +#[pymethods] +impl PyDirection { + #[new] + pub fn new(direction: &str) -> Self { + match direction { + "OUT" => PyDirection { + inner: Direction::OUT, + }, + "IN" => PyDirection { + inner: Direction::IN, + }, + "BOTH" => PyDirection { + inner: Direction::BOTH, + }, + _ => panic!("Invalid direction"), + } + } + + fn as_str(&self) -> &str { + match self.inner { + Direction::OUT => "OUT", + Direction::IN => "IN", + Direction::BOTH => "BOTH", + } + } +} + +impl Into for PyDirection { + fn into(self) -> Direction { + self.inner + } +} + +impl From for PyDirection { + fn from(s: String) -> Self { + match 
s.to_uppercase().as_str() { + "OUT" => PyDirection { + inner: Direction::OUT, + }, + "IN" => PyDirection { + inner: Direction::IN, + }, + "BOTH" => PyDirection { + inner: Direction::BOTH, + }, + _ => panic!("Invalid direction string"), + } + } +} diff --git a/raphtory/src/python/graph/graph.rs b/raphtory/src/python/graph/graph.rs new file mode 100644 index 0000000000..4741c7dbd8 --- /dev/null +++ b/raphtory/src/python/graph/graph.rs @@ -0,0 +1,460 @@ +//! Defines the `Graph` struct, which represents a raphtory graph in memory. +//! +//! This is the base class used to create a temporal graph, add vertices and edges, +//! create windows, and query the graph with a variety of algorithms. +//! It is a wrapper around a set of shards, which are the actual graph data structures. +//! In Python, this class wraps around the rust graph. +use crate::{ + core::utils::errors::GraphError, + db::api::view::internal::MaterializedGraph, + prelude::*, + python::{ + graph::{graph_with_deletions::PyGraphWithDeletions, views::graph_view::PyGraphView}, + utils::{PyInputVertex, PyTime}, + }, +}; +use pyo3::prelude::*; + +use crate::{ + core::entities::vertices::vertex_ref::VertexRef, + db::{ + api::view::internal::{DynamicGraph, IntoDynamic}, + graph::{edge::EdgeView, vertex::VertexView}, + }, + python::graph::pandas::{load_edges_props_from_df, load_vertex_props_from_df}, +}; +use pyo3::types::{IntoPyDict, PyBytes}; +use std::{ + collections::HashMap, + fmt::{Debug, Formatter}, + path::{Path, PathBuf}, +}; + +use super::pandas::{ + load_edges_from_df, load_vertices_from_df, process_pandas_py_df, GraphLoadException, +}; + +/// A temporal graph. 
+#[derive(Clone)] +#[pyclass(name="Graph", extends=PyGraphView)] +pub struct PyGraph { + pub graph: Graph, +} + +impl Debug for PyGraph { + fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result { + write!(f, "{}", self.graph) + } +} + +impl From for PyGraph { + fn from(value: Graph) -> Self { + Self { graph: value } + } +} + +impl From for Graph { + fn from(value: PyGraph) -> Self { + value.graph + } +} + +impl From for DynamicGraph { + fn from(value: PyGraph) -> Self { + value.graph.into_dynamic() + } +} + +impl<'source> FromPyObject<'source> for MaterializedGraph { + fn extract(graph: &'source PyAny) -> PyResult { + if let Ok(graph) = graph.extract::>() { + Ok(graph.graph.clone().into()) + } else if let Ok(graph) = graph.extract::>() { + Ok(graph.graph.clone().into()) + } else { + Err(PyErr::new::(format!( + "Incorrect type, object is not a PyGraph or PyGraphWithDeletions" + ))) + } + } +} + +impl IntoPy for Graph { + fn into_py(self, py: Python<'_>) -> PyObject { + Py::new(py, (PyGraph::from(self.clone()), PyGraphView::from(self))) + .unwrap() // I think this only fails if we are out of memory? Seems to be unavoidable if we want to create an actual graph. + .into_py(py) + } +} + +impl<'source> FromPyObject<'source> for Graph { + fn extract(ob: &'source PyAny) -> PyResult { + let g: PyRef = ob.extract()?; + Ok(g.graph.clone()) + } +} + +impl PyGraph { + pub fn py_from_db_graph(db_graph: Graph) -> PyResult> { + Python::with_gil(|py| { + Py::new( + py, + (PyGraph::from(db_graph.clone()), PyGraphView::from(db_graph)), + ) + }) + } +} + +/// A temporal graph. +#[pymethods] +impl PyGraph { + #[new] + pub fn py_new() -> (Self, PyGraphView) { + let graph = Graph::new(); + ( + Self { + graph: graph.clone(), + }, + PyGraphView::from(graph), + ) + } + + /// Adds a new vertex with the given id and properties to the graph. + /// + /// Arguments: + /// timestamp (int, str, or datetime(utc)): The timestamp of the vertex. + /// id (str or int): The id of the vertex. 
+ /// properties (dict): The properties of the vertex (optional). + /// + /// Returns: + /// The result of the underlying `add_vertex` call, not None (NOTE(review): presumably a view of the added vertex - confirm) + #[pyo3(signature = (timestamp, id, properties=None))] + pub fn add_vertex( + &self, + timestamp: PyTime, + id: PyInputVertex, + properties: Option>, + ) -> Result, GraphError> { + self.graph + .add_vertex(timestamp, id, properties.unwrap_or_default()) + } + + /// Adds properties to the graph. + /// + /// Arguments: + /// timestamp (int, str, or datetime(utc)): The timestamp of the temporal property. + /// properties (dict): The temporal properties of the graph. + /// + /// Returns: + /// None + pub fn add_property( + &self, + timestamp: PyTime, + properties: HashMap, + ) -> Result<(), GraphError> { + self.graph.add_properties(timestamp, properties) + } + + /// Adds static properties to the graph. + /// + /// Arguments: + /// properties (dict): The static properties of the graph. + /// + /// Returns: + /// None + pub fn add_constant_properties( + &self, + properties: HashMap, + ) -> Result<(), GraphError> { + self.graph.add_constant_properties(properties) + } + + /// Adds a new edge with the given source and destination vertices and properties to the graph. + /// + /// Arguments: + /// timestamp (int, str, or datetime(utc)): The timestamp of the edge. + /// src (str or int): The id of the source vertex. + /// dst (str or int): The id of the destination vertex. + /// properties (dict): The properties of the edge, as a dict of string and properties (optional) + /// layer (str): The layer of the edge (optional). + /// + /// Returns: + /// The result of the underlying `add_edge` call, not None (NOTE(review): presumably a view of the added edge - confirm) + #[pyo3(signature = (timestamp, src, dst, properties=None, layer=None))] + pub fn add_edge( + &self, + timestamp: PyTime, + src: PyInputVertex, + dst: PyInputVertex, + properties: Option>, + layer: Option<&str>, + ) -> Result, GraphError> { + self.graph + .add_edge(timestamp, src, dst, properties.unwrap_or_default(), layer) + } + + //FIXME: This is reimplemented here to get mutable views. If we switch the underlying graph to enum dispatch, this won't be necessary!
+ /// Gets the vertex with the specified id + /// + /// Arguments: + /// id (str or int): the vertex id + /// + /// Returns: + /// the vertex with the specified id, or None if the vertex does not exist + pub fn vertex(&self, id: VertexRef) -> Option> { + self.graph.vertex(id) + } + + //FIXME: This is reimplemented here to get mutable views. If we switch the underlying graph to enum dispatch, this won't be necessary! + /// Gets the edge with the specified source and destination vertices + /// + /// Arguments: + /// src (str or int): the source vertex id + /// dst (str or int): the destination vertex id + /// (no layer argument is accepted: the Python signature is `(src, dst)`) + /// + /// Returns: + /// the edge with the specified source and destination vertices, or None if the edge does not exist + #[pyo3(signature = (src, dst))] + pub fn edge(&self, src: VertexRef, dst: VertexRef) -> Option> { + self.graph.edge(src, dst) + } + + //****** Saving And Loading ******// + + // Alternative constructors are tricky, see: https://gist.github.com/redshiftzero/648e4feeff3843ffd9924f13625f839c + + /// Loads a graph from the given path. + /// + /// Arguments: + /// path (str): The path to the graph. NOTE: the path is joined onto the `CARGO_MANIFEST_DIR` captured at compile time, so a relative path is resolved against that directory rather than the current working directory (unlike `save_to_file`, which uses the path as given). + /// + /// Returns: + /// Graph: The loaded graph. + #[staticmethod] + pub fn load_from_file(path: &str) -> Result { + let file_path: PathBuf = [env!("CARGO_MANIFEST_DIR"), path].iter().collect(); + Graph::load_from_file(file_path) + } + + /// Saves the graph to the given path. + /// + /// Arguments: + /// path (str): The path to the graph.
+ /// + /// Returns: + /// None + pub fn save_to_file(&self, path: &str) -> Result<(), GraphError> { + self.graph.save_to_file(Path::new(path)) + } + + /// Get bincode encoded graph + pub fn bincode<'py>(&'py self, py: Python<'py>) -> Result<&'py PyBytes, GraphError> { + let bytes = MaterializedGraph::from(self.graph.clone()).bincode()?; + Ok(PyBytes::new(py, &bytes)) + } + + #[staticmethod] + #[pyo3(signature = (edges_df, src = "source", dst = "destination", time = "time", props = None, const_props=None,shared_const_props=None,layer = None, layer_in_df = None, vertex_df = None, vertex_col = None, vertex_time_col = None, vertex_props = None, vertex_const_props = None, vertex_shared_const_props = None))] + fn load_from_pandas( + edges_df: &PyAny, + src: &str, + dst: &str, + time: &str, + props: Option>, + const_props: Option>, + shared_const_props: Option>, + layer: Option<&str>, + layer_in_df: Option<&str>, + vertex_df: Option<&PyAny>, + vertex_col: Option<&str>, + vertex_time_col: Option<&str>, + vertex_props: Option>, + vertex_const_props: Option>, + vertex_shared_const_props: Option>, + ) -> Result { + let graph = PyGraph { + graph: Graph::new(), + }; + graph.load_edges_from_pandas( + edges_df, + src, + dst, + time, + props, + const_props, + shared_const_props, + layer, + layer_in_df, + )?; + if let (Some(vertex_df), Some(vertex_col), Some(vertex_time_col)) = + (vertex_df, vertex_col, vertex_time_col) + { + graph.load_vertices_from_pandas( + vertex_df, + vertex_col, + vertex_time_col, + vertex_props, + vertex_const_props, + vertex_shared_const_props, + )?; + } + Ok(graph.graph) + } + + #[pyo3(signature = (vertices_df, vertex_col = "id", time_col = "time", props = None, const_props = None, shared_const_props = None))] + fn load_vertices_from_pandas( + &self, + vertices_df: &PyAny, + vertex_col: &str, + time_col: &str, + props: Option>, + const_props: Option>, + shared_const_props: Option>, + ) -> Result<(), GraphError> { + let graph = &self.graph; + 
Python::with_gil(|py| { + let size: usize = py + .eval( + "index.__len__()", + Some([("index", vertices_df.getattr("index")?)].into_py_dict(py)), + None, + )? + .extract()?; + let df = process_pandas_py_df(vertices_df, py, size)?; + load_vertices_from_df( + &df, + size, + vertex_col, + time_col, + props, + const_props, + shared_const_props, + graph, + ) + .map_err(|e| GraphLoadException::new_err(format!("{:?}", e)))?; + + Ok::<(), PyErr>(()) + }) + .map_err(|e| GraphError::LoadFailure(format!("Failed to load graph {e:?}")))?; + Ok(()) + } + + #[pyo3(signature = (edge_df, src_col = "source", dst_col = "destination", time_col = "time", props = None, const_props=None,shared_const_props=None,layer=None,layer_in_df=None))] + fn load_edges_from_pandas( + &self, + edge_df: &PyAny, + src_col: &str, + dst_col: &str, + time_col: &str, + props: Option>, + const_props: Option>, + shared_const_props: Option>, + layer: Option<&str>, + layer_in_df: Option<&str>, + ) -> Result<(), GraphError> { + let graph = &self.graph; + Python::with_gil(|py| { + let size: usize = py + .eval( + "index.__len__()", + Some([("index", edge_df.getattr("index")?)].into_py_dict(py)), + None, + )? 
+ .extract()?; + let df = process_pandas_py_df(edge_df, py, size)?; + load_edges_from_df( + &df, + size, + src_col, + dst_col, + time_col, + props, + const_props, + shared_const_props, + layer, + layer_in_df, + graph, + ) + .map_err(|e| GraphLoadException::new_err(format!("{:?}", e)))?; + + Ok::<(), PyErr>(()) + }) + .map_err(|e| GraphError::LoadFailure(format!("Failed to load graph {e:?}")))?; + Ok(()) + } + + #[pyo3(signature = (vertices_df, vertex_col = "id", const_props = None, shared_const_props = None))] + fn load_vertex_props_from_pandas( + &self, + vertices_df: &PyAny, + vertex_col: &str, + const_props: Option>, + shared_const_props: Option>, + ) -> Result<(), GraphError> { + let graph = &self.graph; + Python::with_gil(|py| { + let size: usize = py + .eval( + "index.__len__()", + Some([("index", vertices_df.getattr("index")?)].into_py_dict(py)), + None, + )? + .extract()?; + let df = process_pandas_py_df(vertices_df, py, size)?; + load_vertex_props_from_df( + &df, + size, + vertex_col, + const_props, + shared_const_props, + graph, + ) + .map_err(|e| GraphLoadException::new_err(format!("{:?}", e)))?; + + Ok::<(), PyErr>(()) + }) + .map_err(|e| GraphError::LoadFailure(format!("Failed to load graph {e:?}")))?; + Ok(()) + } + + #[pyo3(signature = (edge_df, src_col = "source", dst_col = "destination", const_props=None,shared_const_props=None,layer=None,layer_in_df=None))] + fn load_edge_props_from_pandas( + &self, + edge_df: &PyAny, + src_col: &str, + dst_col: &str, + const_props: Option>, + shared_const_props: Option>, + layer: Option<&str>, + layer_in_df: Option<&str>, + ) -> Result<(), GraphError> { + let graph = &self.graph; + Python::with_gil(|py| { + let size: usize = py + .eval( + "index.__len__()", + Some([("index", edge_df.getattr("index")?)].into_py_dict(py)), + None, + )? 
+ .extract()?; + let df = process_pandas_py_df(edge_df, py, size)?; + load_edges_props_from_df( + &df, + size, + src_col, + dst_col, + const_props, + shared_const_props, + layer, + layer_in_df, + graph, + ) + .map_err(|e| GraphLoadException::new_err(format!("{:?}", e)))?; + + Ok::<(), PyErr>(()) + }) + .map_err(|e| GraphError::LoadFailure(format!("Failed to load graph {e:?}")))?; + Ok(()) + } +} diff --git a/raphtory/src/python/graph/graph_with_deletions.rs b/raphtory/src/python/graph/graph_with_deletions.rs new file mode 100644 index 0000000000..970331fb38 --- /dev/null +++ b/raphtory/src/python/graph/graph_with_deletions.rs @@ -0,0 +1,245 @@ +//! Defines the `GraphWithDeletions` class, which represents a raphtory graph in memory. +//! Unlike in the `Graph` which has event semantics, `GraphWithDeletions` has edges that persist until explicitly deleted. +//! +//! This is the base class used to create a temporal graph, add vertices and edges, +//! create windows, and query the graph with a variety of algorithms. +//! It is a wrapper around a set of shards, which are the actual graph data structures. +//! In Python, this class wraps around the rust graph. +use crate::{ + core::{entities::vertices::vertex_ref::VertexRef, utils::errors::GraphError, Prop}, + db::{ + api::{ + mutation::{AdditionOps, PropertyAdditionOps}, + view::internal::MaterializedGraph, + }, + graph::{edge::EdgeView, vertex::VertexView, views::deletion_graph::GraphWithDeletions}, + }, + prelude::{DeletionOps, GraphViewOps}, + python::{ + graph::views::graph_view::PyGraphView, + utils::{PyInputVertex, PyTime}, + }, +}; +use pyo3::{prelude::*, types::PyBytes}; +use std::{ + collections::HashMap, + fmt::{Debug, Formatter}, + path::{Path, PathBuf}, +}; + +/// A temporal graph. 
+#[derive(Clone)] +#[pyclass(name="GraphWithDeletions", extends=PyGraphView)] +pub struct PyGraphWithDeletions { + pub(crate) graph: GraphWithDeletions, +} + +impl Debug for PyGraphWithDeletions { + fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result { + write!(f, "{}", self.graph) + } +} + +impl From for PyGraphWithDeletions { + fn from(value: GraphWithDeletions) -> Self { + Self { graph: value } + } +} + +impl IntoPy for GraphWithDeletions { + fn into_py(self, py: Python<'_>) -> PyObject { + Py::new( + py, + ( + PyGraphWithDeletions::from(self.clone()), + PyGraphView::from(self), + ), + ) + .unwrap() // I think this only fails if we are out of memory? Seems to be unavoidable if we want to create an actual graph. + .into_py(py) + } +} + +impl PyGraphWithDeletions { + pub fn py_from_db_graph(db_graph: GraphWithDeletions) -> PyResult> { + Python::with_gil(|py| { + Py::new( + py, + ( + PyGraphWithDeletions::from(db_graph.clone()), + PyGraphView::from(db_graph), + ), + ) + }) + } +} + +/// A temporal graph. +#[pymethods] +impl PyGraphWithDeletions { + #[new] + pub fn py_new() -> (Self, PyGraphView) { + let graph = GraphWithDeletions::new(); + ( + Self { + graph: graph.clone(), + }, + PyGraphView::from(graph), + ) + } + + /// Adds a new vertex with the given id and properties to the graph. + /// + /// Arguments: + /// timestamp (int, str, or datetime(utc)): The timestamp of the vertex. + /// id (str or int): The id of the vertex. + /// properties (dict): The properties of the vertex. + /// + /// Returns: + /// None + #[pyo3(signature = (timestamp, id, properties=None))] + pub fn add_vertex( + &self, + timestamp: PyTime, + id: PyInputVertex, + properties: Option>, + ) -> Result, GraphError> { + self.graph + .add_vertex(timestamp, id, properties.unwrap_or_default()) + } + + /// Adds properties to the graph. + /// + /// Arguments: + /// timestamp (int, str, or datetime(utc)): The timestamp of the temporal property. 
+ /// properties (dict): The temporal properties of the graph. + /// + /// Returns: + /// None + pub fn add_property( + &self, + timestamp: PyTime, + properties: HashMap, + ) -> Result<(), GraphError> { + self.graph.add_properties(timestamp, properties) + } + + /// Adds static properties to the graph. + /// + /// Arguments: + /// properties (dict): The static properties of the graph. + /// + /// Returns: + /// None + pub fn add_constant_properties( + &self, + properties: HashMap, + ) -> Result<(), GraphError> { + self.graph.add_constant_properties(properties) + } + + /// Adds a new edge with the given source and destination vertices and properties to the graph. + /// + /// Arguments: + /// timestamp (int): The timestamp of the edge. + /// src (str or int): The id of the source vertex. + /// dst (str or int): The id of the destination vertex. + /// properties (dict): The properties of the edge, as a dict of string and properties + /// layer (str): The layer of the edge. + /// + /// Returns: + /// None + #[pyo3(signature = (timestamp, src, dst, properties=None, layer=None))] + pub fn add_edge( + &self, + timestamp: PyTime, + src: PyInputVertex, + dst: PyInputVertex, + properties: Option>, + layer: Option<&str>, + ) -> Result, GraphError> { + self.graph + .add_edge(timestamp, src, dst, properties.unwrap_or_default(), layer) + } + + /// Deletes an edge given the timestamp, src and dst vertices and layer (optional) + /// + /// Arguments: + /// timestamp (int): The timestamp of the edge. + /// src (str or int): The id of the source vertex. + /// dst (str or int): The id of the destination vertex. + /// layer (str): The layer of the edge. 
(optional) + /// + /// Returns: + /// None or a GraphError if the edge could not be deleted + pub fn delete_edge( + &self, + timestamp: PyTime, + src: PyInputVertex, + dst: PyInputVertex, + layer: Option<&str>, + ) -> Result<(), GraphError> { + self.graph.delete_edge(timestamp, src, dst, layer) + } + + //FIXME: This is reimplemented here to get mutable views. If we switch the underlying graph to enum dispatch, this won't be necessary! + /// Gets the vertex with the specified id + /// + /// Arguments: + /// id (str or int): the vertex id + /// + /// Returns: + /// the vertex with the specified id, or None if the vertex does not exist + pub fn vertex(&self, id: VertexRef) -> Option> { + self.graph.vertex(id) + } + + //FIXME: This is reimplemented here to get mutable views. If we switch the underlying graph to enum dispatch, this won't be necessary! + /// Gets the edge with the specified source and destination vertices + /// + /// Arguments: + /// src (str or int): the source vertex id + /// dst (str or int): the destination vertex id + /// layer (str): the edge layer (optional) + /// + /// Returns: + /// the edge with the specified source and destination vertices, or None if the edge does not exist + #[pyo3(signature = (src, dst))] + pub fn edge(&self, src: VertexRef, dst: VertexRef) -> Option> { + self.graph.edge(src, dst) + } + + //****** Saving And Loading ******// + + // Alternative constructors are tricky, see: https://gist.github.com/redshiftzero/648e4feeff3843ffd9924f13625f839c + + /// Loads a graph from the given path. + /// + /// Arguments: + /// path (str): The path to the graph. + /// + /// Returns: + /// Graph: The loaded graph. + #[staticmethod] + pub fn load_from_file(path: &str) -> Result { + let file_path: PathBuf = [env!("CARGO_MANIFEST_DIR"), path].iter().collect(); + GraphWithDeletions::load_from_file(file_path) + } + + /// Saves the graph to the given path. + /// + /// Arguments: + /// path (str): The path to the graph. 
+ /// + /// Returns: + /// None + pub fn save_to_file(&self, path: &str) -> Result<(), GraphError> { + self.graph.save_to_file(Path::new(path)) + } + + /// Get bincode encoded graph + pub fn bincode<'py>(&'py self, py: Python<'py>) -> Result<&'py PyBytes, GraphError> { + let bytes = MaterializedGraph::from(self.graph.clone()).bincode()?; + Ok(PyBytes::new(py, &bytes)) + } +} diff --git a/raphtory/src/python/graph/mod.rs b/raphtory/src/python/graph/mod.rs new file mode 100644 index 0000000000..f9b42d9891 --- /dev/null +++ b/raphtory/src/python/graph/mod.rs @@ -0,0 +1,8 @@ +pub mod algorithm_result; +pub mod edge; +pub mod graph; +pub mod graph_with_deletions; +pub mod pandas; +pub mod properties; +pub mod vertex; +pub mod views; diff --git a/raphtory/src/python/graph/pandas.rs b/raphtory/src/python/graph/pandas.rs new file mode 100644 index 0000000000..1b15982231 --- /dev/null +++ b/raphtory/src/python/graph/pandas.rs @@ -0,0 +1,843 @@ +use crate::{core::utils::errors::GraphError, prelude::*}; +use arrow2::{ + array::{Array, BooleanArray, PrimitiveArray, Utf8Array}, + ffi, + types::{NativeType, Offset}, +}; +use kdam::tqdm; +use pyo3::{ + create_exception, exceptions::PyException, ffi::Py_uintptr_t, prelude::*, types::PyDict, +}; +use std::collections::HashMap; + +fn i64_opt_into_u64_opt(x: Option<&i64>) -> Option { + x.map(|x| (*x).try_into().unwrap()) +} + +pub(crate) fn process_pandas_py_df(df: &PyAny, py: Python, size: usize) -> PyResult { + let globals = PyDict::new(py); + globals.set_item("df", df)?; + let module = py.import("pyarrow")?; + let pa_table = module.getattr("Table")?; + + let table = pa_table.call_method("from_pandas", (df,), None)?; + + let rb = table.call_method0("to_batches")?.extract::>()?; + let names = if let Some(batch0) = rb.get(0) { + let schema = batch0.getattr("schema")?; + schema.getattr("names")?.extract::>()? 
+ } else { + vec![] + }; + + let arrays = tqdm!( + rb.iter().map(|rb| { + (0..names.len()) + .map(|i| { + let array = rb.call_method1("column", (i,))?; + let arr = array_to_rust(array)?; + Ok::, PyErr>(arr) + }) + .collect::, PyErr>>() + }), + desc = "Converting dataframe to Arrow", + total = size, + animation = kdam::Animation::FillUp, + unit_scale = true + ) + .collect::, PyErr>>()?; + + let df = PretendDF { names, arrays }; + Ok(df) +} + +pub(crate) fn load_vertices_from_df<'a>( + df: &'a PretendDF, + size: usize, + vertex_id: &str, + time: &str, + props: Option>, + const_props: Option>, + shared_const_props: Option>, + graph: &Graph, +) -> Result<(), GraphError> { + let prop_iter = props + .unwrap_or_default() + .into_iter() + .map(|name| lift_property(name, &df)) + .reduce(combine_prop_iters) + .unwrap_or_else(|| Box::new(std::iter::repeat(vec![]))); + + let const_prop_iter = const_props + .unwrap_or_default() + .into_iter() + .map(|name| lift_property(name, &df)) + .reduce(combine_prop_iters) + .unwrap_or_else(|| Box::new(std::iter::repeat(vec![]))); + + if let (Some(vertex_id), Some(time)) = (df.iter_col::(vertex_id), df.iter_col::(time)) + { + let iter = vertex_id.map(|i| i.copied()).zip(time); + load_vertices_from_num_iter( + graph, + size, + iter, + prop_iter, + const_prop_iter, + shared_const_props, + )?; + } else if let (Some(vertex_id), Some(time)) = + (df.iter_col::(vertex_id), df.iter_col::(time)) + { + let iter = vertex_id.map(i64_opt_into_u64_opt).zip(time); + load_vertices_from_num_iter( + graph, + size, + iter, + prop_iter, + const_prop_iter, + shared_const_props, + )?; + } else if let (Some(vertex_id), Some(time)) = + (df.utf8::(vertex_id), df.iter_col::(time)) + { + let iter = vertex_id.into_iter().zip(time); + for (((vertex_id, time), props), const_props) in tqdm!( + iter.zip(prop_iter).zip(const_prop_iter), + desc = "Loading vertices", + total = size, + animation = kdam::Animation::FillUp, + unit_scale = true + ) { + if let (Some(vertex_id), 
Some(time)) = (vertex_id, time) { + let v = graph.add_vertex(*time, vertex_id, props)?; + v.add_constant_properties(const_props)?; + if let Some(shared_const_props) = &shared_const_props { + v.add_constant_properties(shared_const_props.iter())?; + } + } + } + } else if let (Some(vertex_id), Some(time)) = + (df.utf8::(vertex_id), df.iter_col::(time)) + { + let iter = vertex_id.into_iter().zip(time); + for (((vertex_id, time), props), const_props) in tqdm!( + iter.zip(prop_iter).zip(const_prop_iter), + desc = "Loading vertices", + total = size, + animation = kdam::Animation::FillUp, + unit_scale = true + ) { + if let (Some(vertex_id), Some(time)) = (vertex_id, time) { + let v = graph.add_vertex(*time, vertex_id, props)?; + v.add_constant_properties(const_props)?; + if let Some(shared_const_props) = &shared_const_props { + v.add_constant_properties(shared_const_props)?; + } + } + } + } else { + return Err(GraphError::LoadFailure( + "vertex id column must be either u64 or text, time column must be i64".to_string(), + )); + } + + Ok(()) +} + +pub(crate) fn load_edges_from_df<'a, S: AsRef>( + df: &'a PretendDF, + size: usize, + src: &str, + dst: &str, + time: &str, + props: Option>, + const_props: Option>, + shared_const_props: Option>, + layer: Option, + layer_in_df: Option, + graph: &Graph, +) -> Result<(), GraphError> { + let prop_iter = props + .unwrap_or_default() + .into_iter() + .map(|name| lift_property(name, &df)) + .reduce(combine_prop_iters) + .unwrap_or_else(|| Box::new(std::iter::repeat(vec![]))); + + let const_prop_iter = const_props + .unwrap_or_default() + .into_iter() + .map(|name| lift_property(name, &df)) + .reduce(combine_prop_iters) + .unwrap_or_else(|| Box::new(std::iter::repeat(vec![]))); + + let layer = lift_layer(layer, layer_in_df, df); + + if let (Some(src), Some(dst), Some(time)) = ( + df.iter_col::(src), + df.iter_col::(dst), + df.iter_col::(time), + ) { + let triplets = src + .map(|i| i.copied()) + .zip(dst.map(|i| i.copied())) + .zip(time); 
+ load_edges_from_num_iter( + &graph, + size, + triplets, + prop_iter, + const_prop_iter, + shared_const_props, + layer, + )?; + } else if let (Some(src), Some(dst), Some(time)) = ( + df.iter_col::(src), + df.iter_col::(dst), + df.iter_col::(time), + ) { + let triplets = src + .map(i64_opt_into_u64_opt) + .zip(dst.map(i64_opt_into_u64_opt)) + .zip(time); + load_edges_from_num_iter( + &graph, + size, + triplets, + prop_iter, + const_prop_iter, + shared_const_props, + layer, + )?; + } else if let (Some(src), Some(dst), Some(time)) = ( + df.utf8::(src), + df.utf8::(dst), + df.iter_col::(time), + ) { + let triplets = src.into_iter().zip(dst.into_iter()).zip(time.into_iter()); + + for (((((src, dst), time), props), const_props), layer) in tqdm!( + triplets.zip(prop_iter).zip(const_prop_iter).zip(layer), + desc = "Loading edges", + total = size, + animation = kdam::Animation::FillUp, + unit_scale = true + ) { + if let (Some(src), Some(dst), Some(time)) = (src, dst, time) { + let e = graph.add_edge(*time, src, dst, props, layer.as_deref())?; + e.add_constant_properties(const_props, layer.as_deref())?; + if let Some(shared_const_props) = &shared_const_props { + e.add_constant_properties(shared_const_props.iter(), layer.as_deref())?; + } + } + } + } else if let (Some(src), Some(dst), Some(time)) = ( + df.utf8::(src), + df.utf8::(dst), + df.iter_col::(time), + ) { + let triplets = src.into_iter().zip(dst.into_iter()).zip(time.into_iter()); + for (((((src, dst), time), props), const_props), layer) in tqdm!( + triplets.zip(prop_iter).zip(const_prop_iter).zip(layer), + desc = "Loading edges", + total = size, + animation = kdam::Animation::FillUp, + unit_scale = true + ) { + if let (Some(src), Some(dst), Some(time)) = (src, dst, time) { + let e = graph.add_edge(*time, src, dst, props, layer.as_deref())?; + e.add_constant_properties(const_props, layer.as_deref())?; + if let Some(shared_const_props) = &shared_const_props { + e.add_constant_properties(shared_const_props.iter(), 
layer.as_deref())?; + } + } + } + } else { + return Err(GraphError::LoadFailure( + "source and target columns must be either u64 or text, time column must be i64" + .to_string(), + )); + } + Ok(()) +} + +pub(crate) fn load_vertex_props_from_df<'a>( + df: &'a PretendDF, + size: usize, + vertex_id: &str, + const_props: Option>, + shared_const_props: Option>, + graph: &Graph, +) -> Result<(), GraphError> { + let const_prop_iter = const_props + .unwrap_or_default() + .into_iter() + .map(|name| lift_property(name, &df)) + .reduce(combine_prop_iters) + .unwrap_or_else(|| Box::new(std::iter::repeat(vec![]))); + + if let Some(vertex_id) = df.iter_col::(vertex_id) { + let iter = vertex_id.map(|i| i.copied()); + for (vertex_id, const_props) in tqdm!( + iter.zip(const_prop_iter), + desc = "Loading vertex properties", + total = size, + animation = kdam::Animation::FillUp, + unit_scale = true + ) { + if let Some(vertex_id) = vertex_id { + let v = graph + .vertex(vertex_id) + .ok_or(GraphError::VertexIdError(vertex_id))?; + v.add_constant_properties(const_props)?; + if let Some(shared_const_props) = &shared_const_props { + v.add_constant_properties(shared_const_props.iter())?; + } + } + } + } else if let Some(vertex_id) = df.iter_col::(vertex_id) { + let iter = vertex_id.map(i64_opt_into_u64_opt); + for (vertex_id, const_props) in tqdm!( + iter.zip(const_prop_iter), + desc = "Loading vertex properties", + total = size, + animation = kdam::Animation::FillUp, + unit_scale = true + ) { + if let Some(vertex_id) = vertex_id { + let v = graph + .vertex(vertex_id) + .ok_or(GraphError::VertexIdError(vertex_id))?; + v.add_constant_properties(const_props)?; + if let Some(shared_const_props) = &shared_const_props { + v.add_constant_properties(shared_const_props.iter())?; + } + } + } + } else if let Some(vertex_id) = df.utf8::(vertex_id) { + let iter = vertex_id.into_iter(); + for (vertex_id, const_props) in tqdm!( + iter.zip(const_prop_iter), + desc = "Loading vertex properties", + total = 
size, + animation = kdam::Animation::FillUp, + unit_scale = true + ) { + if let Some(vertex_id) = vertex_id { + let v = graph + .vertex(vertex_id) + .ok_or_else(|| GraphError::VertexNameError(vertex_id.to_owned()))?; + v.add_constant_properties(const_props)?; + if let Some(shared_const_props) = &shared_const_props { + v.add_constant_properties(shared_const_props.iter())?; + } + } + } + } else if let Some(vertex_id) = df.utf8::(vertex_id) { + let iter = vertex_id.into_iter(); + for (vertex_id, const_props) in tqdm!( + iter.zip(const_prop_iter), + desc = "Loading vertex properties", + total = size, + animation = kdam::Animation::FillUp, + unit_scale = true + ) { + if let Some(vertex_id) = vertex_id { + let v = graph + .vertex(vertex_id) + .ok_or_else(|| GraphError::VertexNameError(vertex_id.to_owned()))?; + v.add_constant_properties(const_props)?; + if let Some(shared_const_props) = &shared_const_props { + v.add_constant_properties(shared_const_props.iter())?; + } + } + } + } else { + return Err(GraphError::LoadFailure( + "vertex id column must be either u64 or text, time column must be i64".to_string(), + )); + } + Ok(()) +} + +pub(crate) fn load_edges_props_from_df<'a, S: AsRef>( + df: &'a PretendDF, + size: usize, + src: &str, + dst: &str, + const_props: Option>, + shared_const_props: Option>, + layer: Option, + layer_in_df: Option, + graph: &Graph, +) -> Result<(), GraphError> { + let const_prop_iter = const_props + .unwrap_or_default() + .into_iter() + .map(|name| lift_property(name, &df)) + .reduce(combine_prop_iters) + .unwrap_or_else(|| Box::new(std::iter::repeat(vec![]))); + + let layer = lift_layer(layer, layer_in_df, df); + + if let (Some(src), Some(dst)) = (df.iter_col::(src), df.iter_col::(dst)) { + let triplets = src.map(|i| i.copied()).zip(dst.map(|i| i.copied())); + + for (((src, dst), const_props), layer) in tqdm!( + triplets.zip(const_prop_iter).zip(layer), + desc = "Loading edge properties", + total = size, + animation = kdam::Animation::FillUp, + 
unit_scale = true + ) { + if let (Some(src), Some(dst)) = (src, dst) { + let e = graph + .edge(src, dst) + .ok_or(GraphError::EdgeIdError { src, dst })?; + e.add_constant_properties(const_props, layer.as_deref())?; + if let Some(shared_const_props) = &shared_const_props { + e.add_constant_properties(shared_const_props.iter(), layer.as_deref())?; + } + } + } + } else if let (Some(src), Some(dst)) = (df.iter_col::(src), df.iter_col::(dst)) { + let triplets = src + .map(i64_opt_into_u64_opt) + .zip(dst.map(i64_opt_into_u64_opt)); + for (((src, dst), const_props), layer) in tqdm!( + triplets.zip(const_prop_iter).zip(layer), + desc = "Loading edge properties", + total = size, + animation = kdam::Animation::FillUp, + unit_scale = true + ) { + if let (Some(src), Some(dst)) = (src, dst) { + let e = graph + .edge(src, dst) + .ok_or(GraphError::EdgeIdError { src, dst })?; + e.add_constant_properties(const_props, layer.as_deref())?; + if let Some(shared_const_props) = &shared_const_props { + e.add_constant_properties(shared_const_props.iter(), layer.as_deref())?; + } + } + } + } else if let (Some(src), Some(dst)) = (df.utf8::(src), df.utf8::(dst)) { + let triplets = src.into_iter().zip(dst.into_iter()); + for (((src, dst), const_props), layer) in tqdm!( + triplets.zip(const_prop_iter).zip(layer), + desc = "Loading edge properties", + total = size, + animation = kdam::Animation::FillUp, + unit_scale = true + ) { + if let (Some(src), Some(dst)) = (src, dst) { + let e = graph + .edge(src, dst) + .ok_or_else(|| GraphError::EdgeNameError { + src: src.to_owned(), + dst: dst.to_owned(), + })?; + e.add_constant_properties(const_props, layer.as_deref())?; + if let Some(shared_const_props) = &shared_const_props { + e.add_constant_properties(shared_const_props.iter(), layer.as_deref())?; + } + } + } + } else if let (Some(src), Some(dst)) = (df.utf8::(src), df.utf8::(dst)) { + let triplets = src.into_iter().zip(dst.into_iter()); + for (((src, dst), const_props), layer) in tqdm!( + 
triplets.zip(const_prop_iter).zip(layer), + desc = "Loading edge properties", + total = size, + animation = kdam::Animation::FillUp, + unit_scale = true + ) { + if let (Some(src), Some(dst)) = (src, dst) { + let e = graph + .edge(src, dst) + .ok_or_else(|| GraphError::EdgeNameError { + src: src.to_owned(), + dst: dst.to_owned(), + })?; + e.add_constant_properties(const_props, layer.as_deref())?; + if let Some(shared_const_props) = &shared_const_props { + e.add_constant_properties(shared_const_props.iter(), layer.as_deref())?; + } + } + } + } else { + return Err(GraphError::LoadFailure( + "source and target columns must be either u64 or text, time column must be i64" + .to_string(), + )); + } + Ok(()) +} + +fn lift_property<'a: 'b, 'b>( + name: &'a str, + df: &'b PretendDF, +) -> Box> + 'b> { + if let Some(col) = df.iter_col::(name) { + iter_as_prop(name, col) + } else if let Some(col) = df.iter_col::(name) { + iter_as_prop(name, col) + } else if let Some(col) = df.iter_col::(name) { + iter_as_prop(name, col) + } else if let Some(col) = df.iter_col::(name) { + iter_as_prop(name, col) + } else if let Some(col) = df.iter_col::(name) { + iter_as_prop(name, col) + } else if let Some(col) = df.iter_col::(name) { + iter_as_prop(name, col) + } else if let Some(col) = df.bool(name) { + Box::new(col.map(move |val| { + val.into_iter() + .map(|v| (name, Prop::Bool(v))) + .collect::>() + })) + } else if let Some(col) = df.utf8::(name) { + Box::new(col.map(move |val| { + val.into_iter() + .map(|v| (name, Prop::str(v))) + .collect::>() + })) + } else if let Some(col) = df.utf8::(name) { + Box::new(col.map(move |val| { + val.into_iter() + .map(|v| (name, Prop::str(v))) + .collect::>() + })) + } else { + Box::new(std::iter::repeat(Vec::with_capacity(0))) + } +} + +fn lift_layer<'a, S: AsRef>( + layer: Option, + layer_in_df: Option, + df: &'a PretendDF, +) -> Box> + 'a> { + if let Some(layer) = layer { + //Prioritise the explicit layer set by the user + 
Box::new(std::iter::repeat(Some(layer.as_ref().to_string()))) + } else if let Some(name) = layer_in_df { + if let Some(col) = df.utf8::(name.as_ref()) { + Box::new(col.map(|v| v.map(|v| v.to_string()))) + } else if let Some(col) = df.utf8::(name.as_ref()) { + Box::new(col.map(|v| v.map(|v| v.to_string()))) + } else { + Box::new(std::iter::repeat(None)) + } + } else { + Box::new(std::iter::repeat(None)) + } +} + +fn iter_as_prop< + 'a: 'b, + 'b, + T: Into + Copy + 'static, + I: Iterator> + 'a, +>( + name: &'a str, + is: I, +) -> Box> + '_> { + Box::new(is.map(move |val| { + val.into_iter() + .map(|v| (name, (*v).into())) + .collect::>() + })) +} + +fn combine_prop_iters< + 'a, + I1: Iterator> + 'a, + I2: Iterator> + 'a, +>( + i1: I1, + i2: I2, +) -> Box> + 'a> { + Box::new(i1.zip(i2).map(|(mut v1, v2)| { + v1.extend(v2); + v1 + })) +} + +fn load_edges_from_num_iter< + 'a, + S: AsRef, + I: Iterator, Option), Option<&'a i64>)>, + PI: Iterator>, + IL: Iterator>, +>( + graph: &Graph, + size: usize, + edges: I, + props: PI, + const_props: PI, + shared_const_props: Option>, + layer: IL, +) -> Result<(), GraphError> { + for (((((src, dst), time), edge_props), const_props), layer) in tqdm!( + edges.zip(props).zip(const_props).zip(layer), + desc = "Loading edges", + total = size, + animation = kdam::Animation::FillUp, + unit_scale = true + ) { + if let (Some(src), Some(dst), Some(time)) = (src, dst, time) { + let e = graph.add_edge(*time, src, dst, edge_props, layer.as_deref())?; + e.add_constant_properties(const_props, layer.as_deref())?; + if let Some(shared_const_props) = &shared_const_props { + e.add_constant_properties(shared_const_props.iter(), layer.as_deref())?; + } + } + } + Ok(()) +} + +fn load_vertices_from_num_iter< + 'a, + S: AsRef, + I: Iterator, Option<&'a i64>)>, + PI: Iterator>, +>( + graph: &Graph, + size: usize, + vertices: I, + props: PI, + const_props: PI, + shared_const_props: Option>, +) -> Result<(), GraphError> { + for (((vertex, time), props), 
const_props) in tqdm!( + vertices.zip(props).zip(const_props), + desc = "Loading vertices", + total = size, + animation = kdam::Animation::FillUp, + unit_scale = true + ) { + if let (Some(v), Some(t), props, const_props) = (vertex, time, props, const_props) { + let v = graph.add_vertex(*t, v, props)?; + v.add_constant_properties(const_props)?; + + if let Some(shared_const_props) = &shared_const_props { + v.add_constant_properties(shared_const_props.iter())?; + } + } + } + Ok(()) +} + +pub(crate) struct PretendDF { + names: Vec, + arrays: Vec>>, +} + +impl PretendDF { + fn iter_col(&self, name: &str) -> Option> + '_> { + let idx = self.names.iter().position(|n| n == name)?; + + let _ = (&self.arrays[0])[idx] + .as_any() + .downcast_ref::>()?; + + let iter = self.arrays.iter().flat_map(move |arr| { + let arr = &arr[idx]; + let arr = arr.as_any().downcast_ref::>().unwrap(); + arr.iter() + }); + + Some(iter) + } + + fn utf8(&self, name: &str) -> Option> + '_> { + let idx = self.names.iter().position(|n| n == name)?; + // test that it's actually a utf8 array + let _ = (&self.arrays[0])[idx] + .as_any() + .downcast_ref::>()?; + + let iter = self.arrays.iter().flat_map(move |arr| { + let arr = &arr[idx]; + let arr = arr.as_any().downcast_ref::>().unwrap(); + arr.iter() + }); + + Some(iter) + } + + fn bool(&self, name: &str) -> Option> + '_> { + let idx = self.names.iter().position(|n| n == name)?; + + let _ = (&self.arrays[0])[idx] + .as_any() + .downcast_ref::()?; + + let iter = self.arrays.iter().flat_map(move |arr| { + let arr = &arr[idx]; + let arr = arr.as_any().downcast_ref::().unwrap(); + arr.iter() + }); + + Some(iter) + } +} + +pub fn array_to_rust(obj: &PyAny) -> PyResult { + // prepare a pointer to receive the Array struct + let array = Box::new(ffi::ArrowArray::empty()); + let schema = Box::new(ffi::ArrowSchema::empty()); + + let array_ptr = &*array as *const ffi::ArrowArray; + let schema_ptr = &*schema as *const ffi::ArrowSchema; + + // make the conversion 
through PyArrow's private API + // this changes the pointer's memory and is thus unsafe. In particular, `_export_to_c` can go out of bounds + obj.call_method1( + "_export_to_c", + (array_ptr as Py_uintptr_t, schema_ptr as Py_uintptr_t), + )?; + + unsafe { + let field = ffi::import_field_from_c(schema.as_ref()) + .map_err(|e| ArrowErrorException::new_err(format!("{:?}", e)))?; + let array = ffi::import_array_from_c(*array, field.data_type) + .map_err(|e| ArrowErrorException::new_err(format!("{:?}", e)))?; + Ok(array) + } +} + +pub type ArrayRef = Box; + +create_exception!(exceptions, ArrowErrorException, PyException); +create_exception!(exceptions, GraphLoadException, PyException); + +#[cfg(test)] +mod test { + use crate::{prelude::*, python::graph::pandas::load_vertices_from_df}; + + use super::{load_edges_from_df, PretendDF}; + use arrow2::array::{PrimitiveArray, Utf8Array}; + + #[test] + fn load_edges_from_pretend_df() { + let df = PretendDF { + names: vec!["src", "dst", "time", "prop1", "prop2"] + .iter() + .map(|s| s.to_string()) + .collect(), + arrays: vec![ + vec![ + Box::new(PrimitiveArray::::from(vec![Some(1)])), + Box::new(PrimitiveArray::::from(vec![Some(2)])), + Box::new(PrimitiveArray::::from(vec![Some(1)])), + Box::new(PrimitiveArray::::from(vec![Some(1.0)])), + Box::new(Utf8Array::::from(vec![Some("a")])), + ], + vec![ + Box::new(PrimitiveArray::::from(vec![Some(2), Some(3)])), + Box::new(PrimitiveArray::::from(vec![Some(3), Some(4)])), + Box::new(PrimitiveArray::::from(vec![Some(2), Some(3)])), + Box::new(PrimitiveArray::::from(vec![Some(2.0), Some(3.0)])), + Box::new(Utf8Array::::from(vec![Some("b"), Some("c")])), + ], + ], + }; + let graph = Graph::new(); + let layer: Option<&str> = None; + let layer_in_df: Option<&str> = None; + load_edges_from_df( + &df, + 5, + "src", + "dst", + "time", + Some(vec!["prop1", "prop2"]), + None, + None, + layer, + layer_in_df, + &graph, + ) + .expect("failed to load edges from pretend df"); + + let actual = graph + 
.edges() + .map(|e| { + ( + e.src().id(), + e.dst().id(), + e.latest_time(), + e.properties() + .temporal() + .get("prop1") + .and_then(|v| v.latest()), + e.properties() + .temporal() + .get("prop2") + .and_then(|v| v.latest()), + ) + }) + .collect::>(); + + assert_eq!( + actual, + vec![ + (1, 2, Some(1), Some(Prop::F64(1.0)), Some(Prop::str("a"))), + (2, 3, Some(2), Some(Prop::F64(2.0)), Some(Prop::str("b"))), + (3, 4, Some(3), Some(Prop::F64(3.0)), Some(Prop::str("c"))), + ] + ); + } + + #[test] + fn load_vertices_from_pretend_df() { + let df = PretendDF { + names: vec!["id", "name", "time"] + .iter() + .map(|s| s.to_string()) + .collect(), + arrays: vec![ + vec![ + Box::new(PrimitiveArray::::from(vec![Some(1)])), + Box::new(Utf8Array::::from(vec![Some("a")])), + Box::new(PrimitiveArray::::from(vec![Some(1)])), + ], + vec![ + Box::new(PrimitiveArray::::from(vec![Some(2)])), + Box::new(Utf8Array::::from(vec![Some("b")])), + Box::new(PrimitiveArray::::from(vec![Some(2)])), + ], + ], + }; + let graph = Graph::new(); + + load_vertices_from_df(&df, 3, "id", "time", Some(vec!["name"]), None, None, &graph) + .expect("failed to load vertices from pretend df"); + + let actual = graph + .vertices() + .iter() + .map(|v| { + ( + v.id(), + v.latest_time(), + v.properties() + .temporal() + .get("name") + .and_then(|v| v.latest()), + ) + }) + .collect::>(); + + assert_eq!( + actual, + vec![ + (1, Some(1), Some(Prop::str("a"))), + (2, Some(2), Some(Prop::str("b"))), + ] + ); + } +} diff --git a/raphtory/src/python/graph/properties/constant_props.rs b/raphtory/src/python/graph/properties/constant_props.rs new file mode 100644 index 0000000000..ca353e1b0e --- /dev/null +++ b/raphtory/src/python/graph/properties/constant_props.rs @@ -0,0 +1,255 @@ +use crate::{ + core::{ArcStr, Prop}, + db::api::{ + properties::{internal::PropertiesOps, ConstProperties}, + view::internal::Static, + }, + python::{ + graph::properties::{ + props::PyPropsComp, DynProps, PyConstPropsListListCmp, 
PyPropValueList, + PyPropValueListList, PyPropsListCmp, + }, + types::repr::{iterator_dict_repr, Repr}, + utils::PyGenericIterator, + }, +}; +use itertools::Itertools; +use pyo3::{ + exceptions::{PyKeyError, PyTypeError}, + prelude::*, +}; +use std::{collections::HashMap, sync::Arc}; + +pub type DynConstProperties = ConstProperties; + +impl From> + for DynConstProperties +{ + fn from(value: ConstProperties

) -> Self { + ConstProperties { + props: Arc::new(value.props), + } + } +} + +impl IntoPy for ConstProperties

{ + fn into_py(self, py: Python<'_>) -> PyObject { + PyConstProperties::from(self).into_py(py) + } +} + +impl Repr for ConstProperties

{ + fn repr(&self) -> String { + format!("StaticProperties({{{}}})", iterator_dict_repr(self.iter())) + } +} + +/// A view of constant properties of an entity +#[pyclass(name = "ConstProperties")] +pub struct PyConstProperties { + props: DynConstProperties, +} + +py_eq!(PyConstProperties, PyPropsComp); + +#[pymethods] +impl PyConstProperties { + /// keys() -> list[str] + /// + /// lists the available property keys + pub fn keys(&self) -> Vec { + self.props.keys() + } + + /// values() -> list[Any] + /// + /// lists the property values + pub fn values(&self) -> Vec { + self.props.values() + } + + /// items() -> list[tuple[str, Any]] + /// + /// lists the property keys together with the corresponding value + pub fn items(&self) -> Vec<(ArcStr, Prop)> { + self.props.iter().collect() + } + + /// __getitem__(key: str) -> Any + /// + /// get property value by key + /// + /// Raises: + /// KeyError: if property `key` does not exist + pub fn __getitem__(&self, key: &str) -> PyResult { + self.props + .get(key) + .ok_or(PyKeyError::new_err("No such property")) + } + + /// get(key: str) -> Any | None + /// + /// Arguments: + /// key: the name of the property + /// + /// get property value by key (returns `None` if key does not exist) + pub fn get(&self, key: &str) -> Option { + // Fixme: Add option to specify default? 
+ self.props.get(key) + } + + /// as_dict() -> dict[str, Any] + /// + /// convert the properties view to a python dict + pub fn as_dict(&self) -> HashMap { + self.props.as_map() + } + + /// __iter__() -> Iterator[str] + /// + /// iterate over property keys + pub fn __iter__(&self) -> PyGenericIterator { + self.keys().into_iter().into() + } + + /// __contains__(key: str) -> bool + /// + /// check if property `key` exists + pub fn __contains__(&self, key: &str) -> bool { + self.props.contains(key) + } + + /// __len__() -> int + /// + /// the number of properties + pub fn __len__(&self) -> usize { + self.keys().len() + } + + pub fn __repr__(&self) -> String { + self.repr() + } +} + +impl From> for PyConstProperties { + fn from(value: ConstProperties

) -> Self { + PyConstProperties { + props: ConstProperties::new(Arc::new(value.props)), + } + } +} + +impl Repr for PyConstProperties { + fn repr(&self) -> String { + self.props.repr() + } +} + +py_iterable_base!(PyConstPropsList, DynConstProperties, PyConstProperties); +py_eq!(PyConstPropsList, PyPropsListCmp); + +#[pymethods] +impl PyConstPropsList { + pub fn keys(&self) -> Vec { + self.iter().map(|p| p.keys()).kmerge().dedup().collect() + } + + pub fn values(&self) -> Vec { + self.keys() + .into_iter() + .map(|k| self.get(k).expect("key exists")) + .collect() + } + pub fn items(&self) -> Vec<(ArcStr, PyPropValueList)> { + self.keys().into_iter().zip(self.values()).collect() + } + + pub fn __getitem__(&self, key: ArcStr) -> PyResult { + self.get(key).ok_or(PyKeyError::new_err("No such property")) + } + + pub fn get(&self, key: ArcStr) -> Option { + self.__contains__(&key).then(|| { + let builder = self.builder.clone(); + let key = key.clone(); + (move || { + let key = key.clone(); + builder().map(move |p| p.get(&key)) + }) + .into() + }) + } + + pub fn __contains__(&self, key: &str) -> bool { + self.iter().any(|p| p.contains(key)) + } + + pub fn __iter__(&self) -> PyGenericIterator { + self.keys().into_iter().into() + } + + pub fn as_dict(&self) -> HashMap>> { + self.items() + .into_iter() + .map(|(k, v)| (k, v.collect())) + .collect() + } +} + +py_nested_iterable_base!(PyConstPropsListList, DynConstProperties, PyConstProperties); +py_eq!(PyConstPropsListList, PyConstPropsListListCmp); + +#[pymethods] +impl PyConstPropsListList { + pub fn keys(&self) -> Vec { + self.iter() + .flat_map(|it| it.map(|p| p.keys())) + .kmerge() + .dedup() + .collect() + } + + pub fn values(&self) -> Vec { + self.keys() + .into_iter() + .map(|k| self.get(k).expect("key exists")) + .collect() + } + pub fn items(&self) -> Vec<(ArcStr, PyPropValueListList)> { + self.keys().into_iter().zip(self.values()).collect() + } + + pub fn __getitem__(&self, key: ArcStr) -> PyResult { + 
self.get(key).ok_or(PyKeyError::new_err("No such property")) + } + + pub fn __iter__(&self) -> PyGenericIterator { + self.keys().into_iter().into() + } + + pub fn get(&self, key: ArcStr) -> Option { + self.__contains__(&key).then(|| { + let builder = self.builder.clone(); + let key = key.clone(); + (move || { + let key = key.clone(); + builder().map(move |it| { + let key = key.clone(); + it.map(move |p| p.get(&key)) + }) + }) + .into() + }) + } + + pub fn __contains__(&self, key: &str) -> bool { + self.iter().any(|mut it| it.any(|p| p.contains(key))) + } + + pub fn as_dict(&self) -> HashMap>>> { + self.items() + .into_iter() + .map(|(k, v)| (k, v.collect())) + .collect() + } +} diff --git a/raphtory/src/python/graph/properties/mod.rs b/raphtory/src/python/graph/properties/mod.rs new file mode 100644 index 0000000000..14f69c7425 --- /dev/null +++ b/raphtory/src/python/graph/properties/mod.rs @@ -0,0 +1,13 @@ +use crate::db::api::properties::internal::{InheritPropertiesOps, PropertiesOps}; +use std::sync::Arc; + +mod constant_props; +mod props; +mod temporal_props; + +pub type DynProps = Arc; +impl InheritPropertiesOps for DynProps {} + +pub use constant_props::*; +pub use props::*; +pub use temporal_props::*; diff --git a/raphtory/src/python/graph/properties/props.rs b/raphtory/src/python/graph/properties/props.rs new file mode 100644 index 0000000000..335551bd34 --- /dev/null +++ b/raphtory/src/python/graph/properties/props.rs @@ -0,0 +1,478 @@ +use crate::{ + core::{ArcStr, Prop}, + db::api::{ + properties::{internal::PropertiesOps, Properties}, + view::internal::{DynamicGraph, Static}, + }, + python::{ + graph::properties::{ + DynConstProperties, DynProps, DynTemporalProperties, PyConstProperties, + PyConstPropsList, PyConstPropsListList, PyTemporalPropsList, PyTemporalPropsListList, + }, + types::{ + repr::{iterator_dict_repr, Repr}, + wrappers::prop::PropValue, + }, + utils::PyGenericIterator, + }, +}; +use itertools::Itertools; +use pyo3::{ + 
exceptions::{PyKeyError, PyTypeError}, + prelude::*, +}; +use std::{collections::HashMap, ops::Deref, sync::Arc}; + +pub type DynProperties = Properties>; + +#[derive(PartialEq, Clone)] +pub struct PyPropsComp(HashMap); + +impl<'source> FromPyObject<'source> for PyPropsComp { + fn extract(ob: &'source PyAny) -> PyResult { + if let Ok(sp) = ob.extract::>() { + Ok(sp.deref().into()) + } else if let Ok(p) = ob.extract::>() { + Ok(p.deref().into()) + } else if let Ok(m) = ob.extract::>() { + Ok(PyPropsComp(m)) + } else { + Err(PyTypeError::new_err("not comparable with properties")) + } + } +} + +impl From<&PyConstProperties> for PyPropsComp { + fn from(value: &PyConstProperties) -> Self { + Self(value.as_dict()) + } +} + +impl From<&PyProperties> for PyPropsComp { + fn from(value: &PyProperties) -> Self { + Self(value.as_dict()) + } +} + +impl From for PyPropsComp { + fn from(value: DynConstProperties) -> Self { + Self(value.as_map()) + } +} + +impl From for PyPropsComp { + fn from(value: DynProperties) -> Self { + Self(value.as_map()) + } +} + +/// A view of the properties of an entity +#[pyclass(name = "Properties")] +pub struct PyProperties { + props: DynProperties, +} + +py_eq!(PyProperties, PyPropsComp); + +#[pymethods] +impl PyProperties { + /// Get property value. + /// + /// First searches temporal properties and returns latest value if it exists. + /// If not, it falls back to static properties. + pub fn get(&self, key: &str) -> Option { + self.props.get(key) + } + + /// Check if property `key` exists. 
+ pub fn __contains__(&self, key: &str) -> bool { + self.props.contains(key) + } + + /// gets property value if it exists, otherwise raises `KeyError` + fn __getitem__(&self, key: &str) -> PyResult { + self.props + .get(key) + .ok_or(PyKeyError::new_err("No such property")) + } + + /// iterate over property keys + fn __iter__(&self) -> PyGenericIterator { + self.keys().into_iter().into() + } + + /// number of properties + fn __len__(&self) -> usize { + self.keys().len() + } + + /// Get the names for all properties (includes temporal and static properties) + pub fn keys(&self) -> Vec { + self.props.keys().map(|k| k.clone()).collect() + } + + /// Get the values of the properties + /// + /// If a property exists as both temporal and static, temporal properties take priority with + /// fallback to the static property if the temporal value does not exist. + pub fn values(&self) -> Vec { + self.props.values().collect() + } + + /// Get a list of key-value pairs + pub fn items(&self) -> Vec<(ArcStr, Prop)> { + self.props.as_vec() + } + + /// Get a view of the temporal properties only. + #[getter] + pub fn temporal(&self) -> DynTemporalProperties { + self.props.temporal() + } + + /// Get a view of the constant properties (meta-data) only. + #[getter] + pub fn constant(&self) -> DynConstProperties { + self.props.constant() + } + + /// Convert properties view to a dict + pub fn as_dict(&self) -> HashMap { + self.props.as_map() + } +} + +impl From> + for DynProperties +{ + fn from(value: Properties

) -> Self { + Properties::new(Arc::new(value.props)) + } +} + +impl From> for DynProperties { + fn from(value: Properties) -> Self { + let props: DynProps = Arc::new(value.props); + Properties::new(props) + } +} + +impl> From

for PyProperties { + fn from(value: P) -> Self { + Self { + props: value.into(), + } + } +} + +impl IntoPy for Properties

{ + fn into_py(self, py: Python<'_>) -> PyObject { + PyProperties::from(self).into_py(py) + } +} + +impl IntoPy for Properties { + fn into_py(self, py: Python<'_>) -> PyObject { + PyProperties::from(self).into_py(py) + } +} + +impl IntoPy for DynProperties { + fn into_py(self, py: Python<'_>) -> PyObject { + PyProperties::from(self).into_py(py) + } +} + +impl Repr for Properties

{ + fn repr(&self) -> String { + format!("Properties({{{}}})", iterator_dict_repr(self.iter())) + } +} + +impl Repr for PyProperties { + fn repr(&self) -> String { + self.props.repr() + } +} + +#[derive(PartialEq, Clone)] +pub struct PyPropsListCmp(HashMap); + +impl<'source> FromPyObject<'source> for PyPropsListCmp { + fn extract(ob: &'source PyAny) -> PyResult { + if let Ok(sp) = ob.extract::>() { + Ok(sp.deref().into()) + } else if let Ok(p) = ob.extract::>() { + Ok(p.deref().into()) + } else if let Ok(m) = ob.extract::>() { + Ok(Self(m)) + } else { + Err(PyTypeError::new_err("not comparable with properties")) + } + } +} + +impl From<&PyConstPropsList> for PyPropsListCmp { + fn from(value: &PyConstPropsList) -> Self { + Self( + value + .items() + .into_iter() + .map(|(k, v)| (k, v.into())) + .collect(), + ) + } +} + +impl From<&PyPropsList> for PyPropsListCmp { + fn from(value: &PyPropsList) -> Self { + Self( + value + .items() + .into_iter() + .map(|(k, v)| (k, v.into())) + .collect(), + ) + } +} + +py_iterable_base!(PyPropsList, DynProperties, PyProperties); +py_eq!(PyPropsList, PyPropsListCmp); + +#[pymethods] +impl PyPropsList { + /// Get property value. + /// + /// First searches temporal properties and returns latest value if it exists. + /// If not, it falls back to constant properties. + pub fn get(&self, key: &str) -> Option { + self.__contains__(key).then(|| { + let builder = self.builder.clone(); + let key = Arc::new(key.to_owned()); + (move || { + let key = key.clone(); + builder().map(move |p| p.get(key.as_ref())) + }) + .into() + }) + } + + pub fn __iter__(&self) -> PyGenericIterator { + self.keys().into_iter().into() + } + + /// Check if property `key` exists. 
+ pub fn __contains__(&self, key: &str) -> bool { + self.iter().any(|p| p.contains(key)) + } + + fn __getitem__(&self, key: &str) -> PyResult { + self.get(key).ok_or(PyKeyError::new_err("No such property")) + } + + /// Get the names for all properties (includes temporal and constant properties) + pub fn keys(&self) -> Vec { + self.iter() + // FIXME: Still have to clone all those strings which sucks + .map(|p| p.keys().map(|k| k.clone()).collect_vec()) + .kmerge() + .dedup() + .collect() + } + + /// Get the values of the properties + /// + /// If a property exists as both temporal and constant, temporal properties take priority with + /// fallback to the constant property if the temporal value does not exist. + pub fn values(&self) -> PyPropValueListList { + let builder = self.builder.clone(); + let keys = Arc::new(self.keys()); + (move || { + let builder = builder.clone(); + let keys = keys.clone(); + (0..keys.len()).map(move |index| { + let builder = builder.clone(); + let keys = keys.clone(); + builder().map(move |p| { + let key = &keys[index]; + p.get(key) + }) + }) + }) + .into() + } + + /// Get a list of key-value pairs + pub fn items(&self) -> Vec<(ArcStr, PyPropValueList)> { + self.keys() + .into_iter() + .flat_map(|k| self.get(&k).map(|v| (k, v))) + .collect() + } + + /// Get a view of the temporal properties only. + #[getter] + pub fn temporal(&self) -> PyTemporalPropsList { + let builder = self.builder.clone(); + (move || builder().map(|p| p.temporal())).into() + } + + /// Get a view of the constant properties (meta-data) only. 
+ #[getter] + pub fn constant(&self) -> PyConstPropsList { + let builder = self.builder.clone(); + (move || builder().map(|p| p.constant())).into() + } + + /// Convert properties view to a dict + pub fn as_dict(&self) -> HashMap>> { + self.items() + .into_iter() + .map(|(k, v)| (k, v.collect())) + .collect() + } + + pub fn __repr__(&self) -> String { + format!( + "Properties({{{}}})", + iterator_dict_repr(self.items().into_iter()) + ) + } +} + +py_nested_iterable_base!(PyNestedPropsIterable, DynProperties, PyProperties); +py_eq!(PyNestedPropsIterable, PyConstPropsListListCmp); + +#[derive(PartialEq, Clone)] +pub struct PyConstPropsListListCmp(HashMap); + +impl<'source> FromPyObject<'source> for PyConstPropsListListCmp { + fn extract(ob: &'source PyAny) -> PyResult { + if let Ok(sp) = ob.extract::>() { + Ok(sp.deref().into()) + } else if let Ok(p) = ob.extract::>() { + Ok(p.deref().into()) + } else if let Ok(m) = ob.extract::>() { + Ok(Self(m)) + } else { + Err(PyTypeError::new_err("not comparable with properties")) + } + } +} + +impl From<&PyConstPropsListList> for PyConstPropsListListCmp { + fn from(value: &PyConstPropsListList) -> Self { + Self( + value + .items() + .into_iter() + .map(|(k, v)| (k, v.into())) + .collect(), + ) + } +} + +impl From<&PyNestedPropsIterable> for PyConstPropsListListCmp { + fn from(value: &PyNestedPropsIterable) -> Self { + Self( + value + .items() + .into_iter() + .map(|(k, v)| (k, v.into())) + .collect(), + ) + } +} + +#[pymethods] +impl PyNestedPropsIterable { + /// Get property value. + /// + /// First searches temporal properties and returns latest value if it exists. + /// If not, it falls back to constant properties. 
+ pub fn get(&self, key: &str) -> Option { + self.__contains__(key).then(|| { + let builder = self.builder.clone(); + let key = Arc::new(key.to_owned()); + (move || { + let key = key.clone(); + builder().map(move |it| { + let key = key.clone(); + it.map(move |p| p.get(key.clone().as_ref())) + }) + }) + .into() + }) + } + + /// Check if property `key` exists. + pub fn __contains__(&self, key: &str) -> bool { + self.iter().any(|mut it| it.any(|p| p.contains(key))) + } + + fn __getitem__(&self, key: &str) -> Result { + self.get(key).ok_or(PyKeyError::new_err("No such property")) + } + + /// Get the names for all properties (includes temporal and constant properties) + pub fn keys(&self) -> Vec { + self.iter() + // FIXME: Still have to clone all those strings which sucks + .flat_map(|it| it.map(|p| p.keys().map(|k| k.clone()).collect_vec())) + .kmerge() + .dedup() + .collect() + } + + pub fn __iter__(&self) -> PyGenericIterator { + self.keys().into_iter().into() + } + + /// Get the values of the properties + /// + /// If a property exists as both temporal and constant, temporal properties take priority with + /// fallback to the constant property if the temporal value does not exist. + pub fn values(&self) -> Vec { + self.keys() + .into_iter() + .flat_map(|key| self.get(&key)) + .collect() + } + + /// Get a list of key-value pairs + pub fn items(&self) -> Vec<(ArcStr, PyPropValueListList)> { + self.keys().into_iter().zip(self.values()).collect() + } + + /// Get a view of the temporal properties only. + #[getter] + pub fn temporal(&self) -> PyTemporalPropsListList { + let builder = self.builder.clone(); + (move || builder().map(|it| it.map(|p| p.temporal()))).into() + } + + /// Get a view of the constant properties (meta-data) only. 
+ #[getter] + pub fn constant(&self) -> PyConstPropsListList { + let builder = self.builder.clone(); + (move || builder().map(|it| it.map(|p| p.constant()))).into() + } + + /// Convert properties view to a dict + pub fn as_dict(&self) -> HashMap>>> { + self.items() + .into_iter() + .map(|(k, v)| (k, v.collect())) + .collect() + } +} + +py_iterable!(PyPropValueList, PropValue, PropValue); +py_iterable_comp!(PyPropValueList, PropValue, PyPropValueListCmp); + +py_nested_iterable!(PyPropValueListList, PropValue, PropValue); +py_iterable_comp!( + PyPropValueListList, + PyPropValueListCmp, + PyPropValueListListCmp +); diff --git a/raphtory/src/python/graph/properties/temporal_props.rs b/raphtory/src/python/graph/properties/temporal_props.rs new file mode 100644 index 0000000000..232a1f193d --- /dev/null +++ b/raphtory/src/python/graph/properties/temporal_props.rs @@ -0,0 +1,1268 @@ +use crate::{ + core::{utils::time::IntoTime, ArcStr, Prop}, + db::api::{ + properties::{internal::PropertiesOps, TemporalProperties, TemporalPropertyView}, + view::internal::{DynamicGraph, Static}, + }, + python::{ + graph::properties::{DynProps, PyPropValueList, PyPropValueListList}, + types::{ + repr::{iterator_dict_repr, iterator_repr, Repr}, + wrappers::{ + iterators::{NestedUsizeIterable, PropIterable, UsizeIterable}, + prop::{PropHistItems, PropValue}, + }, + }, + utils::{PyGenericIterator, PyTime}, + }, +}; +use itertools::Itertools; +use pyo3::{ + exceptions::{PyKeyError, PyTypeError}, + prelude::*, +}; +use std::{collections::HashMap, ops::Deref, sync::Arc}; + +pub type DynTemporalProperties = TemporalProperties; +pub type DynTemporalProperty = TemporalPropertyView; + +impl From> + for DynTemporalProperties +{ + fn from(value: TemporalProperties

) -> Self { + TemporalProperties::new(Arc::new(value.props)) + } +} + +impl From> for DynTemporalProperties { + fn from(value: TemporalProperties) -> Self { + let props: Arc = Arc::new(value.props); + TemporalProperties::new(props) + } +} + +impl> From

for PyTemporalProperties { + fn from(value: P) -> Self { + Self { + props: value.into(), + } + } +} + +#[derive(PartialEq)] +pub struct PyTemporalPropsCmp(HashMap); + +impl From> for PyTemporalPropsCmp { + fn from(value: HashMap) -> Self { + Self(value) + } +} + +impl From<&PyTemporalProperties> for PyTemporalPropsCmp { + fn from(value: &PyTemporalProperties) -> Self { + Self( + value + .histories() + .into_iter() + .map(|(k, v)| (k, v.into())) + .collect(), + ) + } +} + +impl<'source> FromPyObject<'source> for PyTemporalPropsCmp { + fn extract(ob: &'source PyAny) -> PyResult { + if let Ok(v) = ob.extract::>() { + Ok(PyTemporalPropsCmp::from(v.deref())) + } else if let Ok(v) = ob.extract::>() { + Ok(PyTemporalPropsCmp::from(v)) + } else { + Err(PyTypeError::new_err("cannot compare")) + } + } +} + +/// A view of the temporal properties of an entity +#[pyclass(name = "TemporalProperties")] +pub struct PyTemporalProperties { + props: DynTemporalProperties, +} + +py_eq!(PyTemporalProperties, PyTemporalPropsCmp); + +#[pymethods] +impl PyTemporalProperties { + /// List the available property keys + fn keys(&self) -> Vec { + self.props.keys().map(|k| k.clone()).collect() + } + + /// List the values of the properties + /// + /// Returns: + /// list[TemporalProp]: the list of property views + fn values(&self) -> Vec { + self.props.values().collect() + } + + /// List the property keys together with the corresponding values + fn items(&self) -> Vec<(ArcStr, DynTemporalProperty)> { + self.props.iter().map(|(k, v)| (k.clone(), v)).collect() + } + + /// Get the latest value of all properties + /// + /// Returns: + /// dict[str, Any]: the mapping of property keys to latest values + fn latest(&self) -> HashMap { + self.props + .iter_latest() + .map(|(k, v)| (k.clone(), v)) + .collect() + } + + /// Get the histories of all properties + /// + /// Returns: + /// dict[str, list[(int, Any)]]: the mapping of property keys to histories + fn histories(&self) -> HashMap> { + self.props + 
.iter() + .map(|(k, v)| (k.clone(), v.iter().collect())) + .collect() + } + + /// __getitem__(key: str) -> TemporalProp + /// + /// Get property value for `key` + /// + /// Returns: + /// the property view + /// + /// Raises: + /// KeyError: if property `key` does not exist + fn __getitem__(&self, key: &str) -> PyResult { + self.get(key).ok_or(PyKeyError::new_err("No such property")) + } + + /// get(key: str) -> Optional[TemporalProp] + /// + /// Get property value for `key` if it exists + /// + /// Returns: + /// the property view if it exists, otherwise `None` + fn get(&self, key: &str) -> Option { + // Fixme: Add option to specify default? + self.props.get(key) + } + + /// Iterator over property keys + fn __iter__(&self) -> PyGenericIterator { + self.keys().into_iter().into() + } + + /// Check if property `key` exists + fn __contains__(&self, key: &str) -> bool { + self.props.contains(key) + } + + /// The number of properties + fn __len__(&self) -> usize { + self.keys().len() + } + + fn __repr__(&self) -> String { + self.props.repr() + } +} + +/// A view of a temporal property +#[pyclass(name = "TemporalProp")] +pub struct PyTemporalProp { + prop: DynTemporalProperty, +} + +#[derive(PartialEq, Clone)] +pub struct PyTemporalPropCmp(Vec<(i64, Prop)>); + +impl<'source> FromPyObject<'source> for PyTemporalPropCmp { + fn extract(ob: &'source PyAny) -> PyResult { + if let Ok(sp) = ob.extract::>() { + Ok(sp.deref().into()) + } else if let Ok(m) = ob.extract::>() { + Ok(Self(m)) + } else { + Err(PyTypeError::new_err("not comparable")) + } + } +} + +impl From<&PyTemporalProp> for PyTemporalPropCmp { + fn from(value: &PyTemporalProp) -> Self { + Self(value.items()) + } +} + +impl From> for PyTemporalPropCmp { + fn from(value: Vec<(i64, Prop)>) -> Self { + Self(value) + } +} + +impl From for PyTemporalPropCmp { + fn from(value: DynTemporalProperty) -> Self { + PyTemporalPropCmp(value.iter().collect()) + } +} + +py_eq!(PyTemporalProp, PyTemporalPropCmp); + +#[pymethods] 
+impl PyTemporalProp { + /// Get the timestamps at which the property was updated + pub fn history(&self) -> Vec { + self.prop.history() + } + + /// Get the property values for each update + pub fn values(&self) -> Vec { + self.prop.values() + } + + /// List update timestamps and corresponding property values + pub fn items(&self) -> Vec<(i64, Prop)> { + self.prop.iter().collect() + } + + /// Iterate over `items` + pub fn __iter__(&self) -> PyGenericIterator { + self.prop.iter().into() + } + /// Get the value of the property at time `t` + pub fn at(&self, t: PyTime) -> Option { + self.prop.at(t.into_time()) + } + /// Get the latest value of the property + pub fn value(&self) -> Option { + self.prop.latest() + } + + pub fn sum(&self) -> Prop { + let mut it_iter = self.prop.iter(); + let first = it_iter.next().unwrap(); + it_iter.fold(first.1, |acc, elem| acc.add(elem.1).unwrap()) + } + + pub fn min(&self) -> (i64, Prop) { + let mut it_iter = self.prop.iter(); + let first = it_iter.next().unwrap(); + it_iter.fold(first, |acc, elem| if acc.1 <= elem.1 { acc } else { elem }) + } + + pub fn max(&self) -> (i64, Prop) { + let mut it_iter = self.prop.iter(); + let first = it_iter.next().unwrap(); + it_iter.fold(first, |acc, elem| if acc.1 >= elem.1 { acc } else { elem }) + } + + pub fn count(&self) -> usize { + self.prop.iter().count() + } + + pub fn average(&self) -> Option { + self.mean() + } + + pub fn mean(&self) -> Option { + let sum: Prop = self.sum(); + let count: usize = self.count(); + if count == 0 { + return None; + } + match sum { + Prop::I32(s) => Some(Prop::F32(s as f32 / count as f32)), + Prop::I64(s) => Some(Prop::F64(s as f64 / count as f64)), + Prop::U32(s) => Some(Prop::F32(s as f32 / count as f32)), + Prop::U8(s) => Some(Prop::F64(s as f64 / count as f64)), // needs a test + Prop::U16(s) => Some(Prop::F64(s as f64 / count as f64)), // needs a test + Prop::U64(s) => Some(Prop::F64(s as f64 / count as f64)), + Prop::F32(s) => Some(Prop::F32(s / count as 
f32)), + Prop::F64(s) => Some(Prop::F64(s / count as f64)), + _ => None, + } + } + + pub fn median(&self) -> Option<(i64, Prop)> { + let it_iter = self.prop.iter(); + let mut vec: Vec<(i64, Prop)> = it_iter.collect_vec(); + // let mut vec: Vec<(i64, Prop)> = it_iter.map(|(t, v)| (t, v.clone())).collect(); + vec.sort_by(|a, b| a.1.partial_cmp(&b.1).unwrap()); + let len = vec.len(); + if len == 0 { + return None; + } + if len % 2 == 0 { + return Some(vec[len / 2 - 1].clone()); + } + Some(vec[len / 2].clone()) + } + + pub fn __repr__(&self) -> String { + self.prop.repr() + } +} + +impl From> for PyTemporalProp { + fn from(value: TemporalPropertyView

) -> Self { + Self { + prop: TemporalPropertyView { + id: value.id, + props: Arc::new(value.props), + }, + } + } +} + +impl IntoPy + for TemporalProperties

+{ + fn into_py(self, py: Python<'_>) -> PyObject { + PyTemporalProperties::from(self).into_py(py) + } +} + +impl IntoPy for TemporalProperties { + fn into_py(self, py: Python<'_>) -> PyObject { + PyTemporalProperties::from(self).into_py(py) + } +} + +impl IntoPy for DynTemporalProperties { + fn into_py(self, py: Python<'_>) -> PyObject { + PyTemporalProperties::from(self).into_py(py) + } +} + +impl Repr for TemporalProperties

{ + fn repr(&self) -> String { + format!( + "TemporalProperties({{{}}})", + iterator_dict_repr(self.iter()) + ) + } +} + +impl Repr for TemporalPropertyView

{ + fn repr(&self) -> String { + format!("TemporalProp({})", iterator_repr(self.iter())) + } +} + +impl Repr for PyTemporalProp { + fn repr(&self) -> String { + self.prop.repr() + } +} + +impl Repr for PyTemporalProperties { + fn repr(&self) -> String { + self.props.repr() + } +} + +impl IntoPy for TemporalPropertyView

{ + fn into_py(self, py: Python<'_>) -> PyObject { + PyTemporalProp::from(self).into_py(py) + } +} + +py_iterable_base!( + PyTemporalPropsList, + DynTemporalProperties, + PyTemporalProperties +); + +#[derive(PartialEq)] +pub struct PyTemporalPropsListCmp(HashMap); + +impl From<&PyTemporalPropsList> for PyTemporalPropsListCmp { + fn from(value: &PyTemporalPropsList) -> Self { + Self( + value + .items() + .into_iter() + .map(|(k, v)| (k, v.into())) + .collect(), + ) + } +} + +impl From> for PyTemporalPropsListCmp { + fn from(value: HashMap) -> Self { + Self(value) + } +} + +impl<'source> FromPyObject<'source> for PyTemporalPropsListCmp { + fn extract(ob: &'source PyAny) -> PyResult { + if let Ok(v) = ob.extract::>() { + Ok(PyTemporalPropsListCmp::from(v.deref())) + } else if let Ok(v) = ob.extract::>() { + Ok(PyTemporalPropsListCmp::from(v)) + } else { + Err(PyTypeError::new_err("cannot compare")) + } + } +} + +py_eq!(PyTemporalPropsList, PyTemporalPropsListCmp); + +#[pymethods] +impl PyTemporalPropsList { + fn keys(&self) -> Vec { + self.iter() + // FIXME: Still have to clone all those strings which sucks + .map(|p| p.keys().map(|k| k.clone()).collect_vec()) + .kmerge() + .dedup() + .collect() + } + fn values(&self) -> Vec { + self.keys() + .into_iter() + .map(|k| self.get(k).expect("key exists")) + .collect() + } + fn items(&self) -> Vec<(ArcStr, PyTemporalPropList)> { + self.keys().into_iter().zip(self.values()).collect() + } + + fn latest(&self) -> HashMap { + let builder = self.builder.clone(); + self.keys() + .into_iter() + .map(move |k| { + let builder = builder.clone(); + let nk = k.clone(); + ( + k, + (move || { + let nk = nk.clone(); + builder().map(move |p| p.get(nk.as_ref()).and_then(|v| v.latest())) + }) + .into(), + ) + }) + .collect() + } + + fn histories(&self) -> HashMap { + self.keys() + .into_iter() + .map(|k| { + let kk = k.clone(); + let builder = self.builder.clone(); + let v = (move || { + let kk = kk.clone(); + builder().map(move |p| { + 
p.get(kk.as_ref()) + .map(|v| v.iter().collect::>()) + .unwrap_or_default() + }) + }) + .into(); + (k, v) + }) + .collect() + } + + fn __getitem__(&self, key: ArcStr) -> PyResult { + self.get(key).ok_or(PyKeyError::new_err("unknown property")) + } + + fn __contains__(&self, key: &str) -> bool { + self.iter().any(|p| p.contains(key)) + } + + fn __iter__(&self) -> PyGenericIterator { + self.keys().into_iter().into() + } + + fn get(&self, key: ArcStr) -> Option { + self.__contains__(&key).then(|| { + let builder = self.builder.clone(); + let key = key.clone(); + (move || { + let key = key.clone(); + builder().map(move |p| p.get(&key)) + }) + .into() + }) + } +} + +pub struct OptionPyTemporalProp(Option); + +#[derive(PartialEq, FromPyObject, Clone)] +pub struct OptionPyTemporalPropCmp(Option); + +impl From> for OptionPyTemporalPropCmp { + fn from(value: Option) -> Self { + OptionPyTemporalPropCmp(value.map(|v| v.into())) + } +} + +impl Repr for OptionPyTemporalProp { + fn repr(&self) -> String { + self.0.repr() + } +} + +impl IntoPy for OptionPyTemporalProp { + fn into_py(self, py: Python<'_>) -> PyObject { + self.0.into_py(py) + } +} + +impl From> for OptionPyTemporalProp { + fn from(value: Option) -> Self { + Self(value.map(|v| v.into())) + } +} + +py_iterable!( + PyTemporalPropList, + Option, + OptionPyTemporalProp +); + +py_iterable_comp!( + PyTemporalPropList, + OptionPyTemporalPropCmp, + PyTemporalPropListCmp +); + +#[pymethods] +impl PyTemporalPropList { + #[getter] + pub fn history(&self) -> PyPropHistList { + let builder = self.builder.clone(); + (move || builder().map(|p| p.map(|v| v.history()).unwrap_or_default())).into() + } + + pub fn values(&self) -> PyPropHistValueList { + let builder = self.builder.clone(); + (move || builder().map(|p| p.map(|v| v.values()).unwrap_or_default())).into() + } + + pub fn items(&self) -> PyPropHistItemsList { + let builder = self.builder.clone(); + (move || builder().map(|p| p.map(|v| 
v.iter().collect::>()).unwrap_or_default())) + .into() + } + + pub fn at(&self, t: PyTime) -> PyPropValueList { + let t = t.into_time(); + let builder = self.builder.clone(); + (move || builder().map(move |p| p.and_then(|v| v.at(t)))).into() + } + + pub fn value(&self) -> PyPropValueList { + let builder = self.builder.clone(); + (move || builder().map(|p| p.and_then(|v| v.latest()))).into() + } +} + +py_nested_iterable_base!( + PyTemporalPropsListList, + DynTemporalProperties, + PyTemporalProperties +); + +#[derive(PartialEq)] +pub struct PyTemporalPropsListListCmp(HashMap); + +impl From<&PyTemporalPropsListList> for PyTemporalPropsListListCmp { + fn from(value: &PyTemporalPropsListList) -> Self { + Self( + value + .items() + .into_iter() + .map(|(k, v)| (k, v.into())) + .collect(), + ) + } +} + +impl From> for PyTemporalPropsListListCmp { + fn from(value: HashMap) -> Self { + Self(value) + } +} + +impl<'source> FromPyObject<'source> for PyTemporalPropsListListCmp { + fn extract(ob: &'source PyAny) -> PyResult { + if let Ok(v) = ob.extract::>() { + Ok(Self::from(v.deref())) + } else if let Ok(v) = ob.extract::>() { + Ok(Self::from(v)) + } else { + Err(PyTypeError::new_err("cannot compare")) + } + } +} + +py_eq!(PyTemporalPropsListList, PyTemporalPropsListListCmp); + +#[pymethods] +impl PyTemporalPropsListList { + fn keys(&self) -> Vec { + self.iter() + .flat_map( + |it| // FIXME: Still have to clone all those strings which sucks + it.map(|p| p.keys().map(|k| k.clone()).collect_vec()), + ) + .kmerge() + .dedup() + .collect() + } + fn values(&self) -> Vec { + self.keys() + .into_iter() + .map(|k| self.get(k).expect("key exists")) + .collect() + } + fn items(&self) -> Vec<(ArcStr, PyTemporalPropListList)> { + self.keys().into_iter().zip(self.values()).collect() + } + + fn latest(&self) -> HashMap { + let builder = self.builder.clone(); + self.keys() + .into_iter() + .map(move |k| { + let builder = builder.clone(); + let nk = k.clone(); + ( + k, + (move || { + let nk = 
nk.clone(); + builder().map(move |it| { + let nk = nk.clone(); + it.map(move |p| p.get(nk.as_ref()).and_then(|v| v.latest())) + }) + }) + .into(), + ) + }) + .collect() + } + + fn histories(&self) -> HashMap { + let builder = self.builder.clone(); + self.keys() + .into_iter() + .map(move |k| { + let builder = builder.clone(); + let kk = k.clone(); + let v = (move || { + let kk = kk.clone(); + builder().map(move |it| { + let kk = kk.clone(); + it.map(move |p| { + p.get(kk.as_ref()) + .map(|v| v.iter().collect::>()) + .unwrap_or_default() + }) + }) + }) + .into(); + (k, v) + }) + .collect() + } + + fn __getitem__(&self, key: ArcStr) -> PyResult { + self.get(key).ok_or(PyKeyError::new_err("unknown property")) + } + + fn __contains__(&self, key: &str) -> bool { + self.iter().any(|mut it| it.any(|p| p.contains(key))) + } + + fn __iter__(&self) -> PyGenericIterator { + self.keys().into_iter().into() + } + + fn get(&self, key: ArcStr) -> Option { + self.__contains__(&key).then(|| { + let builder = self.builder.clone(); + let key = key.clone(); + (move || { + let key = key.clone(); + builder().map(move |it| { + let key = key.clone(); + it.map(move |p| p.get(&key)) + }) + }) + .into() + }) + } +} + +py_nested_iterable!( + PyTemporalPropListList, + Option, + OptionPyTemporalProp +); + +py_iterable_comp!( + PyTemporalPropListList, + PyTemporalPropListCmp, + PyTemporalPropListListCmp +); + +#[pymethods] +impl PyTemporalPropListList { + #[getter] + pub fn history(&self) -> PyPropHistListList { + let builder = self.builder.clone(); + (move || builder().map(|it| it.map(|p| p.map(|v| v.history()).unwrap_or_default()))).into() + } + + pub fn values(&self) -> PyPropHistValueListList { + let builder = self.builder.clone(); + (move || builder().map(|it| it.map(|p| p.map(|v| v.values()).unwrap_or_default()))).into() + } + + pub fn items(&self) -> PyPropHistItemsListList { + let builder = self.builder.clone(); + (move || { + builder() + .map(|it| it.map(|p| p.map(|v| 
v.iter().collect::>()).unwrap_or_default())) + }) + .into() + } + + pub fn at(&self, t: PyTime) -> PyPropValueListList { + let t = t.into_time(); + let builder = self.builder.clone(); + (move || builder().map(move |it| it.map(move |p| p.and_then(|v| v.at(t))))).into() + } + + pub fn value(&self) -> PyPropValueListList { + let builder = self.builder.clone(); + (move || builder().map(|it| it.map(|p| p.and_then(|v| v.latest())))).into() + } + + pub fn flatten(&self) -> PyTemporalPropList { + let builder = self.builder.clone(); + (move || builder().flatten()).into() + } +} + +#[pymethods] +impl PyPropHistValueListList { + pub fn flatten(&self) -> PyPropHistValueList { + let builder = self.builder.clone(); + (move || builder().flatten()).into() + } + + pub fn count(&self) -> NestedUsizeIterable { + let builder = self.builder.clone(); + (move || builder().map(|it| it.map(|itit| itit.len()))).into() + } + + pub fn median(&self) -> PyPropValueListList { + let builder = self.builder.clone(); + (move || { + builder().map(|it| { + it.map(|itit| { + let mut sorted: Vec = itit.into_iter().collect(); + sorted.sort_by(|a, b| a.partial_cmp(b).unwrap_or(std::cmp::Ordering::Equal)); + let len = sorted.len(); + match len { + 0 => None, + 1 => Some(sorted[0].clone()), + _ => { + let a = &sorted[len / 2]; + Some(a.clone()) + } + } + }) + }) + }) + .into() + } + + pub fn sum(&self) -> PyPropValueListList { + let builder = self.builder.clone(); + (move || { + builder().map(|it| { + it.map(|itit| { + let mut itit_iter = itit.into_iter(); + let first = itit_iter.next(); + itit_iter.clone().fold(first, |acc, elem| match acc { + Some(a) => a.add(elem), + _ => None, + }) + }) + }) + }) + .into() + } + + pub fn mean(&self) -> PyPropValueListList { + let builder = self.builder.clone(); + (move || { + builder().map(|it| { + it.map(|itit| { + let mut itit_iter = itit.into_iter(); + let first = itit_iter.next(); + let sum = itit_iter.clone().fold(first, |acc, elem| match acc { + Some(a) => 
a.add(elem), + _ => Some(elem), + }); + let count = itit_iter.count(); + if count == 0 { + return None; + } + match sum { + Some(Prop::U8(s)) => Some(Prop::U8(s / count as u8)), + Some(Prop::U16(s)) => Some(Prop::U16(s / count as u16)), + Some(Prop::I32(s)) => Some(Prop::I32(s / count as i32)), + Some(Prop::I64(s)) => Some(Prop::I64(s / count as i64)), + Some(Prop::U32(s)) => Some(Prop::U32(s / count as u32)), + Some(Prop::U64(s)) => Some(Prop::U64(s / count as u64)), + Some(Prop::F32(s)) => Some(Prop::F32(s / count as f32)), + Some(Prop::F64(s)) => Some(Prop::F64(s / count as f64)), + _ => None, + } + }) + }) + }) + .into() + } +} + +#[pymethods] +impl PropIterable { + pub fn sum(&self) -> PropValue { + let mut it_iter = self.iter(); + let first = it_iter.next(); + it_iter.fold(first, |acc, elem| acc.and_then(|val| val.add(elem))) + } + + pub fn median(&self) -> PropValue { + let mut sorted: Vec = self.iter().collect(); + sorted.sort_by(|a, b| a.partial_cmp(b).unwrap_or(std::cmp::Ordering::Equal)); + let len = sorted.len(); + match len { + 0 => None, + 1 => Some(sorted[0].clone()), + _ => { + let a = &sorted[len / 2]; + Some(a.clone()) + } + } + } + + pub fn count(&self) -> usize { + self.iter().count() + } + + pub fn min(&self) -> PropValue { + let mut sorted: Vec = self.iter().collect(); + sorted.sort_by(|a, b| a.partial_cmp(b).unwrap_or(std::cmp::Ordering::Equal)); + let len = sorted.len(); + match len { + 0 => None, + _ => { + let a = &sorted[0]; + Some(a.clone()) + } + } + } + + pub fn max(&self) -> PropValue { + let mut sorted: Vec = self.iter().collect(); + sorted.sort_by(|a, b| a.partial_cmp(b).unwrap_or(std::cmp::Ordering::Equal)); + let len = sorted.len(); + match len { + 0 => None, + _ => { + let a = &sorted[len - 1]; + Some(a.clone()) + } + } + } + + pub fn average(&self) -> PropValue { + self.mean() + } + + pub fn mean(&self) -> PropValue { + let sum: PropValue = self.sum(); + let count: usize = self.iter().collect::>().len(); + if count == 0 { + 
return None; + } + match sum { + Some(Prop::U8(s)) => Some(Prop::F64(s as f64 / count as f64)), + Some(Prop::U16(s)) => Some(Prop::F64(s as f64 / count as f64)), + Some(Prop::I32(s)) => Some(Prop::F32(s as f32 / count as f32)), + Some(Prop::I64(s)) => Some(Prop::F64(s as f64 / count as f64)), + Some(Prop::U32(s)) => Some(Prop::F32(s as f32 / count as f32)), + Some(Prop::U64(s)) => Some(Prop::F64(s as f64 / count as f64)), + Some(Prop::F32(s)) => Some(Prop::F32(s / count as f32)), + Some(Prop::F64(s)) => Some(Prop::F64(s / count as f64)), + _ => None, + } + } +} + +#[pymethods] +impl PyPropHistValueList { + pub fn sum(&self) -> PyPropValueList { + let builder = self.builder.clone(); + (move || { + builder().map(|it| { + let mut it_iter = it.into_iter(); + let first = it_iter.next(); + it_iter.fold(first, |acc, elem| acc.and_then(|val| val.add(elem))) + }) + }) + .into() + } + + pub fn min(&self) -> PyPropValueList { + let builder = self.builder.clone(); + (move || { + builder().map(|it| { + let mut it_iter = it.into_iter(); + let first = it_iter.next(); + it_iter.fold(first, |a, b| { + match PartialOrd::partial_cmp(&a, &Some(b.clone())) { + Some(std::cmp::Ordering::Less) => a, + _ => Some(b), + } + }) + }) + }) + .into() + } + + pub fn max(&self) -> PyPropValueList { + let builder = self.builder.clone(); + (move || { + builder().map(|it| { + let mut it_iter = it.into_iter(); + let first = it_iter.next(); + it_iter.fold(first, |a, b| { + match PartialOrd::partial_cmp(&a, &Some(b.clone())) { + Some(std::cmp::Ordering::Greater) => a, + _ => Some(b), + } + }) + }) + }) + .into() + } + + pub fn median(&self) -> PyPropValueList { + let builder = self.builder.clone(); + (move || { + builder().map(|it| { + let mut sorted: Vec = it.clone(); + sorted.sort_by(|a, b| a.partial_cmp(b).unwrap_or(std::cmp::Ordering::Equal)); + let len = sorted.len(); + match len { + 0 => None, + 1 => Some(sorted[0].clone()), + _ => { + let a = &sorted[len / 2]; + Some(a.clone()) + } + } + }) + }) 
+ .into() + } + + pub fn average(&self) -> PyPropValueList { + self.mean() + } + + pub fn mean(&self) -> PyPropValueList { + let builder = self.builder.clone(); + (move || { + builder().map(|it| { + let mut it_iter = it.clone().into_iter(); + let first = it_iter.next(); + let sum = it_iter.fold(first, |acc, elem| acc.and_then(|val| val.add(elem))); + let count = it.len(); + if count == 0 { + return None; + } + match sum { + Some(Prop::U8(s)) => Some(Prop::F64(s as f64 / count as f64)), + Some(Prop::U16(s)) => Some(Prop::F64(s as f64 / count as f64)), + Some(Prop::I32(s)) => Some(Prop::F32(s as f32 / count as f32)), + Some(Prop::I64(s)) => Some(Prop::F64(s as f64 / count as f64)), + Some(Prop::U32(s)) => Some(Prop::F32(s as f32 / count as f32)), + Some(Prop::U64(s)) => Some(Prop::F64(s as f64 / count as f64)), + Some(Prop::F32(s)) => Some(Prop::F32(s / count as f32)), + Some(Prop::F64(s)) => Some(Prop::F64(s / count as f64)), + _ => None, + } + }) + }) + .into() + } + + pub fn count(&self) -> UsizeIterable { + let builder = self.builder.clone(); + (move || builder().map(|it| it.len())).into() + } + + pub fn flatten(&self) -> PropIterable { + let builder = self.builder.clone(); + (move || builder().flatten()).into() + } +} + +#[pymethods] +impl PyPropValueList { + pub fn sum(&self) -> Option { + self.iter() + .reduce(|acc, elem| match (acc, elem) { + (Some(a), Some(b)) => a.add(b), + (Some(a), None) => Some(a), + (None, Some(b)) => Some(b), + _ => None, + }) + .flatten() + } + + pub fn count(&self) -> usize { + self.iter().count() + } + + pub fn min(&self) -> PropValue { + let mut sorted: Vec = self.iter().collect(); + sorted.sort_by(|a, b| a.partial_cmp(b).unwrap_or(std::cmp::Ordering::Equal)); + let len = sorted.len(); + match len { + 0 => None, + _ => { + let a = &sorted[0]; + a.clone() + } + } + } + + pub fn max(&self) -> PropValue { + let mut sorted: Vec = self.iter().collect(); + sorted.sort_by(|a, b| a.partial_cmp(b).unwrap_or(std::cmp::Ordering::Equal)); + 
let len = sorted.len(); + match len { + 0 => None, + _ => { + let a = &sorted[len - 1]; + a.clone() + } + } + } + + pub fn drop_none(&self) -> PyPropValueList { + let builder = self.builder.clone(); + (move || builder().filter(|x| x.is_some())).into() + } + + pub fn median(&self) -> PropValue { + let mut sorted: Vec = self.iter().collect(); + sorted.sort_by(|a, b| a.partial_cmp(b).unwrap_or(std::cmp::Ordering::Equal)); + let len = sorted.len(); + match len { + 0 => None, + 1 => sorted[0].clone(), + _ => { + let a = &sorted[len / 2]; + a.clone() + } + } + } + + pub fn mean(&self) -> PropValue { + let sum: PropValue = self.sum(); + let count: usize = self.iter().collect::>().len(); + if count == 0 { + return None; + } + match sum { + Some(Prop::U8(s)) => Some(Prop::F64(s as f64 / count as f64)), + Some(Prop::U16(s)) => Some(Prop::F64(s as f64 / count as f64)), + Some(Prop::I32(s)) => Some(Prop::F32(s as f32 / count as f32)), + Some(Prop::I64(s)) => Some(Prop::F64(s as f64 / count as f64)), + Some(Prop::U32(s)) => Some(Prop::F32(s as f32 / count as f32)), + Some(Prop::U64(s)) => Some(Prop::F64(s as f64 / count as f64)), + Some(Prop::F32(s)) => Some(Prop::F32(s / count as f32)), + Some(Prop::F64(s)) => Some(Prop::F64(s / count as f64)), + _ => None, + } + } + + pub fn average(&self) -> PropValue { + self.mean() + } +} + +#[pymethods] +impl PyPropValueListList { + pub fn sum(&self) -> PyPropValueList { + let builder = self.builder.clone(); + (move || { + builder().map(|it| { + let mut it_iter = it.into_iter(); + let first = it_iter.next().flatten(); + it_iter.fold(first, |acc, elem| match (acc, elem) { + (Some(a), Some(b)) => a.add(b), + (Some(a), None) => Some(a), + (None, Some(b)) => Some(b), + _ => None, + }) + }) + }) + .into() + } + + pub fn min(&self) -> PyPropValueList { + let builder = self.builder.clone(); + (move || { + builder().map(|it| { + let mut it_iter = it.into_iter(); + let first = it_iter.next().unwrap(); + it_iter.fold(first, |a, b| { + match 
PartialOrd::partial_cmp(&a, &Some(b.clone().unwrap())) { + Some(std::cmp::Ordering::Less) => a, + _ => Some(b.clone().unwrap()), + } + }) + }) + }) + .into() + } + + pub fn max(&self) -> PyPropValueList { + let builder = self.builder.clone(); + (move || { + builder().map(|it| { + let mut it_iter = it.into_iter(); + let first = it_iter.next().unwrap(); + it_iter.fold(first, |a, b| { + match PartialOrd::partial_cmp(&a, &Some(b.clone().unwrap())) { + Some(std::cmp::Ordering::Greater) => a, + _ => Some(b.clone().unwrap()), + } + }) + }) + }) + .into() + } + + pub fn average(&self) -> PyPropValueList { + self.mean() + } + + pub fn mean(&self) -> PyPropValueList { + let builder = self.builder.clone(); + (move || { + builder().map(|mut it| { + let mut count: usize = 1; + let first = it.next().flatten(); + let sum = it.fold(first, |acc, elem| { + count += 1; + match (acc, elem) { + (Some(a), Some(b)) => a.add(b), + (Some(a), None) => Some(a), + (None, Some(b)) => Some(b), + _ => None, + } + }); + if count == 0 { + return None; + } + match sum { + Some(Prop::U8(s)) => Some(Prop::F64(s as f64 / count as f64)), + Some(Prop::U16(s)) => Some(Prop::F64(s as f64 / count as f64)), + Some(Prop::I32(s)) => Some(Prop::F32(s as f32 / count as f32)), + Some(Prop::I64(s)) => Some(Prop::F64(s as f64 / count as f64)), + Some(Prop::U32(s)) => Some(Prop::F32(s as f32 / count as f32)), + Some(Prop::U64(s)) => Some(Prop::F64(s as f64 / count as f64)), + Some(Prop::F32(s)) => Some(Prop::F32(s / count as f32)), + Some(Prop::F64(s)) => Some(Prop::F64(s / count as f64)), + _ => None, + } + }) + }) + .into() + } + + pub fn median(&self) -> PyPropValueList { + let builder = self.builder.clone(); + (move || { + builder().map(|it| { + let mut sorted: Vec = it.into_iter().collect(); + sorted.sort_by(|a, b| a.partial_cmp(b).unwrap_or(std::cmp::Ordering::Equal)); + let len = sorted.len(); + match len { + 0 => None, + 1 => sorted[0].clone(), + _ => { + let a = &sorted[len / 2]; + a.clone() + } + } + }) + 
}) + .into() + } + + pub fn flatten(&self) -> PyPropValueList { + let builder = self.builder.clone(); + (move || builder().flatten()).into() + } + + pub fn count(&self) -> UsizeIterable { + let builder = self.builder.clone(); + (move || builder().map(|it| it.count())).into() + } + + pub fn drop_none(&self) -> PyPropValueListList { + let builder = self.builder.clone(); + (move || builder().map(|it| it.filter(|x| x.is_some()))).into() + } +} + +py_iterable!(PyPropHistList, Vec); +py_iterable_comp!(PyPropHistList, Vec, PyPropHistListCmp); +py_nested_iterable!(PyPropHistListList, Vec); +py_iterable_comp!(PyPropHistListList, PyPropHistListCmp, PyPropHistListListCmp); + +py_iterable!(PyPropHistValueList, Vec); +py_iterable_comp!(PyPropHistValueList, Vec, PyPropHistValueListCmp); +py_nested_iterable!(PyPropHistValueListList, Vec); +py_iterable_comp!( + PyPropHistValueListList, + PyPropHistValueListCmp, + PropHistValueListListCmp +); + +py_iterable!(PyPropHistItemsList, PropHistItems); +py_iterable_comp!(PyPropHistItemsList, PropHistItems, PyPropHistItemsListCmp); +py_nested_iterable!(PyPropHistItemsListList, PropHistItems); +py_iterable_comp!( + PyPropHistItemsListList, + PyPropHistItemsListCmp, + PyPropHistItemsListListCmp +); diff --git a/py-raphtory/src/vertex.rs b/raphtory/src/python/graph/vertex.rs similarity index 59% rename from py-raphtory/src/vertex.rs rename to raphtory/src/python/graph/vertex.rs index 841da8fd8d..0cee2bcbb8 100644 --- a/py-raphtory/src/vertex.rs +++ b/raphtory/src/python/graph/vertex.rs @@ -1,32 +1,55 @@ //! Defines the `Vertex`, which represents a vertex in the graph. //! A vertex is a node in the graph, and can have properties and edges. //! It can also be used to navigate the graph. 
-use crate::dynamic::{DynamicGraph, IntoDynamic}; -use crate::edge::{PyEdges, PyNestedEdges}; -use crate::types::repr::{iterator_repr, Repr}; -use crate::utils::{ - at_impl, expanding_impl, extract_vertex_ref, rolling_impl, window_impl, IntoPyObject, - PyWindowSet, +use crate::{ + core::{ + entities::vertices::vertex_ref::VertexRef, + utils::{errors::GraphError, time::error::ParseTimeError}, + Prop, + }, + db::{ + api::{ + properties::Properties, + view::{ + internal::{DynamicGraph, Immutable, IntoDynamic, MaterializedGraph}, + *, + }, + }, + graph::{ + path::{PathFromGraph, PathFromVertex}, + vertex::VertexView, + vertices::Vertices, + views::{ + deletion_graph::GraphWithDeletions, layer_graph::LayeredGraph, + window_graph::WindowedGraph, + }, + }, + }, + prelude::Graph, + python::{ + graph::{ + edge::{PyEdges, PyNestedEdges}, + properties::{PyNestedPropsIterable, PyPropsList}, + }, + types::wrappers::iterators::*, + utils::{PyInterval, PyTime}, + }, + *, }; -use crate::wrappers::iterators::*; -use crate::wrappers::prop::Prop; use chrono::NaiveDateTime; use itertools::Itertools; -use pyo3::exceptions::PyIndexError; -use pyo3::prelude::*; -use pyo3::{pyclass, pymethods, PyAny, PyObject, PyRef, PyRefMut, PyResult, Python}; -use raphtory::core::vertex_ref::VertexRef; -use raphtory::db::path::{PathFromGraph, PathFromVertex}; -use raphtory::db::vertex::VertexView; -use raphtory::db::vertices::Vertices; -use raphtory::db::view_api::layer::LayerOps; -use raphtory::db::view_api::*; -use raphtory::*; -use std::collections::HashMap; -use std::sync::Arc; +use pyo3::{ + exceptions::{PyIndexError, PyKeyError}, + prelude::*, + pyclass, + pyclass::CompareOp, + pymethods, PyAny, PyObject, PyRef, PyRefMut, PyResult, Python, +}; +use python::types::repr::{iterator_repr, Repr}; +use std::{collections::HashMap, ops::Deref}; /// A vertex (or node) in the graph. 
-#[pyclass(name = "Vertex")] +#[pyclass(name = "Vertex", subclass)] #[derive(Clone)] pub struct PyVertex { vertex: VertexView, @@ -43,13 +66,6 @@ impl From> for PyVertex { } } -impl IntoPyObject for VertexView { - fn into_py_object(self) -> PyObject { - let py_version: PyVertex = self.into(); - Python::with_gil(|py| py_version.into_py(py)) - } -} - /// Converts a python vertex into a rust vertex. impl From for VertexRef { fn from(value: PyVertex) -> Self { @@ -62,11 +78,42 @@ impl From for VertexRef { /// It can also be used to navigate the graph. #[pymethods] impl PyVertex { + /// Rich Comparison for Vertex objects + pub fn __richcmp__(&self, other: PyRef, op: CompareOp) -> Py { + let py = other.py(); + match op { + CompareOp::Eq => (self.vertex.id() == other.id()).into_py(py), + CompareOp::Ne => (self.vertex.id() != other.id()).into_py(py), + _ => py.NotImplemented(), + } + } + + /// TODO: uncomment when we update to py03 0.2 + /// checks if a vertex is equal to another by their id (ids are unqiue) + /// + /// Arguments: + /// other: The other vertex to compare to. + /// + /// Returns: + /// True if the vertices are equal, false otherwise. + // pub fn __eq__(&self, other: &PyVertex) -> bool { + // self.vertex.id() == other.vertex.id() + // } + + /// Returns the hash of the vertex. + /// + /// Returns: + /// The vertex id. + pub fn __hash__(&self) -> u64 { + self.vertex.id() + } + /// Returns the id of the vertex. /// This is a unique identifier for the vertex. /// /// Returns: /// The id of the vertex as an integer. + #[getter] pub fn id(&self) -> u64 { self.vertex.id() } @@ -75,6 +122,7 @@ impl PyVertex { /// /// Returns: /// The name of the vertex as a string. + #[getter] pub fn name(&self) -> String { self.vertex.name() } @@ -86,6 +134,7 @@ impl PyVertex { /// /// Returns: /// The earliest time that the vertex exists as an integer. 
+ #[getter] pub fn earliest_time(&self) -> Option { self.vertex.earliest_time() } @@ -97,15 +146,17 @@ impl PyVertex { /// /// Returns: /// The earliest datetime that the vertex exists as an integer. + #[getter] pub fn earliest_date_time(&self) -> Option { let earliest_time = self.vertex.earliest_time()?; - Some(NaiveDateTime::from_timestamp_millis(earliest_time).unwrap()) + NaiveDateTime::from_timestamp_millis(earliest_time) } /// Returns the latest time that the vertex exists. /// /// Returns: /// The latest time that the vertex exists as an integer. + #[getter] pub fn latest_time(&self) -> Option { self.vertex.latest_time() } @@ -117,117 +168,16 @@ impl PyVertex { /// /// Returns: /// The latest datetime that the vertex exists as an integer. + #[getter] pub fn latest_date_time(&self) -> Option { let latest_time = self.vertex.latest_time()?; - Some(NaiveDateTime::from_timestamp_millis(latest_time).unwrap()) + NaiveDateTime::from_timestamp_millis(latest_time) } - /// Gets the property value of this vertex given the name of the property. - /// - /// Arguments: - /// name: The name of the property. - /// include_static: Whether to include static properties. Defaults to true. - /// - /// Returns: - /// The property value as a `Prop` object. - pub fn property(&self, name: String, include_static: Option) -> Option { - let include_static = include_static.unwrap_or(true); - self.vertex - .property(name, include_static) - .map(|prop| prop.into()) - } - - /// Returns the history of a property value of a vertex at all times - /// - /// Arguments: - /// name: The name of the property. - /// - /// Returns: - /// A list of tuples of the form (time, value) where time is an integer and value is a `Prop` object. - pub fn property_history(&self, name: String) -> Vec<(i64, Prop)> { - self.vertex - .property_history(name) - .into_iter() - .map(|(k, v)| (k, v.into())) - .collect() - } - - /// Returns all the properties of the vertex as a dictionary. 
- /// - /// Arguments: - /// include_static: Whether to include static properties. Defaults to true. - /// - /// Returns: - /// A dictionary of the form {name: value} where name is a string and value is a `Prop` object. - pub fn properties(&self, include_static: Option) -> HashMap { - let include_static = include_static.unwrap_or(true); - self.vertex - .properties(include_static) - .into_iter() - .map(|(k, v)| (k, v.into())) - .collect() - } - - /// Returns all the properties of the vertex as a dictionary including the history of each property. - /// - /// Arguments: - /// include_static: Whether to include static properties. Defaults to true. - /// - /// Returns: - /// A dictionary of the form {name: [(time, value)]} where name is a string, time is an integer, and value is a `Prop` object. - pub fn property_histories(&self) -> HashMap> { - self.vertex - .property_histories() - .into_iter() - .map(|(k, v)| (k, v.into_iter().map(|(t, p)| (t, p.into())).collect())) - .collect() - } - - /// Returns the names of all the properties of the vertex. - /// - /// Arguments: - /// include_static: Whether to include static properties. Defaults to true. - /// - /// Returns: - /// A list of strings of propert names. - pub fn property_names(&self, include_static: Option) -> Vec { - let include_static = include_static.unwrap_or(true); - self.vertex.property_names(include_static) - } - - /// Checks if a property exists on this vertex. - /// - /// Arguments: - /// name: The name of the property. - /// include_static: Whether to include static properties. Defaults to true. - /// - /// Returns: - /// True if the property exists, false otherwise. - pub fn has_property(&self, name: String, include_static: Option) -> bool { - let include_static = include_static.unwrap_or(true); - self.vertex.has_property(name, include_static) - } - - /// Checks if a static property exists on this vertex. - /// - /// Arguments: - /// name: The name of the property. 
- /// - /// Returns: - /// True if the property exists, false otherwise. - pub fn has_static_property(&self, name: String) -> bool { - self.vertex.has_static_property(name) - } - - /// Returns the static property value of this vertex given the name of the property. - /// - /// Arguments: - /// name: The name of the property. - /// - /// Returns: - /// The property value as a `Prop` object or None if the property does not exist. - pub fn static_property(&self, name: String) -> Option { - self.vertex.static_property(name).map(|prop| prop.into()) + /// The properties of the vertex + #[getter] + pub fn properties(&self) -> Properties> { + self.vertex.properties() } /// Get the degree of this vertex (i.e., the number of edges that are incident to it). @@ -258,6 +208,7 @@ impl PyVertex { /// /// Returns: /// A list of `Edge` objects. + #[getter] pub fn edges(&self) -> PyEdges { let vertex = self.vertex.clone(); (move || vertex.edges()).into() @@ -267,6 +218,7 @@ impl PyVertex { /// /// Returns: /// A list of `Edge` objects. + #[getter] pub fn in_edges(&self) -> PyEdges { let vertex = self.vertex.clone(); (move || vertex.in_edges()).into() @@ -276,6 +228,7 @@ impl PyVertex { /// /// Returns: /// A list of `Edge` objects. + #[getter] pub fn out_edges(&self) -> PyEdges { let vertex = self.vertex.clone(); (move || vertex.out_edges()).into() @@ -286,6 +239,7 @@ impl PyVertex { /// Returns: /// /// A list of `Vertex` objects. + #[getter] pub fn neighbours(&self) -> PyPathFromVertex { self.vertex.neighbours().into() } @@ -294,6 +248,7 @@ impl PyVertex { /// /// Returns: /// A list of `Vertex` objects. + #[getter] pub fn in_neighbours(&self) -> PyPathFromVertex { self.vertex.in_neighbours().into() } @@ -302,6 +257,7 @@ impl PyVertex { /// /// Returns: /// A list of `Vertex` objects. 
+ #[getter] pub fn out_neighbours(&self) -> PyPathFromVertex { self.vertex.out_neighbours().into() } @@ -312,6 +268,7 @@ impl PyVertex { /// /// Returns: /// The earliest time that this vertex is valid or None if the vertex is valid for all times. + #[getter] pub fn start(&self) -> Option { self.vertex.start() } @@ -320,15 +277,17 @@ impl PyVertex { /// /// Returns: /// The earliest datetime that this vertex is valid or None if the vertex is valid for all times. + #[getter] pub fn start_date_time(&self) -> Option { let start_time = self.vertex.start()?; - Some(NaiveDateTime::from_timestamp_millis(start_time).unwrap()) + NaiveDateTime::from_timestamp_millis(start_time) } /// Gets the latest time that this vertex is valid. /// /// Returns: /// The latest time that this vertex is valid or None if the vertex is valid for all times. + #[getter] pub fn end(&self) -> Option { self.vertex.end() } @@ -337,9 +296,10 @@ impl PyVertex { /// /// Returns: /// The latest datetime that this vertex is valid or None if the vertex is valid for all times. + #[getter] pub fn end_date_time(&self) -> Option { let end_time = self.vertex.end()?; - Some(NaiveDateTime::from_timestamp_millis(end_time).unwrap()) + NaiveDateTime::from_timestamp_millis(end_time) } /// Creates a `PyVertexWindowSet` with the given `step` size and optional `start` and `end` times, @@ -356,8 +316,11 @@ impl PyVertex { /// /// Returns: /// A `PyVertexWindowSet` object. - fn expanding(&self, step: &PyAny) -> PyResult { - expanding_impl(&self.vertex, step) + fn expanding( + &self, + step: PyInterval, + ) -> Result>, ParseTimeError> { + self.vertex.expanding(step) } /// Creates a `PyVertexWindowSet` with the given `window` size and optional `step`, `start` and `end` times, @@ -375,8 +338,12 @@ impl PyVertex { /// /// Returns: /// A `PyVertexWindowSet` object. 
- fn rolling(&self, window: &PyAny, step: Option<&PyAny>) -> PyResult { - rolling_impl(&self.vertex, window, step) + fn rolling( + &self, + window: PyInterval, + step: Option, + ) -> Result>, ParseTimeError> { + self.vertex.rolling(window, step) } /// Create a view of the vertex including all events between `t_start` (inclusive) and `t_end` (exclusive) @@ -388,8 +355,13 @@ impl PyVertex { /// Returns: /// A `PyVertex` object. #[pyo3(signature = (t_start = None, t_end = None))] - pub fn window(&self, t_start: Option<&PyAny>, t_end: Option<&PyAny>) -> PyResult { - window_impl(&self.vertex, t_start, t_end).map(|v| v.into()) + pub fn window( + &self, + t_start: Option, + t_end: Option, + ) -> VertexView> { + self.vertex + .window(t_start.unwrap_or(PyTime::MIN), t_end.unwrap_or(PyTime::MAX)) } /// Create a view of the vertex including all events at `t`. @@ -400,8 +372,8 @@ impl PyVertex { /// Returns: /// A `PyVertex` object. #[pyo3(signature = (end))] - pub fn at(&self, end: &PyAny) -> PyResult { - at_impl(&self.vertex, end).map(|v| v.into()) + pub fn at(&self, end: PyTime) -> VertexView> { + self.vertex.at(end) } #[doc = default_layer_doc_string!()] @@ -409,10 +381,16 @@ impl PyVertex { self.vertex.default_layer().into() } - #[doc = layer_doc_string!()] + #[doc = layers_doc_string!()] + #[pyo3(signature = (names))] + pub fn layers(&self, names: Vec) -> Option>> { + self.vertex.layer(names) + } + + #[doc = layers_doc_string!()] #[pyo3(signature = (name))] - pub fn layer(&self, name: &str) -> Option { - Some(self.vertex.layer(name)?.into()) + pub fn layer(&self, name: String) -> Option>> { + self.vertex.layer(name) } /// Returns the history of a vertex, including vertex additions and changes made to vertex. 
@@ -424,8 +402,11 @@ impl PyVertex { } //****** Python ******// - pub fn __getitem__(&self, name: String) -> Option { - self.property(name, Some(true)) + pub fn __getitem__(&self, name: &str) -> PyResult { + self.vertex + .properties() + .get(name) + .ok_or(PyKeyError::new_err(format!("Unknown property {}", name))) } /// Display the vertex as a string. @@ -433,28 +414,111 @@ impl PyVertex { self.repr() } } - impl Repr for PyVertex { fn repr(&self) -> String { + self.vertex.repr() + } +} + +impl Repr for VertexView { + fn repr(&self) -> String { + let earliest_time = self.earliest_time().repr(); + let latest_time = self.latest_time().repr(); let properties: String = self - .properties(Some(true)) + .properties() .iter() - .map(|(k, v)| k.to_string() + " : " + &v.to_string()) + .map(|(k, v)| format!("{}: {}", k.deref(), v)) .join(", "); - if properties.is_empty() { - format!("Vertex(name={})", self.name().trim_matches('"')) + format!( + "Vertex(name={}, earliest_time={:?}, latest_time={:?})", + self.name().trim_matches('"'), + earliest_time, + latest_time + ) } else { - let property_string: String = "{".to_owned() + &properties + "}"; format!( - "Vertex(name={}, properties={})", + "Vertex(name={}, earliest_time={:?}, latest_time={:?}, properties={})", self.name().trim_matches('"'), - property_string + earliest_time, + latest_time, + format!("{{{properties}}}") ) } } } +#[pyclass(name = "MutableVertex", extends=PyVertex)] +pub struct PyMutableVertex { + vertex: VertexView, +} + +impl Repr for PyMutableVertex { + fn repr(&self) -> String { + self.vertex.repr() + } +} + +impl From> for PyMutableVertex { + fn from(vertex: VertexView) -> Self { + Self { vertex } + } +} + +impl IntoPy for VertexView { + fn into_py(self, py: Python<'_>) -> PyObject { + PyVertex::from(self).into_py(py) + } +} + +impl IntoPy for VertexView { + fn into_py(self, py: Python<'_>) -> PyObject { + let graph: MaterializedGraph = self.graph.into(); + let vertex = self.vertex; + let vertex = 
VertexView { graph, vertex }; + vertex.into_py(py) + } +} + +impl IntoPy for VertexView { + fn into_py(self, py: Python<'_>) -> PyObject { + let graph: MaterializedGraph = self.graph.into(); + let vertex = self.vertex; + let vertex = VertexView { graph, vertex }; + vertex.into_py(py) + } +} + +impl IntoPy for VertexView { + fn into_py(self, py: Python<'_>) -> PyObject { + Py::new( + py, + (PyMutableVertex::from(self.clone()), PyVertex::from(self)), + ) + .unwrap() // I think this only fails if we are out of memory? Seems to be unavoidable! + .into_py(py) + } +} + +#[pymethods] +impl PyMutableVertex { + fn add_updates( + &self, + t: PyTime, + properties: Option>, + ) -> Result<(), GraphError> { + self.vertex.add_updates(t, properties.unwrap_or_default()) + } + + fn add_constant_properties(&self, properties: HashMap) -> Result<(), GraphError> { + self.vertex.add_constant_properties(properties) + } + + fn __repr__(&self) -> String { + self.repr() + } +} + /// A list of vertices that can be iterated over. #[pyclass(name = "Vertices")] pub struct PyVertices { @@ -469,10 +533,9 @@ impl From> for PyVertices { } } -impl IntoPyObject for Vertices { - fn into_py_object(self) -> PyObject { - let py_version: PyVertices = self.into(); - Python::with_gil(|py| py_version.into_py(py)) +impl IntoPy for Vertices { + fn into_py(self, py: Python<'_>) -> PyObject { + PyVertices::from(self).into_py(py) } } @@ -480,137 +543,219 @@ impl IntoPyObject for Vertices { /// These use all the same functions as a normal vertex except it returns a list of results. #[pymethods] impl PyVertices { + /// checks if a list of vertices is equal to another list by their idd (ids are unique) + /// + /// Arguments: + /// other: The other vertices to compare to. + /// + /// Returns: + /// True if the vertices are equal, false otherwise. 
+ fn __eq__(&self, other: &PyVertices) -> bool { + for (v1, v2) in self.vertices.iter().zip(other.vertices.iter()) { + if v1.id() != v2.id() { + return false; + } + } + true + } + + /// Returns an iterator over the vertices ids + #[getter] fn id(&self) -> U64Iterable { let vertices = self.vertices.clone(); (move || vertices.id()).into() } + /// Returns an iterator over the vertices name + #[getter] fn name(&self) -> StringIterable { let vertices = self.vertices.clone(); (move || vertices.name()).into() } + /// Returns an iterator over the vertices earliest time + #[getter] fn earliest_time(&self) -> OptionI64Iterable { let vertices = self.vertices.clone(); (move || vertices.earliest_time()).into() } + /// Returns an iterator over the vertices latest time + #[getter] fn latest_time(&self) -> OptionI64Iterable { let vertices = self.vertices.clone(); (move || vertices.latest_time()).into() } - fn property(&self, name: String, include_static: Option) -> OptionPropIterable { - let vertices = self.vertices.clone(); - (move || vertices.property(name.clone(), include_static.unwrap_or(true))).into() - } - - fn property_history(&self, name: String) -> PropHistoryIterable { - let vertices = self.vertices.clone(); - (move || vertices.property_history(name.clone())).into() - } - - fn properties(&self, include_static: Option) -> PropsIterable { - let vertices = self.vertices.clone(); - (move || vertices.properties(include_static.unwrap_or(true))).into() - } - - fn property_histories(&self) -> PropHistoriesIterable { - let vertices = self.vertices.clone(); - (move || vertices.property_histories()).into() - } - - fn property_names(&self, include_static: Option) -> StringVecIterable { - let vertices = self.vertices.clone(); - (move || vertices.property_names(include_static.unwrap_or(true))).into() - } - - fn has_property(&self, name: String, include_static: Option) -> BoolIterable { - let vertices = self.vertices.clone(); - (move || vertices.has_property(name.clone(), 
include_static.unwrap_or(true))).into() - } - - fn has_static_property(&self, name: String) -> BoolIterable { + #[getter] + fn properties(&self) -> PyPropsList { let vertices = self.vertices.clone(); - (move || vertices.has_static_property(name.clone())).into() - } - - fn static_property(&self, name: String) -> OptionPropIterable { - let vertices = self.vertices.clone(); - (move || vertices.static_property(name.clone())).into() + (move || vertices.properties()).into() } + /// Returns the number of edges of the vertices + /// + /// Returns: + /// An iterator of the number of edges of the vertices fn degree(&self) -> UsizeIterable { let vertices = self.vertices.clone(); (move || vertices.degree()).into() } + /// Returns the number of in edges of the vertices + /// + /// Returns: + /// An iterator of the number of in edges of the vertices fn in_degree(&self) -> UsizeIterable { let vertices = self.vertices.clone(); (move || vertices.in_degree()).into() } + /// Returns the number of out edges of the vertices + /// + /// Returns: + /// An iterator of the number of out edges of the vertices fn out_degree(&self) -> UsizeIterable { let vertices = self.vertices.clone(); (move || vertices.out_degree()).into() } + /// Returns the edges of the vertices + /// + /// Returns: + /// An iterator of edges of the vertices + #[getter] fn edges(&self) -> PyNestedEdges { let clone = self.vertices.clone(); (move || clone.edges()).into() } + /// Returns the in edges of the vertices + /// + /// Returns: + /// An iterator of in edges of the vertices + #[getter] fn in_edges(&self) -> PyNestedEdges { let clone = self.vertices.clone(); (move || clone.in_edges()).into() } + /// Returns the out edges of the vertices + /// + /// Returns: + /// An iterator of out edges of the vertices + #[getter] fn out_edges(&self) -> PyNestedEdges { let clone = self.vertices.clone(); (move || clone.out_edges()).into() } - fn out_neighbours(&self) -> PyPathFromGraph { - self.vertices.out_neighbours().into() + /// 
Get the neighbours of the vertices + /// + /// Returns: + /// An iterator of the neighbours of the vertices + #[getter] + fn neighbours(&self) -> PyPathFromGraph { + self.vertices.neighbours().into() } + /// Get the in neighbours of the vertices + /// + /// Returns: + /// An iterator of the in neighbours of the vertices + #[getter] fn in_neighbours(&self) -> PyPathFromGraph { self.vertices.in_neighbours().into() } - fn neighbours(&self) -> PyPathFromGraph { - self.vertices.neighbours().into() + /// Get the out neighbours of the vertices + /// + /// Returns: + /// An iterator of the out neighbours of the vertices + #[getter] + fn out_neighbours(&self) -> PyPathFromGraph { + self.vertices.out_neighbours().into() } + /// Collects all vertices into a list fn collect(&self) -> Vec { self.__iter__().into_iter().collect() } - //****** Perspective APIS ******// + //***** Perspective APIS ******// + /// Returns the start time of the vertices + #[getter] pub fn start(&self) -> Option { self.vertices.start() } + /// Returns the end time of the vertices + #[getter] pub fn end(&self) -> Option { self.vertices.end() } #[doc = window_size_doc_string!()] + #[getter] pub fn window_size(&self) -> Option { self.vertices.window_size() } - fn expanding(&self, step: &PyAny) -> PyResult { - expanding_impl(&self.vertices, step) + /// Creates a PyVertexWindowSet with the given step size using an expanding window. + /// + /// An expanding window is a window that grows by step size at each iteration. + /// This will tell you whether a vertex exists at different points in the window + /// and what its properties are at those points. 
+ /// + /// Arguments: + /// `step` - The step size of the window + /// + /// Returns: + /// A PyVertexWindowSet with the given step size and optional start and end times or an error + fn expanding( + &self, + step: PyInterval, + ) -> Result>, ParseTimeError> { + self.vertices.expanding(step) } - fn rolling(&self, window: &PyAny, step: Option<&PyAny>) -> PyResult { - rolling_impl(&self.vertices, window, step) + /// Creates a PyVertexWindowSet with the given window size and optional step using a rolling window. + /// + /// A rolling window is a window that moves forward by step size at each iteration. + /// This will tell you whether a vertex exists at different points in the window and + /// what its properties are at those points. + /// + /// Arguments: + /// `window` - The window size of the window + /// `step` - The step size of the window + /// + /// Returns: + /// A PyVertexWindowSet with the given window size and optional step size or an error + fn rolling( + &self, + window: PyInterval, + step: Option, + ) -> Result>, ParseTimeError> { + self.vertices.rolling(window, step) } + /// Create a view of the vertices including all events between t_start (inclusive) and + /// t_end (exclusive) + /// + /// Arguments: + /// `t_start` - The start time of the window + /// `t_end` - The end time of the window + /// + /// Returns: + /// A `PyVertices` object. #[pyo3(signature = (t_start = None, t_end = None))] - pub fn window(&self, t_start: Option<&PyAny>, t_end: Option<&PyAny>) -> PyResult { - window_impl(&self.vertices, t_start, t_end).map(|v| v.into()) + pub fn window( + &self, + t_start: Option, + t_end: Option, + ) -> Vertices> { + self.vertices + .window(t_start.unwrap_or(PyTime::MIN), t_end.unwrap_or(PyTime::MAX)) } /// Create a view of the vertices including all events at `t`. @@ -621,8 +766,8 @@ impl PyVertices { /// Returns: /// A `PyVertices` object. 
#[pyo3(signature = (end))] - pub fn at(&self, end: &PyAny) -> PyResult { - at_impl(&self.vertices, end).map(|v| v.into()) + pub fn at(&self, end: PyTime) -> Vertices> { + self.vertices.at(end) } #[doc = default_layer_doc_string!()] @@ -630,10 +775,10 @@ impl PyVertices { self.vertices.default_layer().into() } - #[doc = layer_doc_string!()] + #[doc = layers_doc_string!()] #[pyo3(signature = (name))] - pub fn layer(&self, name: &str) -> Option { - Some(self.vertices.layer(name)?.into()) + pub fn layer(&self, name: &str) -> Option>> { + self.vertices.layer(name) } //****** Python ******* @@ -649,16 +794,10 @@ impl PyVertices { self.vertices.is_empty() } - pub fn __getitem__(&self, vertex: &PyAny) -> PyResult { - let vref = extract_vertex_ref(vertex)?; - self.vertices.get(vref).map_or_else( - || Err(PyIndexError::new_err("Vertex does not exist")), - |v| Ok(v.into()), - ) - } - - pub fn __call__(slf: PyRef<'_, Self>) -> PyRef<'_, Self> { - slf + pub fn __getitem__(&self, vertex: VertexRef) -> PyResult> { + self.vertices + .get(vertex) + .ok_or_else(|| PyIndexError::new_err("Vertex does not exist")) } pub fn __repr__(&self) -> String { @@ -686,64 +825,34 @@ impl PyPathFromGraph { fn collect(&self) -> Vec> { self.__iter__().into_iter().map(|it| it.collect()).collect() } + #[getter] fn id(&self) -> NestedU64Iterable { let path = self.path.clone(); (move || path.id()).into() } + #[getter] fn name(&self) -> NestedStringIterable { let path = self.path.clone(); (move || path.name()).into() } + #[getter] fn earliest_time(&self) -> NestedOptionI64Iterable { let path = self.path.clone(); (move || path.earliest_time()).into() } + #[getter] fn latest_time(&self) -> NestedOptionI64Iterable { let path = self.path.clone(); (move || path.latest_time()).into() } - fn property(&self, name: String, include_static: Option) -> NestedOptionPropIterable { - let path = self.path.clone(); - (move || path.property(name.clone(), include_static.unwrap_or(true))).into() - } - - fn 
property_history(&self, name: String) -> NestedPropHistoryIterable { - let path = self.path.clone(); - (move || path.property_history(name.clone())).into() - } - - fn properties(&self, include_static: Option) -> NestedPropsIterable { - let path = self.path.clone(); - (move || path.properties(include_static.unwrap_or(true))).into() - } - - fn property_histories(&self) -> NestedPropHistoriesIterable { - let path = self.path.clone(); - (move || path.property_histories()).into() - } - - fn property_names(&self, include_static: Option) -> NestedStringVecIterable { - let path = self.path.clone(); - (move || path.property_names(include_static.unwrap_or(true))).into() - } - - fn has_property(&self, name: String, include_static: Option) -> NestedBoolIterable { + #[getter] + fn properties(&self) -> PyNestedPropsIterable { let path = self.path.clone(); - (move || path.has_property(name.clone(), include_static.unwrap_or(true))).into() - } - - fn has_static_property(&self, name: String) -> NestedBoolIterable { - let path = self.path.clone(); - (move || path.has_static_property(name.clone())).into() - } - - fn static_property(&self, name: String) -> NestedOptionPropIterable { - let path = self.path.clone(); - (move || path.static_property(name.clone())).into() + (move || path.properties()).into() } fn degree(&self) -> NestedUsizeIterable { @@ -761,58 +870,79 @@ impl PyPathFromGraph { (move || path.out_degree()).into() } + #[getter] fn edges(&self) -> PyNestedEdges { let clone = self.path.clone(); (move || clone.edges()).into() } + #[getter] fn in_edges(&self) -> PyNestedEdges { let clone = self.path.clone(); (move || clone.in_edges()).into() } + #[getter] fn out_edges(&self) -> PyNestedEdges { let clone = self.path.clone(); (move || clone.out_edges()).into() } + #[getter] fn out_neighbours(&self) -> Self { self.path.out_neighbours().into() } + #[getter] fn in_neighbours(&self) -> Self { self.path.in_neighbours().into() } + #[getter] fn neighbours(&self) -> Self { 
self.path.neighbours().into() } //****** Perspective APIS ******// + #[getter] pub fn start(&self) -> Option { self.path.start() } + #[getter] pub fn end(&self) -> Option { self.path.end() } #[doc = window_size_doc_string!()] + #[getter] pub fn window_size(&self) -> Option { self.path.window_size() } - fn expanding(&self, step: &PyAny) -> PyResult { - expanding_impl(&self.path, step) + fn expanding( + &self, + step: PyInterval, + ) -> Result>, ParseTimeError> { + self.path.expanding(step) } - fn rolling(&self, window: &PyAny, step: Option<&PyAny>) -> PyResult { - rolling_impl(&self.path, window, step) + fn rolling( + &self, + window: PyInterval, + step: Option, + ) -> Result>, ParseTimeError> { + self.path.rolling(window, step) } #[pyo3(signature = (t_start = None, t_end = None))] - pub fn window(&self, t_start: Option<&PyAny>, t_end: Option<&PyAny>) -> PyResult { - window_impl(&self.path, t_start, t_end).map(|p| p.into()) + pub fn window( + &self, + t_start: Option, + t_end: Option, + ) -> PathFromGraph> { + self.path + .window(t_start.unwrap_or(PyTime::MIN), t_end.unwrap_or(PyTime::MAX)) } /// Create a view of the vertex including all events at `t`. @@ -823,8 +953,8 @@ impl PyPathFromGraph { /// Returns: /// A `PyVertex` object. 
#[pyo3(signature = (end))] - pub fn at(&self, end: &PyAny) -> PyResult { - at_impl(&self.path, end).map(|p| p.into()) + pub fn at(&self, end: PyTime) -> PathFromGraph> { + self.path.at(end) } #[doc = default_layer_doc_string!()] @@ -832,10 +962,10 @@ impl PyPathFromGraph { self.path.default_layer().into() } - #[doc = layer_doc_string!()] + #[doc = layers_doc_string!()] #[pyo3(signature = (name))] - pub fn layer(&self, name: &str) -> Option { - Some(self.path.layer(name)?.into()) + pub fn layer(&self, name: &str) -> Option>> { + self.path.layer(name) } fn __repr__(&self) -> String { @@ -863,10 +993,9 @@ impl From> for PyPathFromGraph { } } -impl IntoPyObject for PathFromGraph { - fn into_py_object(self) -> PyObject { - let py_version: PyPathFromGraph = self.into(); - Python::with_gil(|py| py_version.into_py(py)) +impl IntoPy for PathFromGraph { + fn into_py(self, py: Python<'_>) -> PyObject { + PyPathFromGraph::from(self).into_py(py) } } @@ -887,10 +1016,9 @@ impl From> for PyPathFromVertex } } -impl IntoPyObject for PathFromVertex { - fn into_py_object(self) -> PyObject { - let py_version: PyPathFromVertex = self.into(); - Python::with_gil(|py| py_version.into_py(py)) +impl IntoPy for PathFromVertex { + fn into_py(self, py: Python<'_>) -> PyObject { + PyPathFromVertex::from(self).into_py(py) } } @@ -904,64 +1032,34 @@ impl PyPathFromVertex { self.__iter__().into_iter().collect() } + #[getter] fn id(&self) -> U64Iterable { let path = self.path.clone(); (move || path.id()).into() } + #[getter] fn name(&self) -> StringIterable { let path = self.path.clone(); (move || path.name()).into() } + #[getter] fn earliest_time(&self) -> OptionI64Iterable { let path = self.path.clone(); (move || path.earliest_time()).into() } + #[getter] fn latest_time(&self) -> OptionI64Iterable { let path = self.path.clone(); (move || path.latest_time()).into() } - fn property(&self, name: String, include_static: Option) -> OptionPropIterable { - let path = self.path.clone(); - (move || 
path.property(name.clone(), include_static.unwrap_or(true))).into() - } - - fn property_history(&self, name: String) -> PropHistoryIterable { + #[getter] + fn properties(&self) -> PyPropsList { let path = self.path.clone(); - (move || path.property_history(name.clone())).into() - } - - fn properties(&self, include_static: Option) -> PropsIterable { - let path = self.path.clone(); - (move || path.properties(include_static.unwrap_or(true))).into() - } - - fn property_histories(&self) -> PropHistoriesIterable { - let path = self.path.clone(); - (move || path.property_histories()).into() - } - - fn property_names(&self, include_static: Option) -> StringVecIterable { - let path = self.path.clone(); - (move || path.property_names(include_static.unwrap_or(true))).into() - } - - fn has_property(&self, name: String, include_static: Option) -> BoolIterable { - let path = self.path.clone(); - (move || path.has_property(name.clone(), include_static.unwrap_or(true))).into() - } - - fn has_static_property(&self, name: String) -> BoolIterable { - let path = self.path.clone(); - (move || path.has_static_property(name.clone())).into() - } - - fn static_property(&self, name: String) -> OptionPropIterable { - let path = self.path.clone(); - (move || path.static_property(name.clone())).into() + (move || path.properties()).into() } fn in_degree(&self) -> UsizeIterable { @@ -979,58 +1077,79 @@ impl PyPathFromVertex { (move || path.degree()).into() } + #[getter] fn edges(&self) -> PyEdges { let path = self.path.clone(); (move || path.edges()).into() } + #[getter] fn in_edges(&self) -> PyEdges { let path = self.path.clone(); (move || path.in_edges()).into() } + #[getter] fn out_edges(&self) -> PyEdges { let path = self.path.clone(); (move || path.out_edges()).into() } + #[getter] fn out_neighbours(&self) -> Self { self.path.out_neighbours().into() } + #[getter] fn in_neighbours(&self) -> Self { self.path.in_neighbours().into() } + #[getter] fn neighbours(&self) -> Self { 
self.path.neighbours().into() } //****** Perspective APIS ******// + #[getter] pub fn start(&self) -> Option { self.path.start() } + #[getter] pub fn end(&self) -> Option { self.path.end() } #[doc = window_size_doc_string!()] + #[getter] pub fn window_size(&self) -> Option { self.path.window_size() } - fn expanding(&self, step: &PyAny) -> PyResult { - expanding_impl(&self.path, step) + fn expanding( + &self, + step: PyInterval, + ) -> Result>, ParseTimeError> { + self.path.expanding(step) } - fn rolling(&self, window: &PyAny, step: Option<&PyAny>) -> PyResult { - rolling_impl(&self.path, window, step) + fn rolling( + &self, + window: PyInterval, + step: Option, + ) -> Result>, ParseTimeError> { + self.path.rolling(window, step) } #[pyo3(signature = (t_start = None, t_end = None))] - pub fn window(&self, t_start: Option<&PyAny>, t_end: Option<&PyAny>) -> PyResult { - window_impl(&self.path, t_start, t_end).map(|p| p.into()) + pub fn window( + &self, + t_start: Option, + t_end: Option, + ) -> PathFromVertex> { + self.path + .window(t_start.unwrap_or(PyTime::MIN), t_end.unwrap_or(PyTime::MAX)) } /// Create a view of the vertex including all events at `t`. @@ -1041,18 +1160,18 @@ impl PyPathFromVertex { /// Returns: /// A `PyVertex` object. 
#[pyo3(signature = (end))] - pub fn at(&self, end: &PyAny) -> PyResult { - at_impl(&self.path, end).map(|p| p.into()) + pub fn at(&self, end: PyTime) -> PathFromVertex> { + self.path.at(end) } pub fn default_layer(&self) -> Self { self.path.default_layer().into() } - #[doc = layer_doc_string!()] + #[doc = layers_doc_string!()] #[pyo3(signature = (name))] - pub fn layer(&self, name: &str) -> Option { - Some(self.path.layer(name)?.into()) + pub fn layer(&self, name: &str) -> Option>> { + self.path.layer(name) } fn __repr__(&self) -> String { @@ -1139,115 +1258,172 @@ impl PathIterator { } } -py_iterable!( - PyVertexIterable, - VertexView, - PyVertex, - PyVertexIterator -); +py_iterable!(PyVertexIterable, VertexView, PyVertex); #[pymethods] impl PyVertexIterable { + #[getter] fn id(&self) -> U64Iterable { let builder = self.builder.clone(); (move || builder().id()).into() } + #[getter] fn name(&self) -> StringIterable { let vertices = self.builder.clone(); (move || vertices().name()).into() } + #[getter] fn earliest_time(&self) -> OptionI64Iterable { let vertices = self.builder.clone(); (move || vertices().earliest_time()).into() } + #[getter] fn latest_time(&self) -> OptionI64Iterable { let vertices = self.builder.clone(); (move || vertices().latest_time()).into() } - fn property(&self, name: String, include_static: Option) -> OptionPropIterable { + #[getter] + fn properties(&self) -> PyPropsList { let vertices = self.builder.clone(); - (move || vertices().property(name.clone(), include_static.unwrap_or(true))).into() + (move || vertices().properties()).into() } - fn property_history(&self, name: String) -> PropHistoryIterable { + fn degree(&self) -> UsizeIterable { let vertices = self.builder.clone(); - (move || vertices().property_history(name.clone())).into() + (move || vertices().degree()).into() } - fn properties(&self, include_static: Option) -> PropsIterable { + fn in_degree(&self) -> UsizeIterable { let vertices = self.builder.clone(); - (move || 
vertices().properties(include_static.unwrap_or(true))).into() + (move || vertices().in_degree()).into() } - fn property_histories(&self) -> PropHistoriesIterable { + fn out_degree(&self) -> UsizeIterable { let vertices = self.builder.clone(); - (move || vertices().property_histories()).into() + (move || vertices().out_degree()).into() + } + + #[getter] + fn edges(&self) -> PyEdges { + let clone = self.builder.clone(); + (move || clone().edges()).into() + } + + #[getter] + fn in_edges(&self) -> PyEdges { + let clone = self.builder.clone(); + (move || clone().in_edges()).into() + } + + #[getter] + fn out_edges(&self) -> PyEdges { + let clone = self.builder.clone(); + (move || clone().out_edges()).into() + } + + #[getter] + fn out_neighbours(&self) -> Self { + let builder = self.builder.clone(); + (move || builder().out_neighbours()).into() } - fn property_names(&self, include_static: Option) -> StringVecIterable { + #[getter] + fn in_neighbours(&self) -> Self { + let builder = self.builder.clone(); + (move || builder().in_neighbours()).into() + } + + #[getter] + fn neighbours(&self) -> Self { + let builder = self.builder.clone(); + (move || builder().neighbours()).into() + } +} + +py_nested_iterable!(PyNestedVertexIterable, VertexView); + +#[pymethods] +impl PyNestedVertexIterable { + #[getter] + fn id(&self) -> NestedU64Iterable { + let builder = self.builder.clone(); + (move || builder().id()).into() + } + + #[getter] + fn name(&self) -> NestedStringIterable { let vertices = self.builder.clone(); - (move || vertices().property_names(include_static.unwrap_or(true))).into() + (move || vertices().name()).into() } - fn has_property(&self, name: String, include_static: Option) -> BoolIterable { + #[getter] + fn earliest_time(&self) -> NestedOptionI64Iterable { let vertices = self.builder.clone(); - (move || vertices().has_property(name.clone(), include_static.unwrap_or(true))).into() + (move || vertices().earliest_time()).into() } - fn has_static_property(&self, name: 
String) -> BoolIterable { + #[getter] + fn latest_time(&self) -> NestedOptionI64Iterable { let vertices = self.builder.clone(); - (move || vertices().has_static_property(name.clone())).into() + (move || vertices().latest_time()).into() } - fn static_property(&self, name: String) -> OptionPropIterable { + #[getter] + fn properties(&self) -> PyNestedPropsIterable { let vertices = self.builder.clone(); - (move || vertices().static_property(name.clone())).into() + (move || vertices().properties()).into() } - fn degree(&self) -> UsizeIterable { + fn degree(&self) -> NestedUsizeIterable { let vertices = self.builder.clone(); (move || vertices().degree()).into() } - fn in_degree(&self) -> UsizeIterable { + fn in_degree(&self) -> NestedUsizeIterable { let vertices = self.builder.clone(); (move || vertices().in_degree()).into() } - fn out_degree(&self) -> UsizeIterable { + fn out_degree(&self) -> NestedUsizeIterable { let vertices = self.builder.clone(); (move || vertices().out_degree()).into() } - fn edges(&self) -> PyEdges { + #[getter] + fn edges(&self) -> PyNestedEdges { let clone = self.builder.clone(); (move || clone().edges()).into() } - fn in_edges(&self) -> PyEdges { + #[getter] + fn in_edges(&self) -> PyNestedEdges { let clone = self.builder.clone(); (move || clone().in_edges()).into() } - fn out_edges(&self) -> PyEdges { + #[getter] + fn out_edges(&self) -> PyNestedEdges { let clone = self.builder.clone(); (move || clone().out_edges()).into() } + #[getter] fn out_neighbours(&self) -> Self { let builder = self.builder.clone(); (move || builder().out_neighbours()).into() } + #[getter] fn in_neighbours(&self) -> Self { let builder = self.builder.clone(); (move || builder().in_neighbours()).into() } + #[getter] fn neighbours(&self) -> Self { let builder = self.builder.clone(); (move || builder().neighbours()).into() diff --git a/raphtory/src/python/graph/views/graph_view.rs b/raphtory/src/python/graph/views/graph_view.rs new file mode 100644 index 
0000000000..747fe3ce2f --- /dev/null +++ b/raphtory/src/python/graph/views/graph_view.rs @@ -0,0 +1,444 @@ +//! The API for querying a view of the graph in a read-only state + +use crate::{ + core::{ + entities::vertices::vertex_ref::VertexRef, + utils::{errors::GraphError, time::error::ParseTimeError}, + ArcStr, + }, + db::{ + api::{ + properties::Properties, + view::{ + internal::{DynamicGraph, IntoDynamic, MaterializedGraph}, + LayerOps, WindowSet, + }, + }, + graph::{ + edge::EdgeView, + vertex::VertexView, + views::{ + layer_graph::LayeredGraph, vertex_subgraph::VertexSubgraph, + window_graph::WindowedGraph, + }, + }, + }, + prelude::*, + python::{ + graph::{edge::PyEdges, vertex::PyVertices}, + types::repr::Repr, + utils::{PyInterval, PyTime}, + }, + *, +}; +use chrono::prelude::*; +use itertools::Itertools; +use pyo3::{prelude::*, types::PyBytes}; +use std::ops::Deref; + +impl IntoPy for MaterializedGraph { + fn into_py(self, py: Python<'_>) -> PyObject { + match self { + MaterializedGraph::EventGraph(g) => g.into_py(py), + MaterializedGraph::PersistentGraph(g) => g.into_py(py), + } + } +} + +impl IntoPy for DynamicGraph { + fn into_py(self, py: Python<'_>) -> PyObject { + PyGraphView::from(self).into_py(py) + } +} + +impl<'source> FromPyObject<'source> for DynamicGraph { + fn extract(ob: &'source PyAny) -> PyResult { + ob.extract::>() + .map(|g| g.graph.clone()) + .or_else(|err| { + let res = ob.call_method0("bincode").map_err(|_| err)?; // return original error as probably more helpful + // assume we have a graph at this point, the res probably should not fail + let b = res.extract::<&[u8]>()?; + let g = MaterializedGraph::from_bincode(b)?; + Ok(g.into_dynamic()) + }) + } +} +/// Graph view is a read-only version of a graph at a certain point in time. + +#[pyclass(name = "GraphView", frozen, subclass)] +#[repr(C)] +pub struct PyGraphView { + pub graph: DynamicGraph, +} + +/// Graph view is a read-only version of a graph at a certain point in time. 
+impl From for PyGraphView { + fn from(value: G) -> Self { + PyGraphView { + graph: value.into_dynamic(), + } + } +} + +impl IntoPy for WindowedGraph { + fn into_py(self, py: Python<'_>) -> PyObject { + PyGraphView::from(self).into_py(py) + } +} + +impl IntoPy for LayeredGraph { + fn into_py(self, py: Python<'_>) -> PyObject { + PyGraphView::from(self).into_py(py) + } +} + +impl IntoPy for VertexSubgraph { + fn into_py(self, py: Python<'_>) -> PyObject { + PyGraphView::from(self).into_py(py) + } +} + +/// The API for querying a view of the graph in a read-only state +#[pymethods] +impl PyGraphView { + /// Return all the layer ids in the graph + #[getter] + pub fn unique_layers(&self) -> Vec { + self.graph.unique_layers().collect() + } + + //****** Metrics APIs ******// + + /// Timestamp of earliest activity in the graph + /// + /// Returns: + /// the timestamp of the earliest activity in the graph + #[getter] + pub fn earliest_time(&self) -> Option { + self.graph.earliest_time() + } + + /// DateTime of earliest activity in the graph + /// + /// Returns: + /// the datetime of the earliest activity in the graph + #[getter] + pub fn earliest_date_time(&self) -> Option { + let earliest_time = self.graph.earliest_time()?; + NaiveDateTime::from_timestamp_millis(earliest_time) + } + + /// Timestamp of latest activity in the graph + /// + /// Returns: + /// the timestamp of the latest activity in the graph + #[getter] + pub fn latest_time(&self) -> Option { + self.graph.latest_time() + } + + /// DateTime of latest activity in the graph + /// + /// Returns: + /// the datetime of the latest activity in the graph + #[getter] + pub fn latest_date_time(&self) -> Option { + let latest_time = self.graph.latest_time()?; + NaiveDateTime::from_timestamp_millis(latest_time) + } + + /// Number of edges in the graph + /// + /// Returns: + /// the number of edges in the graph + pub fn count_edges(&self) -> usize { + self.graph.count_edges() + } + + /// Number of edges in the graph + /// 
+ /// Returns: + /// the number of temporal edges in the graph + pub fn count_temporal_edges(&self) -> usize { + self.graph.count_temporal_edges() + } + + /// Number of vertices in the graph + /// + /// Returns: + /// the number of vertices in the graph + pub fn count_vertices(&self) -> usize { + self.graph.count_vertices() + } + + /// Returns true if the graph contains the specified vertex + /// + /// Arguments: + /// id (str or int): the vertex id + /// + /// Returns: + /// true if the graph contains the specified vertex, false otherwise + pub fn has_vertex(&self, id: VertexRef) -> bool { + self.graph.has_vertex(id) + } + + /// Returns true if the graph contains the specified edge + /// + /// Arguments: + /// src (str or int): the source vertex id + /// dst (str or int): the destination vertex id + /// layer (str): the edge layer (optional) + /// + /// Returns: + /// true if the graph contains the specified edge, false otherwise + #[pyo3(signature = (src, dst, layer=None))] + pub fn has_edge(&self, src: VertexRef, dst: VertexRef, layer: Option<&str>) -> bool { + self.graph.has_edge(src, dst, layer) + } + + //****** Getter APIs ******// + + /// Gets the vertex with the specified id + /// + /// Arguments: + /// id (str or int): the vertex id + /// + /// Returns: + /// the vertex with the specified id, or None if the vertex does not exist + pub fn vertex(&self, id: VertexRef) -> Option> { + self.graph.vertex(id) + } + + /// Gets the vertices in the graph + /// + /// Returns: + /// the vertices in the graph + #[getter] + pub fn vertices(&self) -> PyVertices { + self.graph.vertices().into() + } + + /// Gets the edge with the specified source and destination vertices + /// + /// Arguments: + /// src (str or int): the source vertex id + /// dst (str or int): the destination vertex id + /// layer (str): the edge layer (optional) + /// + /// Returns: + /// the edge with the specified source and destination vertices, or None if the edge does not exist + #[pyo3(signature = 
(src, dst))] + pub fn edge(&self, src: VertexRef, dst: VertexRef) -> Option> { + self.graph.edge(src, dst) + } + + /// Gets all edges in the graph + /// + /// Returns: + /// the edges in the graph + pub fn edges(&self) -> PyEdges { + let clone = self.graph.clone(); + (move || clone.edges()).into() + } + + //****** Perspective APIs ******// + + /// Returns the default start time for perspectives over the view + /// + /// Returns: + /// the default start time for perspectives over the view + #[getter] + pub fn start(&self) -> Option { + self.graph.start() + } + + /// Returns the default start datetime for perspectives over the view + /// + /// Returns: + /// the default start datetime for perspectives over the view + #[getter] + pub fn start_date_time(&self) -> Option { + let start_time = self.graph.start()?; + NaiveDateTime::from_timestamp_millis(start_time) + } + + /// Returns the default end time for perspectives over the view + /// + /// Returns: + /// the default end time for perspectives over the view + #[getter] + pub fn end(&self) -> Option { + self.graph.end() + } + + #[doc = window_size_doc_string!()] + pub fn window_size(&self) -> Option { + self.graph.window_size() + } + + /// Returns the default end datetime for perspectives over the view + /// + /// Returns: + /// the default end datetime for perspectives over the view + #[getter] + pub fn end_date_time(&self) -> Option { + let end_time = self.graph.end()?; + NaiveDateTime::from_timestamp_millis(end_time) + } + + /// Creates a `WindowSet` with the given `step` size, + /// using an expanding window. + /// + /// An expanding window is a window that grows by `step` size at each iteration. 
+ /// + /// Arguments: + /// step (int) : the amount the window grows by at each iteration + /// + /// Returns: + /// A `WindowSet` with the given `step` size + #[pyo3(signature = (step))] + fn expanding(&self, step: PyInterval) -> Result, ParseTimeError> { + self.graph.expanding(step) + } + + /// Creates a `WindowSet` with the given `window` size and optional `step`, + /// using a rolling window. + /// + /// A rolling window is a window that moves forward by `step` size at each iteration. + /// + /// Arguments: + /// window (int): the size of the window + /// step (int): the size of the step (optional) + /// + /// Returns: + /// a `WindowSet` with the given `window` size and optional `step` + fn rolling( + &self, + window: PyInterval, + step: Option, + ) -> Result, ParseTimeError> { + self.graph.rolling(window, step) + } + + /// Create a view including all events between `start` (inclusive) and `end` (exclusive) + /// + /// Arguments: + /// start (int): the start time of the window (optional) + /// end (int): the end time of the window (optional) + /// + /// Returns: + /// a view including all events between `start` (inclusive) and `end` (exclusive) + #[pyo3(signature = (start=None, end=None))] + pub fn window( + &self, + start: Option, + end: Option, + ) -> WindowedGraph { + self.graph + .window(start.unwrap_or(PyTime::MIN), end.unwrap_or(PyTime::MAX)) + } + + /// Create a view including all events until `end` (inclusive) + /// + /// Arguments: + /// end (int) : the end time of the window + /// + /// Returns: + /// a view including all events until `end` (inclusive) + #[pyo3(signature = (end))] + pub fn at(&self, end: PyTime) -> WindowedGraph { + self.graph.at(end) + } + + #[doc = 
default_layer_doc_string!()] + pub fn default_layer(&self) -> LayeredGraph { + self.graph.default_layer() + } + + #[doc = layers_doc_string!()] + #[pyo3(signature = (names))] + pub fn layers(&self, names: Vec) -> Option> { + self.graph.layer(names) + } + + #[doc = layers_doc_string!()] + #[pyo3(signature = (name))] + pub fn layer(&self, name: String) -> Option> { + self.graph.layer(name) + } + + /// Get all graph properties + /// + /// + /// Returns: + /// HashMap - Properties paired with their names + #[getter] + fn properties(&self) -> Properties { + self.graph.properties() + } + + /// Returns a subgraph given a set of vertices + /// + /// Arguments: + /// * `vertices`: set of vertices + /// + /// Returns: + /// GraphView - Returns the subgraph + fn subgraph(&self, vertices: Vec) -> VertexSubgraph { + self.graph.subgraph(vertices) + } + + /// Returns a graph clone + /// + /// Arguments: + /// + /// Returns: + /// GraphView - Returns a graph clone + fn materialize(&self) -> Result { + self.graph.materialize() + } + + /// Get bincode encoded graph + pub fn bincode<'py>(&'py self, py: Python<'py>) -> Result<&'py PyBytes, GraphError> { + let bytes = self.graph.materialize()?.bincode()?; + Ok(PyBytes::new(py, &bytes)) + } + + /// Displays the graph + pub fn __repr__(&self) -> String { + self.repr() + } +} + +impl Repr for PyGraphView { + fn repr(&self) -> String { + let num_edges = self.graph.count_edges(); + let num_vertices = self.graph.count_vertices(); + let num_temporal_edges: usize = self.graph.count_temporal_edges(); + let earliest_time = self.graph.earliest_time().repr(); + let latest_time = self.graph.latest_time().repr(); + let properties: String = self + .graph + .properties() + .iter() + .map(|(k, v)| format!("{}: {}", k.deref(), v)) + .join(", "); + if properties.is_empty() { + return format!( + "Graph(number_of_edges={:?}, number_of_vertices={:?}, number_of_temporal_edges={:?}, earliest_time={:?}, latest_time={:?})", + num_edges, num_vertices, 
num_temporal_edges, earliest_time, latest_time + ); + } else { + let property_string: String = format!("{{{properties}}}"); + return format!( + "Graph(number_of_edges={:?}, number_of_vertices={:?}, number_of_temporal_edges={:?}, earliest_time={:?}, latest_time={:?}, properties={})", + num_edges, num_vertices, num_temporal_edges, earliest_time, latest_time, property_string + ); + } + } +} diff --git a/raphtory/src/python/graph/views/mod.rs b/raphtory/src/python/graph/views/mod.rs new file mode 100644 index 0000000000..c0068a9452 --- /dev/null +++ b/raphtory/src/python/graph/views/mod.rs @@ -0,0 +1 @@ +pub mod graph_view; diff --git a/raphtory/src/python/mod.rs b/raphtory/src/python/mod.rs new file mode 100644 index 0000000000..f8ff9f5c5f --- /dev/null +++ b/raphtory/src/python/mod.rs @@ -0,0 +1,7 @@ +extern crate core; + +#[macro_use] +pub mod types; +pub mod graph; +pub mod packages; +pub mod utils; diff --git a/raphtory/src/python/packages/algorithms.rs b/raphtory/src/python/packages/algorithms.rs new file mode 100644 index 0000000000..77a8c253ca --- /dev/null +++ b/raphtory/src/python/packages/algorithms.rs @@ -0,0 +1,413 @@ +use std::collections::HashMap; + +use crate::python::graph::edge::PyDirection; +/// Implementations of various graph algorithms that can be run on a graph. 
+/// +/// To run an algorithm simply import the module and call the function with the graph as the argument +/// +use crate::{ + algorithms::{ + algorithm_result::AlgorithmResult, + balance::balance as balance_rs, + connected_components, + degree::{ + average_degree as average_degree_rs, max_in_degree as max_in_degree_rs, + max_out_degree as max_out_degree_rs, min_in_degree as min_in_degree_rs, + min_out_degree as min_out_degree_rs, + }, + directed_graph_density::directed_graph_density as directed_graph_density_rs, + hits::hits as hits_rs, + local_clustering_coefficient::local_clustering_coefficient as local_clustering_coefficient_rs, + local_triangle_count::local_triangle_count as local_triangle_count_rs, + motifs::three_node_temporal_motifs::{ + global_temporal_three_node_motif as global_temporal_three_node_motif_rs, + global_temporal_three_node_motif_general as global_temporal_three_node_motif_general_rs, + temporal_three_node_motif as local_three_node_rs, + }, + pagerank::unweighted_page_rank, + reciprocity::{ + all_local_reciprocity as all_local_reciprocity_rs, + global_reciprocity as global_reciprocity_rs, + }, + temporal_reachability::temporally_reachable_nodes as temporal_reachability_rs, + }, + core::entities::vertices::vertex_ref::VertexRef, + python::{graph::views::graph_view::PyGraphView, utils::PyInputVertex}, +}; +use ordered_float::OrderedFloat; +use pyo3::prelude::*; + +/// Local triangle count - calculates the number of triangles (a cycle of length 3) a vertex participates in. +/// +/// This function returns the number of pairs of neighbours of a given node which are themselves connected. 
+/// +/// Arguments: +/// g (Raphtory graph) : Raphtory graph, this can be directed or undirected but will be treated as undirected +/// v (int or str) : vertex id or name +/// +/// Returns: +/// triangles(int) : number of triangles associated with vertex v +/// +#[pyfunction] +pub fn local_triangle_count(g: &PyGraphView, v: VertexRef) -> Option { + local_triangle_count_rs(&g.graph, v) +} + +/// Weakly connected components -- partitions the graph into node sets which are mutually reachable by an undirected path +/// +/// This function assigns a component id to each vertex such that vertices with the same component id are mutually reachable +/// by an undirected path. +/// +/// Arguments: +/// g (Raphtory graph) : Raphtory graph +/// iter_count (int) : Maximum number of iterations to run. Note that this will terminate early if the labels converge prior to the number of iterations being reached. +/// +/// Returns: +/// AlgorithmResult : AlgorithmResult object with string keys and integer values mapping vertex names to their component ids. +#[pyfunction] +#[pyo3(signature = (g, iter_count=9223372036854775807))] +pub fn weakly_connected_components( + g: &PyGraphView, + iter_count: usize, +) -> AlgorithmResult { + connected_components::weakly_connected_components(&g.graph, iter_count, None) +} + +/// Pagerank -- pagerank centrality value of the vertices in a graph +/// +/// This function calculates the Pagerank value of each vertex in a graph. See https://en.wikipedia.org/wiki/PageRank for more information on PageRank centrality. +/// A default damping factor of 0.85 is used. This is an iterative algorithm which terminates if the sum of the absolute difference in pagerank values between iterations +/// is less than the max diff value given. +/// +/// Arguments: +/// g (Raphtory graph) : Raphtory graph +/// iter_count (int) : Maximum number of iterations to run. Note that this will terminate early if convergence is reached. 
+/// max_diff (float) : Optional parameter providing an alternative stopping condition. The algorithm will terminate if the sum of the absolute difference in pagerank values between iterations +/// is less than the max diff value given. +/// +/// Returns: +/// AlgorithmResult : AlgorithmResult with string keys and float values mapping vertex names to their pagerank value. +#[pyfunction] +#[pyo3(signature = (g, iter_count=20, max_diff=None))] +pub fn pagerank( + g: &PyGraphView, + iter_count: usize, + max_diff: Option, +) -> AlgorithmResult> { + unweighted_page_rank(&g.graph, iter_count, None, max_diff, true) +} + +/// Temporally reachable nodes -- the nodes that are reachable by a time respecting path followed out from a set of seed nodes at a starting time. +/// +/// This function starts at a set of seed nodes and follows all time respecting paths until either a) a maximum number of hops is reached, b) one of a set of +/// stop nodes is reached, or c) no further time respecting edges exist. A time respecting path is a sequence of nodes v_1, v_2, ... , v_k such that there exists +/// a sequence of edges (v_i, v_i+1, t_i) with t_i < t_i+1 for i = 1, ... , k - 1. +/// +/// Arguments: +/// g (Raphtory graph) : directed Raphtory graph +/// max_hops (int) : maximum number of hops to propagate out +/// start_time (int) : time at which to start the path (such that t_1 > start_time for any path starting from these seed nodes) +/// seed_nodes (list(str) or list(int)) : list of vertex names or ids which should be the starting nodes +/// stop_nodes (list(str) or list(int)) : nodes at which a path shouldn't go any further +/// +/// Returns: +/// AlgorithmResult : AlgorithmResult describing the nodes that are temporally reachable from the seed nodes. 
+#[pyfunction] +pub fn temporally_reachable_nodes( + g: &PyGraphView, + max_hops: usize, + start_time: i64, + seed_nodes: Vec, + stop_nodes: Option>, +) -> AlgorithmResult> { + temporal_reachability_rs(&g.graph, None, max_hops, start_time, seed_nodes, stop_nodes) +} + +/// Local clustering coefficient - measures the degree to which nodes in a graph tend to cluster together. +/// +/// The proportion of pairs of neighbours of a node who are themselves connected. +/// +/// Arguments: +/// g (Raphtory graph) : Raphtory graph, can be directed or undirected but will be treated as undirected. +/// v (int or str): vertex id or name +/// +/// Returns: +/// float : the local clustering coefficient of vertex v in g. +#[pyfunction] +pub fn local_clustering_coefficient(g: &PyGraphView, v: VertexRef) -> Option { + local_clustering_coefficient_rs(&g.graph, v) +} + +/// Graph density - measures how dense or sparse a graph is. +/// +/// The ratio of the number of directed edges in the graph to the total number of possible directed +/// edges (given by N * (N-1) where N is the number of nodes). +/// +/// Arguments: +/// g (Raphtory graph) : a directed Raphtory graph +/// +/// Returns: +/// float : Directed graph density of G. +#[pyfunction] +pub fn directed_graph_density(g: &PyGraphView) -> f32 { + directed_graph_density_rs(&g.graph) +} + +/// The average (undirected) degree of all vertices in the graph. +/// +/// Note that this treats the graph as simple and undirected and is equal to twice +/// the number of undirected edges divided by the number of nodes. +/// +/// Arguments: +/// g (Raphtory graph) : a Raphtory graph +/// +/// Returns: +/// float : the average degree of the nodes in the graph +#[pyfunction] +pub fn average_degree(g: &PyGraphView) -> f64 { + average_degree_rs(&g.graph) +} + +/// The maximum out degree of any vertex in the graph. 
+/// +/// Arguments: +/// g (Raphtory graph) : a directed Raphtory graph +/// +/// Returns: +/// int : value of the largest outdegree +#[pyfunction] +pub fn max_out_degree(g: &PyGraphView) -> usize { + max_out_degree_rs(&g.graph) +} + +/// The maximum in degree of any vertex in the graph. +/// +/// Arguments: +/// g (Raphtory graph) : a directed Raphtory graph +/// +/// Returns: +/// int : value of the largest indegree +#[pyfunction] +pub fn max_in_degree(g: &PyGraphView) -> usize { + max_in_degree_rs(&g.graph) +} + +/// The minimum out degree of any vertex in the graph. +/// +/// Arguments: +/// g (Raphtory graph) : a directed Raphtory graph +/// +/// Returns: +/// int : value of the smallest outdegree +#[pyfunction] +pub fn min_out_degree(g: &PyGraphView) -> usize { + min_out_degree_rs(&g.graph) +} + +/// The minimum in degree of any vertex in the graph. +/// +/// Arguments: +/// g (Raphtory graph) : a directed Raphtory graph +/// +/// Returns: +/// int : value of the smallest indegree +#[pyfunction] +pub fn min_in_degree(g: &PyGraphView) -> usize { + min_in_degree_rs(&g.graph) +} + +/// Reciprocity - measure of the symmetry of relationships in a graph, the global reciprocity of +/// the entire graph. +/// This calculates the number of reciprocal connections (edges that go in both directions) in a +/// graph and normalizes it by the total number of directed edges. +/// +/// Arguments: +/// g (Raphtory graph) : a directed Raphtory graph +/// +/// Returns: +/// float : reciprocity of the graph between 0 and 1. + +#[pyfunction] +pub fn global_reciprocity(g: &PyGraphView) -> f64 { + global_reciprocity_rs(&g.graph, None) +} + +/// Local reciprocity - measure of the symmetry of relationships associated with a vertex +/// +/// This measures the proportion of a vertex's outgoing edges which are reciprocated with an incoming edge. 
+/// +/// Arguments: +/// g (Raphtory graph) : a directed Raphtory graph +/// +/// Returns: +/// AlgorithmResult : AlgorithmResult with string keys and float values mapping each vertex name to its reciprocity value. +/// +#[pyfunction] +pub fn all_local_reciprocity(g: &PyGraphView) -> AlgorithmResult> { + all_local_reciprocity_rs(&g.graph, None) +} + +/// Computes the number of connected triplets within a graph +/// +/// A connected triplet (also known as a wedge, 2-hop path) is a pair of edges with one node in common. For example, the triangle made up of edges +/// A-B, B-C, C-A is formed of three connected triplets. +/// +/// Arguments: +/// g (Raphtory graph) : a Raphtory graph, treated as undirected +/// +/// Returns: +/// int : the number of triplets in the graph +#[pyfunction] +pub fn triplet_count(g: &PyGraphView) -> usize { + crate::algorithms::triplet_count::triplet_count(&g.graph, None) +} + +/// Computes the global clustering coefficient of a graph. The global clustering coefficient is +/// defined as the number of triangles in the graph divided by the number of triplets in the graph. +/// +/// Note that this is also known as transitivity and is different to the average clustering coefficient. +/// +/// Arguments: +/// g (Raphtory graph) : a Raphtory graph, treated as undirected +/// +/// Returns: +/// float : the global clustering coefficient of the graph +/// +/// See also: +/// [`Triplet Count`](triplet_count) +#[pyfunction] +pub fn global_clustering_coefficient(g: &PyGraphView) -> f64 { + crate::algorithms::clustering_coefficient::clustering_coefficient(&g.graph) +} + +/// Computes the number of three edge, up-to-three node delta-temporal motifs in the graph, using the algorithm of Paranjape et al, Motifs in Temporal Networks (2017). +/// We point the reader to this reference for more information on the algorithm and background, but provide a short summary below. 
+/// +/// Motifs included: +/// +/// Stars +/// +/// There are three classes (in the order they are outputted) of star motif on three nodes based on the switching behaviour of the edges between the two leaf nodes. +/// +/// - PRE: Stars of the form i<->j, i<->j, i<->k (ie two interactions with leaf j followed by one with leaf k) +/// - MID: Stars of the form i<->j, i<->k, i<->j (ie switching interactions from leaf j to leaf k, back to j again) +/// - POST: Stars of the form i<->j, i<->k, i<->k (ie one interaction with leaf j followed by two with leaf k) +/// +/// Within each of these classes is 8 motifs depending on the direction of the first to the last edge -- incoming "I" or outgoing "O". +/// These are enumerated in the order III, IIO, IOI, IOO, OII, OIO, OOI, OOO (like binary with "I"-0 and "O"-1). +/// +/// Two node motifs: +/// +/// Also included are two node motifs, of which there are 8 when counted from the perspective of each vertex. These are characterised by the direction of each edge, enumerated +/// in the above order. Note that for the global graph counts, each motif is counted in both directions (a single III motif for one vertex is an OOO motif for the other vertex). +/// +/// Triangles: +/// +/// There are 8 triangle motifs: +/// +/// 1. i --> j, k --> j, i --> k +/// 2. i --> j, k --> i, j --> k +/// 3. i --> j, j --> k, i --> k +/// 4. i --> j, i --> k, j --> k +/// 5. i --> j, k --> j, k --> i +/// 6. i --> j, k --> i, k --> j +/// 7. i --> j, j --> k, k --> i +/// 8. i --> j, i --> k, k --> j +/// +/// Arguments: +/// g (raphtory graph) : A directed raphtory graph +/// delta (int) - Maximum time difference between the first and last edge of the +/// motif. NB if time for edges was given as a UNIX epoch, this should be given in seconds, otherwise +/// milliseconds should be used (if edge times were given as string) +/// +/// Returns: +/// list : A 40 dimensional array with the counts of each motif, given in the same order as described above. 
Note that the two-node motif counts are symmetrical so it may be more useful just to consider the first four elements. +/// +/// Notes: +/// This is achieved by calling the local motif counting algorithm, summing the resulting arrays and dealing with overcounted motifs: the triangles (by dividing each motif count by three) and two-node motifs (dividing by two). +/// +#[pyfunction] +pub fn global_temporal_three_node_motif(g: &PyGraphView, delta: i64) -> Vec { + global_temporal_three_node_motif_rs(&g.graph, delta, None) +} + +#[pyfunction] +pub fn global_temporal_three_node_motif_multi( + g: &PyGraphView, + deltas: Vec, +) -> Vec> { + global_temporal_three_node_motif_general_rs(&g.graph, deltas, None) +} + +/// Computes the number of each type of motif that each node participates in. See global_temporal_three_node_motifs for a summary of the motifs involved. +/// +/// Arguments: +/// g (raphtory graph) : A directed raphtory graph +/// delta (int) - Maximum time difference between the first and last edge of the +/// motif. NB if time for edges was given as a UNIX epoch, this should be given in seconds, otherwise +/// milliseconds should be used (if edge times were given as string) +/// +/// Returns: +/// AlgorithmResult : An AlgorithmResult with node ids as keys and a 40d array of motif counts (in the same order as the global motif counts) with the number of each +/// motif that node participates in. +/// +/// Notes: +/// For this local count, a node is counted as participating in a motif in the following way. For star motifs, only the centre node counts +/// the motif. For two node motifs, both constituent nodes count the motif. For triangles, all three constituent nodes count the motif. 
+#[pyfunction] +pub fn local_temporal_three_node_motifs( + g: &PyGraphView, + delta: i64, +) -> HashMap> { + local_three_node_rs(&g.graph, vec![delta], None) + .into_iter() + .map(|(k, v)| (String::from(k), v[0].clone())) + .collect::>>() +} + +/// HITS (Hubs and Authority) Algorithm: +/// AuthScore of a vertex (A) = Sum of HubScore of all vertices pointing at vertex (A) from previous iteration / +/// Sum of HubScore of all vertices in the current iteration +/// +/// HubScore of a vertex (A) = Sum of AuthScore of all vertices pointing away from vertex (A) from previous iteration / +/// Sum of AuthScore of all vertices in the current iteration +/// +/// Returns +/// +/// * An AlgorithmResult object containing the mapping from vertex ID to the hub and authority score of the vertex +#[pyfunction] +#[pyo3(signature = (g, iter_count=20, threads=None))] +pub fn hits( + g: &PyGraphView, + iter_count: usize, + threads: Option, +) -> AlgorithmResult, OrderedFloat)> { + hits_rs(&g.graph, iter_count, threads) +} + +/// Sums the weights of edges in the graph based on the specified direction. +/// +/// This function computes the sum of edge weights based on the direction provided, and can be executed in parallel using a given number of threads. +/// +/// # Parameters +/// * `g` (`&PyGraphView`): The graph view on which the operation is to be performed. +/// * `name` (`String`, default = "weight"): The name of the edge property used as the weight. Defaults to "weight" if not provided. +/// * `direction` (`PyDirection`, default = `PyDirection::new("BOTH")`): Specifies the direction of the edges to be considered for summation. +/// - `PyDirection::new("OUT")`: Only consider outgoing edges. +/// - `PyDirection::new("IN")`: Only consider incoming edges. +/// - `PyDirection::new("BOTH")`: Consider both outgoing and incoming edges. This is the default. +/// * `threads` (`Option`, default = `None`): The number of threads to be used for parallel execution. 
Defaults to single-threaded operation if not provided. +/// +/// # Returns +/// `AlgorithmResult>`: A result containing a mapping of vertex names to the computed sum of their associated edge weights. +/// +#[pyfunction] +#[pyo3[signature = (g, name="weight".to_string(), direction=PyDirection::new("BOTH"), threads=None)]] +pub fn balance( + g: &PyGraphView, + name: String, + direction: PyDirection, + threads: Option, +) -> AlgorithmResult> { + balance_rs(&g.graph, name.clone(), direction.into(), threads) +} diff --git a/py-raphtory/src/graph_gen.rs b/raphtory/src/python/packages/graph_gen.rs similarity index 91% rename from py-raphtory/src/graph_gen.rs rename to raphtory/src/python/packages/graph_gen.rs index d96ba28f74..cb38b93ed6 100644 --- a/py-raphtory/src/graph_gen.rs +++ b/raphtory/src/python/packages/graph_gen.rs @@ -1,11 +1,14 @@ //! Provides functionality for generating graphs for testing and benchmarking. //! Allows us to generate graphs using the preferential attachment model and //! the random attachment model. - -use crate::graph::PyGraph; +use crate::{ + graphgen::{ + preferential_attachment::ba_preferential_attachment as pa, + random_attachment::random_attachment as ra, + }, + python::graph::graph::PyGraph, +}; use pyo3::prelude::*; -use raphtory::graphgen::preferential_attachment::ba_preferential_attachment as pa; -use raphtory::graphgen::random_attachment::random_attachment as ra; /// Generates a graph using the random attachment model /// diff --git a/py-raphtory/src/graph_loader.rs b/raphtory/src/python/packages/graph_loader.rs similarity index 77% rename from py-raphtory/src/graph_loader.rs rename to raphtory/src/python/packages/graph_loader.rs index e1083852f2..5132338341 100644 --- a/py-raphtory/src/graph_loader.rs +++ b/raphtory/src/python/packages/graph_loader.rs @@ -1,6 +1,6 @@ //! `GraphLoader` provides some default implementations for loading a pre-built graph. //! 
This base class is used to load in-built graphs such as the LOTR, reddit and StackOverflow. -use crate::graph::PyGraph; +use crate::python::graph::graph::PyGraph; use pyo3::prelude::*; use tokio::runtime::Runtime; @@ -24,11 +24,8 @@ use tokio::runtime::Runtime; /// Returns: /// A Graph containing the LOTR dataset #[pyfunction] -#[pyo3(signature = (shards=1))] -pub fn lotr_graph(shards: usize) -> PyResult> { - PyGraph::py_from_db_graph(raphtory_io::graph_loader::example::lotr_graph::lotr_graph( - shards, - )) +pub fn lotr_graph() -> PyResult> { + PyGraph::py_from_db_graph(crate::graph_loader::example::lotr_graph::lotr_graph()) } /// Load (a subset of) Reddit hyperlinks dataset into a graph. @@ -67,37 +64,35 @@ pub fn lotr_graph(shards: usize) -> PyResult> { /// Returns: /// A Graph containing the Reddit hyperlinks dataset #[pyfunction] -#[pyo3(signature = (shards=1,timeout_seconds=600))] -pub fn reddit_hyperlink_graph(shards: usize, timeout_seconds: u64) -> PyResult> { +#[pyo3(signature = (timeout_seconds=600))] +pub fn reddit_hyperlink_graph(timeout_seconds: u64) -> PyResult> { PyGraph::py_from_db_graph( - raphtory_io::graph_loader::example::reddit_hyperlinks::reddit_graph( - shards, - timeout_seconds, - false, - ), + crate::graph_loader::example::reddit_hyperlinks::reddit_graph(timeout_seconds, false), ) } #[pyfunction] -#[pyo3(signature = (path=None,subset=None,shards=1))] -pub fn stable_coin_graph(path: Option, subset:Option, shards: usize) -> PyResult> { +#[pyo3(signature = (path=None,subset=None))] +pub fn stable_coin_graph(path: Option, subset: Option) -> PyResult> { PyGraph::py_from_db_graph( - raphtory_io::graph_loader::example::stable_coins::stable_coin_graph(path, subset.unwrap_or(false),shards), + crate::graph_loader::example::stable_coins::stable_coin_graph( + path, + subset.unwrap_or(false), + ), ) } #[pyfunction] -#[pyo3(signature = (uri,username,password,database="neo4j".to_string(),shards=1))] +#[pyo3(signature = 
(uri,username,password,database="neo4j".to_string()))] pub fn neo4j_movie_graph( uri: String, username: String, password: String, database: String, - shards: usize, ) -> PyResult> { let g = Runtime::new().unwrap().block_on( - raphtory_io::graph_loader::example::neo4j_examples::neo4j_movie_graph( - uri, username, password, database, shards, + crate::graph_loader::example::neo4j_examples::neo4j_movie_graph( + uri, username, password, database, ), ); PyGraph::py_from_db_graph(g) diff --git a/raphtory/src/python/packages/mod.rs b/raphtory/src/python/packages/mod.rs new file mode 100644 index 0000000000..a2a2988bb2 --- /dev/null +++ b/raphtory/src/python/packages/mod.rs @@ -0,0 +1,4 @@ +pub mod algorithms; +pub mod graph_gen; +pub mod graph_loader; +pub mod vectors; diff --git a/raphtory/src/python/packages/vectors.rs b/raphtory/src/python/packages/vectors.rs new file mode 100644 index 0000000000..2b82a8b69c --- /dev/null +++ b/raphtory/src/python/packages/vectors.rs @@ -0,0 +1,121 @@ +use crate::{ + db::{ + api::view::internal::DynamicGraph, + graph::{edge::EdgeView, vertex::VertexView}, + }, + prelude::{EdgeViewOps, VertexViewOps}, + python::graph::views::graph_view::PyGraphView, + vectors::{Embedding, EmbeddingFunction, Vectorizable, VectorizedGraph}, +}; +use futures_util::future::BoxFuture; +use itertools::Itertools; +use pyo3::{ + prelude::*, + types::{PyFunction, PyList}, +}; +use std::{path::PathBuf, sync::Arc}; + +/// A graph vectorized with an embedding function, exposing similarity search over it. 
+#[pyclass(name = "VectorizedGraph", frozen)] +pub struct PyVectorizedGraph { + vectors: Arc>, +} + +#[pymethods] +impl PyVectorizedGraph { + #[new] + fn new( + py: Python<'_>, + graph: &PyGraphView, + embedding: &PyFunction, + cache: &str, + node_document: Option, + edge_document: Option, + ) -> PyResult { + // FIXME: we should be able to specify templates only for one type of entity: nodes/edges + + let embedding: Py = embedding.into(); + let graph = graph.graph.clone(); + let cache = PathBuf::from(cache); + + // FIXME: Maybe we should have two versions: a VectorizedGraph (sync) and AsyncVectorizedGraph, in both python and rust + // this instead is just terrible + pyo3_asyncio::tokio::run(py, async move { + let vectorized_graph = match (node_document, edge_document) { + (Some(node_document), Some(edge_document)) => { + let node_template = move |vertex: &VertexView| { + vertex.properties().get(&node_document).unwrap().to_string() + }; + let edge_template = move |edge: &EdgeView| { + edge.properties().get(&edge_document).unwrap().to_string() + }; + graph.vectorize_with_templates( + Box::new(embedding.clone()), + &cache, + node_template, + edge_template, + ) + } + (None, None) => graph.vectorize(Box::new(embedding.clone()), &cache), + _ => panic!("you need to specify both templates for now sadly"), + }; + + Ok(PyVectorizedGraph { + vectors: Arc::new(vectorized_graph.await), + }) + }) + } + + fn similarity_search( + &self, + py: Python<'_>, + query: String, + init: usize, + min_nodes: usize, + min_edges: usize, + limit: usize, + ) -> PyResult> { + let vectors = self.vectors.clone(); + pyo3_asyncio::tokio::run(py, async move { + let docs = vectors + .similarity_search( + query.as_str(), + init, + min_nodes, + min_edges, + limit, + None, + None, + ) + .await; + Ok(docs) + }) + } +} + +impl EmbeddingFunction for Py { + fn call(&self, texts: Vec) -> BoxFuture<'static, Vec> { + // FIXME: return result and avoid unwraps!! 
+ + let embedding_function = self.clone(); + + Box::pin(async move { + Python::with_gil(|py| { + let python_texts = PyList::new(py, texts); + let result = embedding_function.call1(py, (python_texts,)).unwrap(); + let embeddings: &PyList = result.downcast(py).unwrap(); + + embeddings + .iter() + .map(|embedding| { + let pylist: &PyList = embedding.downcast().unwrap(); + pylist + .iter() + .map(|element| element.extract::().unwrap()) + .collect_vec() + }) + .collect_vec() + }) + }) + } +} diff --git a/raphtory/src/python/types/iterable.rs b/raphtory/src/python/types/iterable.rs new file mode 100644 index 0000000000..9f73ffea8b --- /dev/null +++ b/raphtory/src/python/types/iterable.rs @@ -0,0 +1,115 @@ +use crate::{ + db::api::view::BoxedIter, + python::types::repr::{iterator_repr, Repr}, +}; +use pyo3::{IntoPy, PyObject}; +use std::{marker::PhantomData, sync::Arc}; + +pub struct Iterable + From + Repr> { + pub name: &'static str, + pub builder: Arc BoxedIter + Send + Sync + 'static>, + pytype: PhantomData, +} + +impl + From + Repr> Iterable { + pub fn iter(&self) -> BoxedIter { + (self.builder)() + } + pub fn py_iter(&self) -> BoxedIter { + Box::new(self.iter().map(|i| i.into())) + } + pub fn new It + Send + Sync + 'static, It: Iterator + Send + 'static>( + name: &'static str, + builder: F, + ) -> Self + where + It::Item: Into, + { + let builder = Arc::new(move || { + let iter: BoxedIter = Box::new(builder().map(|v| v.into())); + iter + }); + Self { + name, + builder, + pytype: Default::default(), + } + } + pub fn iter_eq>(&self, other: J) -> bool + where + I: PartialEq, + { + self.iter().eq(other) + } +} + +impl + From + Repr, J> PartialEq + for Iterable +where + for<'a> &'a J: IntoIterator, +{ + fn eq(&self, other: &J) -> bool { + self.iter_eq(other) + } +} + +impl + From + Repr> Repr for Iterable { + fn repr(&self) -> String { + format!("{}([{}])", self.name, iterator_repr(self.py_iter())) + } +} + +pub struct NestedIterable + From + Repr> { + pub name: &'static 
str, + pub builder: Arc BoxedIter> + Send + Sync + 'static>, + pytype: PhantomData, +} + +impl + From + Repr> NestedIterable { + pub fn iter(&self) -> BoxedIter> { + (self.builder)() + } + pub fn new It + Send + Sync + 'static, It: Iterator + Send + 'static>( + name: &'static str, + builder: F, + ) -> Self + where + It::Item: Iterator + Send, + ::Item: Into + Send, + { + let builder = Arc::new(move || { + let iter: BoxedIter> = Box::new(builder().map(|it| { + let iter: BoxedIter = Box::new(it.map(|v| v.into())); + iter + })); + iter + }); + Self { + name, + builder, + pytype: Default::default(), + } + } + + pub fn iter_eq, J: IntoIterator>(&self, other: JJ) -> bool + where + I: PartialEq, + { + self.iter() + .zip(other) + .all(|(t, o)| t.zip(o).all(|(tt, oo)| tt == oo)) + } +} + +impl + From + Repr> Repr for NestedIterable { + fn repr(&self) -> String { + format!( + "{}([{}])", + self.name, + iterator_repr( + self.iter() + .map(|it| format!("[{}]", iterator_repr(it.map(|i| PyI::from(i))))) + ) + ) + } +} diff --git a/raphtory/src/python/types/macros/cmp.rs b/raphtory/src/python/types/macros/cmp.rs new file mode 100644 index 0000000000..87627a6798 --- /dev/null +++ b/raphtory/src/python/types/macros/cmp.rs @@ -0,0 +1,29 @@ +/// Add equality support to pyclass +/// +/// # Arguments +/// +/// * `name` - The identifier for the struct +/// * `cmp_item` - Struct to use for comparisons, needs to support `cmp_item: From<&name>` +/// and `cmp_item: PartialEq` and `cmp_item: FromPyObject` with conversion for all +/// the python types we want to compare with +macro_rules! 
py_eq { + ($name:ty, $cmp_name:ty) => { + #[pyo3::pymethods] + impl $name { + pub fn __richcmp__( + &self, + other: $cmp_name, + op: pyo3::basic::CompareOp, + ) -> pyo3::PyResult { + match op { + pyo3::basic::CompareOp::Lt => Err(PyTypeError::new_err("not ordered")), + pyo3::basic::CompareOp::Le => Err(PyTypeError::new_err("not ordered")), + pyo3::basic::CompareOp::Eq => Ok(<$cmp_name>::from(self) == other), + pyo3::basic::CompareOp::Ne => Ok(<$cmp_name>::from(self) != other), + pyo3::basic::CompareOp::Gt => Err(PyTypeError::new_err("not ordered")), + pyo3::basic::CompareOp::Ge => Err(PyTypeError::new_err("not ordered")), + } + } + } + }; +} diff --git a/raphtory/src/python/types/macros/iterable.rs b/raphtory/src/python/types/macros/iterable.rs new file mode 100644 index 0000000000..db7f727538 --- /dev/null +++ b/raphtory/src/python/types/macros/iterable.rs @@ -0,0 +1,301 @@ +// internal macro for sum and mean methods +macro_rules! _py_numeric_methods { + ($name:ident, $item:ty, $pyitem:ty) => { + #[pymethods] + impl $name { + pub fn sum(&self) -> $pyitem { + let v: $item = self.iter().sum(); + v.into() + } + + pub fn mean(&self) -> f64 { + use $crate::python::types::wrappers::iterators::MeanExt; + self.iter().mean() + } + } + }; +} + +// Internal macro defining max and min on ordered iterables +macro_rules! _py_ord_max_min_methods { + ($name:ident, $pyitem:ty) => { + #[pymethods] + impl $name { + pub fn max(&self) -> Option<$pyitem> { + self.iter().max().map(|v| v.into()) + } + + pub fn min(&self) -> Option<$pyitem> { + self.iter().min().map(|v| v.into()) + } + } + }; +} + +// Internal macro defining max and min on float iterables +macro_rules! 
_py_float_max_min_methods { + ($name:ident, $pyitem:ty) => { + #[pymethods] + impl $name { + pub fn max(&self) -> Option<$pyitem> { + self.iter().max_by(|a, b| a.total_cmp(b)).map(|v| v.into()) + } + pub fn min(&self) -> Option<$pyitem> { + self.iter().min_by(|a, b| a.total_cmp(b)).map(|v| v.into()) + } + } + }; +} + +// Internal macro for methods supported by all iterables (also used by nested iterables) +macro_rules! _py_iterable_base_methods { + ($name:ident, $iter:ty) => { + #[pymethods] + impl $name { + pub fn __iter__(&self) -> $iter { + self.iter().into() + } + + pub fn __len__(&self) -> usize { + self.iter().count() + } + + pub fn __repr__(&self) -> String { + self.repr() + } + } + }; +} + +// internal macro for the collect method (as it is different for nested iterables) +macro_rules! _py_iterable_collect_method { + ($name:ident, $pyitem:ty) => { + #[pymethods] + impl $name { + pub fn collect(&self) -> Vec<$pyitem> { + self.iter().map(|v| v.into()).collect() + } + } + }; +} + +/// Construct a python Iterable struct which wraps a closure that returns an iterator +/// +/// Does not implement any methods! +/// +/// # Arguments +/// +/// * `name` - The identifier for the new struct +/// * `item` - The type of `Item` for the wrapped iterator builder +/// * `pyitem` - The type of the python wrapper for `Item` (optional if `item` implements `IntoPy`, need `item: Into`) +macro_rules! 
py_iterable_base { + ($name:ident, $item:ty) => { + py_iterable!($name, $item, $item); + }; + ($name:ident, $item:ty, $pyitem:ty) => { + #[pyclass] + pub struct $name($crate::python::types::iterable::Iterable<$item, $pyitem>); + + impl Repr for $name { + fn repr(&self) -> String { + self.0.repr() + } + } + + impl std::ops::Deref for $name { + type Target = $crate::python::types::iterable::Iterable<$item, $pyitem>; + + fn deref(&self) -> &Self::Target { + &self.0 + } + } + + impl It + Send + Sync + 'static, It: Iterator + Send + 'static> From for $name + where + It::Item: Into<$item>, + { + fn from(value: F) -> Self { + Self($crate::python::types::iterable::Iterable::new( + stringify!($name), + value, + )) + } + } + }; +} + +/// Construct a python Iterable struct which wraps a closure that returns an iterator +/// +/// Has methods `__iter__`, `__len__`, `__repr__`, `collect` +/// +/// # Arguments +/// +/// * `name` - The identifier for the new struct +/// * `item` - The type of `Item` for the wrapped iterator builder +/// * `pyitem` - The type of the python wrapper for `Item` (optional if `item` implements `IntoPy`, need Into<`pyitem`> to be implemented for `item`) +macro_rules! 
py_iterable { + ($name:ident, $item:ty) => { + py_iterable!($name, $item, $item); + }; + ($name:ident, $item:ty, $pyitem:ty) => { + py_iterable_base!($name, $item, $pyitem); + _py_iterable_base_methods!($name, $crate::python::utils::PyGenericIterator); + _py_iterable_collect_method!($name, $pyitem); + }; +} + +/// Construct a python Iterable struct which wraps a closure that returns an iterator of ordered values +/// +/// additionally adds the `min` and `max` methods to those created by `py_iterable` +/// # Arguments +/// +/// * `name` - The identifier for the new struct +/// * `item` - The type of `Item` for the wrapped iterator builder +/// * `pyitem` - The type of the python wrapper for `Item` (optional if `item` implements `IntoPy`, need Into<`pyitem`> to be implemented for `item`) +/// * `pyiter` - The python iterator wrapper that should be returned when calling `__iter__` (needs to have the same `item` and `pyitem`) +macro_rules! py_ordered_iterable { + ($name:ident, $item:ty) => { + py_ordered_iterable!($name, $item, $item); + }; + ($name:ident, $item:ty, $pyitem:ty) => { + py_iterable!($name, $item, $pyitem); + _py_ord_max_min_methods!($name, $pyitem); + }; +} + +/// Construct a python Iterable struct which wraps a closure that returns an iterator of ordered and summable values +/// +/// additionally adds the `mean` and `sum` methods to those created by `py_ordered_iterable` +/// # Arguments +/// +/// * `name` - The identifier for the new struct +/// * `item` - The type of `Item` for the wrapped iterator builder +/// * `pyitem` - The type of the python wrapper for `Item` (optional if `item` implements `IntoPy`, need Into<`pyitem`> to be implemented for `item`) +/// * `pyiter` - The python iterator wrapper that should be returned when calling `__iter__` (needs to have the same `item` and `pyitem`) +macro_rules! 
py_numeric_iterable { + ($name:ident, $item:ty) => { + py_numeric_iterable!($name, $item, $item); + }; + ($name:ident, $item:ty, $pyitem:ty) => { + py_ordered_iterable!($name, $item, $pyitem); + _py_numeric_methods!($name, $item, $pyitem); + }; +} + +/// Construct a python Iterable struct which wraps a closure that returns an iterator of float values +/// +/// This acts the same as `py_numeric_iterable` but with special implementations of `max` and `min` for floats. +/// +/// # Arguments +/// +/// * `name` - The identifier for the new struct +/// * `item` - The type of `Item` for the wrapped iterator builder +/// * `pyitem` - The type of the python wrapper for `Item` (optional if `item` implements `IntoPy`, need Into<`pyitem`> to be implemented for `item`) +/// * `pyiter` - The python iterator wrapper that should be returned when calling `__iter__` (needs to have the same `item` and `pyitem`) +macro_rules! py_float_iterable { + ($name:ident, $item:ty) => { + py_float_iterable!($name, $item, $item); + }; + ($name:ident, $item:ty, $pyitem:ty) => { + py_iterable!($name, $item, $pyitem); + _py_numeric_methods!($name, $item, $pyitem); + _py_float_max_min_methods!($name, $pyitem); + }; +} + +/// Add equality support to iterable +/// +/// +/// # Arguments +/// +/// * `name` - The identifier for the iterable struct +/// * `cmp_item` - Struct to use for comparisons, needs to support `cmp_item: From` +/// and `cmp_item: PartialEq` and FromPyObject for all the python types we +/// want to compare with +/// * `cmp_internal` - Name for the internal Enum that is created by the macro to implement +/// the conversion from python (only needed because we can't create our own +/// unique identifier without a proc macro) +macro_rules! 
py_iterable_comp { + ($name:ty, $cmp_item:ty, $cmp_internal:ident) => { + #[derive(Clone)] + enum $cmp_internal { + Vec(Vec<$cmp_item>), + This(Py<$name>), + } + + impl<'source> FromPyObject<'source> for $cmp_internal { + fn extract(ob: &'source PyAny) -> PyResult { + if let Ok(s) = ob.extract::>() { + Ok($cmp_internal::This(s)) + } else if let Ok(v) = ob.extract::>() { + Ok($cmp_internal::Vec(v)) + } else { + Err(pyo3::exceptions::PyTypeError::new_err("cannot compare")) + } + } + } + + impl From<$name> for $cmp_internal { + fn from(value: $name) -> Self { + let py_value = Python::with_gil(|py| Py::new(py, value)).unwrap(); + Self::This(py_value) + } + } + + impl $cmp_internal { + fn iter_py<'py>( + &'py self, + py: Python<'py>, + ) -> Box + 'py> { + match self { + Self::Vec(v) => Box::new(v.iter().cloned()), + Self::This(t) => Box::new(t.borrow(py).iter().map_into()), + } + } + } + + impl PartialEq for $cmp_internal { + fn eq(&self, other: &Self) -> bool { + Python::with_gil(|py| self.iter_py(py).eq(other.iter_py(py))) + } + } + + impl, J: Into<$cmp_item>> From for $cmp_internal { + fn from(value: I) -> Self { + Self::Vec(value.map_into().collect()) + } + } + + #[pymethods] + impl $name { + fn __richcmp__( + &self, + other: $cmp_internal, + op: pyo3::basic::CompareOp, + py: Python<'_>, + ) -> PyResult { + match op { + pyo3::basic::CompareOp::Lt => { + Err(pyo3::exceptions::PyTypeError::new_err("not ordered")) + } + pyo3::basic::CompareOp::Le => { + Err(pyo3::exceptions::PyTypeError::new_err("not ordered")) + } + pyo3::basic::CompareOp::Eq => Ok(self + .iter() + .map(|t| <$cmp_item>::from(t)) + .eq(other.iter_py(py))), + pyo3::basic::CompareOp::Ne => { + Ok(!self.__richcmp__(other, pyo3::basic::CompareOp::Eq, py)?) 
+ } + pyo3::basic::CompareOp::Gt => { + Err(pyo3::exceptions::PyTypeError::new_err("not ordered")) + } + pyo3::basic::CompareOp::Ge => { + Err(pyo3::exceptions::PyTypeError::new_err("not ordered")) + } + } + } + } + }; +} diff --git a/raphtory/src/python/types/macros/mod.rs b/raphtory/src/python/types/macros/mod.rs new file mode 100644 index 0000000000..8d589e93db --- /dev/null +++ b/raphtory/src/python/types/macros/mod.rs @@ -0,0 +1,6 @@ +#[macro_use] +pub mod iterable; +#[macro_use] +pub mod nested_iterable; +#[macro_use] +pub mod cmp; diff --git a/py-raphtory/src/macros/nested_iterable.rs b/raphtory/src/python/types/macros/nested_iterable.rs similarity index 81% rename from py-raphtory/src/macros/nested_iterable.rs rename to raphtory/src/python/types/macros/nested_iterable.rs index 8606b83ccc..3f28dd35d1 100644 --- a/py-raphtory/src/macros/nested_iterable.rs +++ b/raphtory/src/python/types/macros/nested_iterable.rs @@ -1,21 +1,28 @@ // Internal macro to create the struct for a nested iterable -macro_rules! _py_nested_iterable_base { +macro_rules! 
py_nested_iterable_base { + ($name:ident, $item:ty) => { + py_nested_iterable_base!($name, $item, $item); + }; ($name:ident, $item:ty, $pyitem:ty) => { #[pyclass] - pub struct $name($crate::types::iterable::NestedIterable<$item, $pyitem>); + pub struct $name($crate::python::types::iterable::NestedIterable<$item, $pyitem>); - impl Deref for $name { - type Target = $crate::types::iterable::NestedIterable<$item, $pyitem>; + impl std::ops::Deref for $name { + type Target = $crate::python::types::iterable::NestedIterable<$item, $pyitem>; fn deref(&self) -> &Self::Target { &self.0 } } - impl BoxedIter> + Sync + Send + 'static> From for $name { + impl It + Send + Sync + 'static, It: Iterator + Send + 'static> From for $name + where + It::Item: Iterator + Send, + ::Item: Into<$item> + Send, + { fn from(value: F) -> Self { - Self($crate::types::iterable::NestedIterable::new( - stringify!($name).to_string(), + Self($crate::python::types::iterable::NestedIterable::new( + stringify!($name), value, )) } @@ -25,8 +32,8 @@ macro_rules! _py_nested_iterable_base { // Internal macro to create basic methods for a nested iterable macro_rules! _py_nested_iterable_methods { - ($name:ident, $pyitem:ty, $iter:ty) => { - _py_iterable_base_methods!($name, $iter); + ($name:ident, $pyitem:ty) => { + _py_iterable_base_methods!($name, $crate::python::utils::PyNestedGenericIterator); #[pymethods] impl $name { @@ -130,12 +137,12 @@ macro_rules! _py_nested_float_max_min_methods { /// * `pyitem` - The type of the python wrapper for `Item` (optional if `item` implements `IntoPy`, need Into<`pyitem`> to be implemented for `item`) /// * `iter` - The python iterator wrapper that should be returned when calling `__iter__` macro_rules! 
py_nested_iterable { - ($name:ident, $item:ty, $iter:ty) => { - py_nested_iterable!($name, $item, $item, $iter); + ($name:ident, $item:ty) => { + py_nested_iterable!($name, $item, $item); }; - ($name:ident, $item:ty, $pyitem:ty, $iter:ty) => { - _py_nested_iterable_base!($name, $item, $pyitem); - _py_nested_iterable_methods!($name, $pyitem, $iter); + ($name:ident, $item:ty, $pyitem:ty) => { + py_nested_iterable_base!($name, $item, $pyitem); + _py_nested_iterable_methods!($name, $pyitem); }; } @@ -147,11 +154,10 @@ macro_rules! py_nested_iterable { /// /// * `name` - The identifier for the new struct /// * `item` - The type of `Item` for the wrapped iterator builder -/// * `iter` - The python iterator wrapper that should be returned when calling `__iter__` /// * `option_value_iterable` - The iterable to return for `max` and `min` (should have item type `Option`) macro_rules! py_nested_ordered_iterable { - ($name:ident, $item:ty, $iter:ty, $option_value_iterable:ty) => { - py_nested_iterable!($name, $item, $iter); + ($name:ident, $item:ty, $option_value_iterable:ty) => { + py_nested_iterable!($name, $item); _py_nested_ord_max_min_methods!($name, $item, $option_value_iterable); }; } @@ -169,8 +175,8 @@ macro_rules! py_nested_ordered_iterable { /// * `value_iterable` - The iterable to return for `sum` and `mean` /// * `option_value_iterable` - The iterable to return for `max` and `min` (should have item type `Option`) macro_rules! py_nested_numeric_iterable { - ($name:ident, $item:ty, $iter:ty, $value_iterable:ty, $option_value_iterable:ty) => { - py_nested_ordered_iterable!($name, $item, $iter, $option_value_iterable); + ($name:ident, $item:ty, $value_iterable:ty, $option_value_iterable:ty) => { + py_nested_ordered_iterable!($name, $item, $option_value_iterable); _py_nested_numeric_methods!($name, $item, $value_iterable); }; } @@ -187,8 +193,9 @@ macro_rules! 
py_nested_numeric_iterable { /// * `iter` - The python iterator wrapper that should be returned when calling `__iter__` /// * `value_iterable` - The iterable to return for `sum` and `mean` /// * `option_value_iterable` - The iterable to return for `max` and `min` (should have item type `Option`) +#[allow(unused_macros)] macro_rules! py_nested_float_iterable { - ($name:ident, $item:ty, $iter:ty, $value_iterable:ty, $option_value_iterable:ty) => { + ($name:ident, $item:ty, $value_iterable:ty, $option_value_iterable:ty) => { py_nested_iterable!($name, $item); _py_nested_numeric_methods!($name, $item, $value_iterable); _py_nested_float_max_min_methods!($name, $item, $option_value_iterable); diff --git a/raphtory/src/python/types/mod.rs b/raphtory/src/python/types/mod.rs new file mode 100644 index 0000000000..713089c41a --- /dev/null +++ b/raphtory/src/python/types/mod.rs @@ -0,0 +1,6 @@ +#[macro_use] +pub mod macros; + +pub mod iterable; +pub mod repr; +pub mod wrappers; diff --git a/py-raphtory/src/types/repr.rs b/raphtory/src/python/types/repr.rs similarity index 74% rename from py-raphtory/src/types/repr.rs rename to raphtory/src/python/types/repr.rs index 40df935d52..4bd0b1f192 100644 --- a/py-raphtory/src/types/repr.rs +++ b/raphtory/src/python/types/repr.rs @@ -1,6 +1,7 @@ +use crate::core::{storage::locked_view::LockedView, ArcStr}; use chrono::NaiveDateTime; use itertools::Itertools; -use std::collections::HashMap; +use std::{collections::HashMap, ops::Deref}; pub fn iterator_repr, V: Repr>(iter: I) -> String { let values: Vec = iter.take(11).map(|v| v.repr()).collect(); @@ -11,6 +12,18 @@ pub fn iterator_repr, V: Repr>(iter: I) -> String { } } +pub fn iterator_dict_repr, K: Repr, V: Repr>(iter: I) -> String { + let values: Vec = iter + .take(11) + .map(|(k, v)| format!("{}: {}", k.repr(), v.repr())) + .collect(); + if values.len() < 11 { + values.join(", ") + } else { + values[0..10].join(", ") + ", ..." 
+ } +} + pub trait Repr { fn repr(&self) -> String; } @@ -27,6 +40,18 @@ impl Repr for u32 { } } +impl Repr for u8 { + fn repr(&self) -> String { + self.to_string() + } +} + +impl Repr for u16 { + fn repr(&self) -> String { + self.to_string() + } +} + impl Repr for u64 { fn repr(&self) -> String { self.to_string() @@ -69,6 +94,18 @@ impl Repr for String { } } +impl Repr for ArcStr { + fn repr(&self) -> String { + self.to_string() + } +} + +impl Repr for &ArcStr { + fn repr(&self) -> String { + self.to_string() + } +} + impl Repr for &str { fn repr(&self) -> String { self.to_string() @@ -113,6 +150,12 @@ impl Repr for (S, T) { } } +impl<'a, T: Repr> Repr for LockedView<'a, T> { + fn repr(&self) -> String { + self.deref().repr() + } +} + #[cfg(test)] mod repr_tests { use super::*; diff --git a/raphtory/src/python/types/wrappers/iterators.rs b/raphtory/src/python/types/wrappers/iterators.rs new file mode 100644 index 0000000000..7ac80f0863 --- /dev/null +++ b/raphtory/src/python/types/wrappers/iterators.rs @@ -0,0 +1,75 @@ +use crate::{db::api::view::BoxedIter, prelude::Prop, python::types::repr::Repr}; +use itertools::Itertools; +use num::cast::AsPrimitive; +use pyo3::prelude::*; +use std::{i64, iter::Sum}; + +pub(crate) trait MeanExt: Iterator +where + V: AsPrimitive + Sum, +{ + fn mean(self) -> f64 + where + Self: Sized, + { + let mut count: usize = 0; + let sum: V = self.inspect(|_| count += 1).sum(); + + if count > 0 { + sum.as_() / (count as f64) + } else { + 0.0 + } + } +} + +impl, V: AsPrimitive + Sum> MeanExt for I {} + +py_float_iterable!(Float64Iterable, f64); + +py_numeric_iterable!(U64Iterable, u64); +py_nested_numeric_iterable!(NestedU64Iterable, u64, U64Iterable, OptionU64Iterable); + +py_iterable!(OptionU64U64Iterable, Option<(u64, u64)>); +py_ordered_iterable!(U64U64Iterable, (u64, u64)); +py_nested_ordered_iterable!(NestedU64U64Iterable, (u64, u64), OptionU64U64Iterable); + +py_iterable!(OptionU64Iterable, Option, Option); 
+_py_ord_max_min_methods!(OptionU64Iterable, Option); + +py_iterable!(PropIterable, Prop, Prop); +py_iterable_comp!(PropIterable, Prop, PropIterableCmp); + +py_numeric_iterable!(I64Iterable, i64); +py_nested_numeric_iterable!(NestedI64Iterable, i64, I64Iterable, OptionI64Iterable); + +py_iterable!(OptionI64Iterable, Option); +_py_ord_max_min_methods!(OptionI64Iterable, Option); +py_iterable!(OptionOptionI64Iterable, Option>); +_py_ord_max_min_methods!(OptionOptionI64Iterable, Option>); + +py_nested_ordered_iterable!( + NestedOptionI64Iterable, + Option, + OptionOptionI64Iterable +); + +py_numeric_iterable!(UsizeIterable, usize); +py_iterable_comp!(UsizeIterable, usize, UsizeIterableCmp); + +py_ordered_iterable!(OptionUsizeIterable, Option); +py_nested_numeric_iterable!( + NestedUsizeIterable, + usize, + UsizeIterable, + OptionUsizeIterable +); + +py_iterable!(BoolIterable, bool); +py_nested_iterable!(NestedBoolIterable, bool); + +py_iterable!(StringIterable, String); +py_nested_iterable!(NestedStringIterable, String); + +py_iterable!(StringVecIterable, Vec); +py_nested_iterable!(NestedStringVecIterable, Vec); diff --git a/py-raphtory/src/wrappers/mod.rs b/raphtory/src/python/types/wrappers/mod.rs similarity index 100% rename from py-raphtory/src/wrappers/mod.rs rename to raphtory/src/python/types/wrappers/mod.rs diff --git a/raphtory/src/python/types/wrappers/prop.rs b/raphtory/src/python/types/wrappers/prop.rs new file mode 100644 index 0000000000..402884351c --- /dev/null +++ b/raphtory/src/python/types/wrappers/prop.rs @@ -0,0 +1,84 @@ +use crate::{ + core::Prop, + python::{graph::views::graph_view::PyGraphView, types::repr::Repr}, +}; +use pyo3::{ + exceptions::PyTypeError, types::PyBool, FromPyObject, IntoPy, PyAny, PyObject, PyResult, Python, +}; +use std::{ops::Deref, sync::Arc}; + +impl IntoPy for Prop { + fn into_py(self, py: Python<'_>) -> PyObject { + match self { + Prop::Str(s) => s.into_py(py), + Prop::Bool(bool) => bool.into_py(py), + Prop::U8(u8) => 
u8.into_py(py), + Prop::U16(u16) => u16.into_py(py), + Prop::I64(i64) => i64.into_py(py), + Prop::U64(u64) => u64.into_py(py), + Prop::F64(f64) => f64.into_py(py), + Prop::DTime(dtime) => dtime.into_py(py), + Prop::Graph(g) => g.into_py(py), // Need to find a better way + Prop::I32(v) => v.into_py(py), + Prop::U32(v) => v.into_py(py), + Prop::F32(v) => v.into_py(py), + Prop::List(v) => v.deref().clone().into_py(py), // Fixme: optimise the clone here? + Prop::Map(v) => v.deref().clone().into_py(py), + } + } +} + +// Manually implemented to make sure we don't end up with f32/i32/u32 from python ints/floats +impl<'source> FromPyObject<'source> for Prop { + fn extract(ob: &'source PyAny) -> PyResult { + if ob.is_instance_of::() { + return Ok(Prop::Bool(ob.extract()?)); + } + if let Ok(v) = ob.extract() { + return Ok(Prop::I64(v)); + } + if let Ok(v) = ob.extract() { + return Ok(Prop::F64(v)); + } + if let Ok(d) = ob.extract() { + return Ok(Prop::DTime(d)); + } + if let Ok(s) = ob.extract::() { + return Ok(Prop::Str(s.into())); + } + if let Ok(g) = ob.extract() { + return Ok(Prop::Graph(g)); + } + if let Ok(list) = ob.extract() { + return Ok(Prop::List(Arc::new(list))); + } + if let Ok(map) = ob.extract() { + return Ok(Prop::Map(Arc::new(map))); + } + Err(PyTypeError::new_err("Not a valid property type")) + } +} + +impl Repr for Prop { + fn repr(&self) -> String { + match &self { + Prop::Str(v) => v.repr(), + Prop::Bool(v) => v.repr(), + Prop::I64(v) => v.repr(), + Prop::U8(v) => v.repr(), + Prop::U16(v) => v.repr(), + Prop::U64(v) => v.repr(), + Prop::F64(v) => v.repr(), + Prop::DTime(v) => v.repr(), + Prop::Graph(g) => PyGraphView::from(g.clone()).repr(), + Prop::I32(v) => v.repr(), + Prop::U32(v) => v.repr(), + Prop::F32(v) => v.repr(), + Prop::List(v) => v.repr(), + Prop::Map(v) => v.repr(), + } + } +} + +pub type PropValue = Option; +pub type PropHistItems = Vec<(i64, Prop)>; diff --git a/raphtory/src/python/utils/errors.rs b/raphtory/src/python/utils/errors.rs new 
file mode 100644 index 0000000000..7a67443639 --- /dev/null +++ b/raphtory/src/python/utils/errors.rs @@ -0,0 +1,32 @@ +use crate::{ + core::utils::{errors::GraphError, time::error::ParseTimeError}, + graph_loader::source::csv_loader::CsvErr, +}; +use pyo3::{exceptions::PyException, PyErr}; +use std::error::Error; + +impl From for PyErr { + fn from(value: ParseTimeError) -> Self { + adapt_err_value(&value) + } +} + +impl From for PyErr { + fn from(value: GraphError) -> Self { + adapt_err_value(&value) + } +} + +impl From for PyErr { + fn from(value: CsvErr) -> Self { + adapt_err_value(&value) + } +} + +pub fn adapt_err_value(err: &E) -> PyErr +where + E: Error + ?Sized, +{ + let error_log = display_error_chain::DisplayErrorChain::new(err).to_string(); + PyException::new_err(error_log) +} diff --git a/py-raphtory/src/utils.rs b/raphtory/src/python/utils/mod.rs similarity index 50% rename from py-raphtory/src/utils.rs rename to raphtory/src/python/utils/mod.rs index 666a5e2847..a756d1fd23 100644 --- a/py-raphtory/src/utils.rs +++ b/raphtory/src/python/utils/mod.rs @@ -2,18 +2,18 @@ //! //! This module contains helper functions for the Python bindings. //! These functions are not part of the public API and are not exported to the Python module. 
-use crate::vertex::PyVertex; +use crate::{ + core::{ + entities::vertices::{input_vertex::InputVertex, vertex_ref::VertexRef}, + utils::time::{error::ParseTimeError, Interval, IntoTime, TryIntoTime}, + }, + db::api::view::*, + python::graph::vertex::PyVertex, +}; use chrono::NaiveDateTime; -use pyo3::exceptions::{PyException, PyTypeError}; -use pyo3::prelude::*; -use raphtory::core as dbc; -use raphtory::core::time::error::ParseTimeError; -use raphtory::core::time::{Interval, TryIntoTime}; -use raphtory::core::vertex::InputVertex; -use raphtory::core::vertex_ref::VertexRef; -use raphtory::db::view_api::time::WindowSet; -use raphtory::db::view_api::TimeOps; -use std::error::Error; +use pyo3::{exceptions::PyTypeError, prelude::*}; + +pub mod errors; /// Extract a `VertexRef` from a Python object. /// The object can be a `str`, `u64` or `PyVertex`. @@ -26,77 +26,20 @@ use std::error::Error; /// /// Returns /// A `VertexRef` extracted from the Python object. -pub(crate) fn extract_vertex_ref(vref: &PyAny) -> PyResult { - if let Ok(s) = vref.extract::() { - Ok(s.into()) - } else if let Ok(gid) = vref.extract::() { - Ok(gid.into()) - } else if let Ok(v) = vref.extract::() { - Ok(v.into()) - } else { - Err(PyTypeError::new_err("Not a valid vertex")) +impl<'source> FromPyObject<'source> for VertexRef { + fn extract(vref: &'source PyAny) -> PyResult { + if let Ok(s) = vref.extract::() { + Ok(s.into()) + } else if let Ok(gid) = vref.extract::() { + Ok(gid.into()) + } else if let Ok(v) = vref.extract::() { + Ok(v.into()) + } else { + Err(PyTypeError::new_err("Not a valid vertex")) + } } } -pub(crate) fn window_impl( - slf: &T, - t_start: Option<&PyAny>, - t_end: Option<&PyAny>, -) -> PyResult { - let t_start = t_start.map(|t| extract_time(t)).transpose()?; - let t_end = t_end.map(|t| extract_time(t)).transpose()?; - Ok(slf.window(t_start.unwrap_or(i64::MIN), t_end.unwrap_or(i64::MAX))) -} - -pub(crate) fn at_impl( - slf: &T, - end: &PyAny, -) -> PyResult { - let end = 
extract_time(end)?; - Ok(slf.at(end)) -} - -pub fn adapt_err_value(err: &E) -> PyErr -where - E: Error + ?Sized, -{ - let error_log = display_error_chain::DisplayErrorChain::new(err).to_string(); - PyException::new_err(error_log) -} - -pub fn adapt_result(result: Result) -> PyResult -// TODO: make this private -where - E: Error, -{ - result.map_err(|e| adapt_err_value(&e)) -} - -pub(crate) fn expanding_impl(slf: &T, step: &PyAny) -> PyResult -where - T: TimeOps + Clone + Sync + Send + 'static, - T::WindowedViewType: IntoPyObject + Send + Sync, -{ - let step = extract_interval(step)?; - let window_set: WindowSet = adapt_result(slf.expanding(step)).map(|iter| iter.into())?; - Ok(window_set.into()) -} - -pub(crate) fn rolling_impl( - slf: &T, - window: &PyAny, - step: Option<&PyAny>, -) -> PyResult -where - T: TimeOps + Clone + Sync + Send + 'static, - T::WindowedViewType: IntoPyObject + Send + Sync, -{ - let window = extract_interval(window)?; - let step = step.map(extract_interval).transpose()?; - let window_set: WindowSet = adapt_result(slf.rolling(window, step))?; - Ok(window_set.into()) -} - fn parse_email_timestamp(timestamp: &str) -> PyResult { Python::with_gil(|py| { let email_utils = PyModule::import(py, "email.utils")?; @@ -107,89 +50,53 @@ fn parse_email_timestamp(timestamp: &str) -> PyResult { }) } -pub(crate) fn extract_time(time: &PyAny) -> PyResult { - let from_number = time.extract::().map(|n| Ok(n)); - let from_str = time.extract::<&str>().map(|str| { - str.try_into_time() - .or_else(|e| parse_email_timestamp(str).map_err(|_| e)) - }); - - let mut extract_results = vec![from_number, from_str].into_iter(); - let first_valid_extraction = extract_results - .find_map(|result| match result { - Ok(val) => Some(Ok(val)), - Err(_) => None, - }) - .unwrap_or_else(|| { - let message = format!("time '{time}' must be a str or an int"); - Err(PyTypeError::new_err(message)) - })?; - - adapt_result(first_valid_extraction) +pub struct PyTime { + parsing_result: i64, 
} -pub(crate) fn extract_into_time(time: &PyAny) -> PyResult { - let string = time.extract::(); - let result = string.map(|string| { - let timestamp = string.as_str(); - let parsing_result = timestamp - .try_into_time() - .or_else(|e| parse_email_timestamp(timestamp).map_err(|_| e)); - TimeBox::new(parsing_result) - }); - - let result = result.or_else(|_| { - let number = time.extract::(); - number.map(|number| TimeBox::new(number.try_into_time())) - }); - - let result = result.or_else(|_| { - let parsed_datetime = time.extract::(); - parsed_datetime.map(|parsed_datetime | TimeBox::new(parsed_datetime.try_into_time())) - }); - - result.map_err(|_| { +impl<'source> FromPyObject<'source> for PyTime { + fn extract(time: &'source PyAny) -> PyResult { + if let Ok(string) = time.extract::() { + let timestamp = string.as_str(); + let parsing_result = timestamp + .try_into_time() + .or_else(|e| parse_email_timestamp(timestamp).map_err(|_| e))?; + return Ok(PyTime::new(parsing_result)); + } + if let Ok(number) = time.extract::() { + return Ok(PyTime::new(number.try_into_time()?)); + } + if let Ok(parsed_datetime) = time.extract::() { + return Ok(PyTime::new(parsed_datetime.try_into_time()?)); + } let message = format!("time '{time}' must be a str, dt or an integer"); - PyTypeError::new_err(message) - }) -} - -pub(crate) struct TimeBox { - parsing_result: Result, + Err(PyTypeError::new_err(message)) + } } -impl TimeBox { - fn new(parsing_result: Result) -> Self { +impl PyTime { + fn new(parsing_result: i64) -> Self { Self { parsing_result } } + pub const MIN: PyTime = PyTime { + parsing_result: i64::MIN, + }; + pub const MAX: PyTime = PyTime { + parsing_result: i64::MAX, + }; } -impl TryIntoTime for TimeBox { - fn try_into_time(self) -> Result { +impl IntoTime for PyTime { + fn into_time(self) -> i64 { self.parsing_result } } -pub(crate) fn extract_interval(interval: &PyAny) -> PyResult { - let string = interval.extract::(); - let result = string.map(|string| 
IntervalBox::new(string.as_str())); - - let result = result.or_else(|_| { - let number = interval.extract::(); - number.map(|number| IntervalBox::new(number)) - }); - - result.map_err(|_| { - let message = format!("interval '{interval}' must be a str or an unsigned integer"); - PyTypeError::new_err(message) - }) -} - -pub(crate) struct IntervalBox { +pub(crate) struct PyInterval { interval: Result, } -impl IntervalBox { +impl PyInterval { fn new(interval: I) -> Self where I: TryInto, @@ -200,9 +107,26 @@ impl IntervalBox { } } -impl TryFrom for Interval { +impl<'source> FromPyObject<'source> for PyInterval { + fn extract(interval: &'source PyAny) -> PyResult { + let string = interval.extract::(); + let result = string.map(|string| PyInterval::new(string.as_str())); + + let result = result.or_else(|_| { + let number = interval.extract::(); + number.map(PyInterval::new) + }); + + result.map_err(|_| { + let message = format!("interval '{interval}' must be a str or an unsigned integer"); + PyTypeError::new_err(message) + }) + } +} + +impl TryFrom for Interval { type Error = ParseTimeError; - fn try_from(value: IntervalBox) -> Result { + fn try_from(value: PyInterval) -> Result { value.interval } } @@ -210,46 +134,51 @@ impl TryFrom for Interval { /// A trait for vertices that can be used as input for the graph. /// This allows us to add vertices with different types of ids, either strings or ints. #[derive(Clone, Debug)] -pub struct InputVertexBox { +pub struct PyInputVertex { id: u64, - name_prop: Option, + name: Option, +} + +impl<'source> FromPyObject<'source> for PyInputVertex { + fn extract(id: &'source PyAny) -> PyResult { + match id.extract::() { + Ok(string) => Ok(PyInputVertex::new(string)), + Err(_) => { + let msg = "IDs need to be strings or an unsigned integers"; + let number = id.extract::().map_err(|_| PyTypeError::new_err(msg))?; + Ok(PyInputVertex::new(number)) + } + } + } } /// Implementation for vertices that can be used as input for the graph. 
/// This allows us to add vertices with different types of ids, either strings or ints. -impl InputVertexBox { - pub(crate) fn new(vertex: T) -> InputVertexBox +impl PyInputVertex { + pub(crate) fn new(vertex: T) -> PyInputVertex where T: InputVertex, { - InputVertexBox { + PyInputVertex { id: vertex.id(), - name_prop: vertex.name_prop(), + name: vertex.id_str().map(|s| s.into()), } } } /// Implementation for vertices that can be used as input for the graph. /// This allows us to add vertices with different types of ids, either strings or ints. -impl InputVertex for InputVertexBox { +impl InputVertex for PyInputVertex { /// Returns the id of the vertex. fn id(&self) -> u64 { self.id } /// Returns the name property of the vertex. - fn name_prop(&self) -> Option { - self.name_prop.clone() - } -} - -pub(crate) fn extract_input_vertex(id: &PyAny) -> PyResult { - match id.extract::() { - Ok(string) => Ok(InputVertexBox::new(string)), - Err(_) => { - let msg = "IDs need to be strings or an unsigned integers"; - let number = id.extract::().map_err(|_| PyTypeError::new_err(msg))?; - Ok(InputVertexBox::new(number)) + fn id_str(&self) -> Option<&str> { + match &self.name { + Some(n) => Some(n), + None => None, } } } @@ -262,10 +191,10 @@ pub trait WindowSetOps { impl WindowSetOps for WindowSet where T: TimeOps + Clone + Sync + 'static + Send, - T::WindowedViewType: IntoPyObject + Send, + T::WindowedViewType: IntoPy + Send, { fn build_iter(&self) -> PyGenericIterator { - self.clone().map(|v| v.into_py_object()).into() + self.clone().into() } fn time_index(&self, center: bool) -> PyGenericIterable { @@ -301,7 +230,7 @@ pub struct PyWindowSet { impl From> for PyWindowSet where T: TimeOps + Clone + Sync + Send + 'static, - T::WindowedViewType: IntoPyObject + Send + Sync, + T::WindowedViewType: IntoPy + Send + Sync, { fn from(value: WindowSet) -> Self { Self { @@ -310,6 +239,16 @@ where } } +impl IntoPy for WindowSet +where + T: TimeOps + Clone + Sync + Send + 'static, + 
T::WindowedViewType: IntoPy + Send + Sync, +{ + fn into_py(self, py: Python<'_>) -> PyObject { + PyWindowSet::from(self).into_py(py) + } +} + #[pymethods] impl PyWindowSet { fn __iter__(&self) -> PyGenericIterator { @@ -385,6 +324,29 @@ impl PyGenericIterator { } } -pub(crate) trait IntoPyObject { - fn into_py_object(self) -> PyObject; +#[pyclass(name = "NestedIterator")] +pub struct PyNestedGenericIterator { + iter: BoxedIter, +} + +impl From for PyNestedGenericIterator +where + I: Iterator + Send + 'static, + J: Iterator + Send + 'static, + T: IntoPy + 'static, +{ + fn from(value: I) -> Self { + let py_iter = Box::new(value.map(|item| item.into())); + Self { iter: py_iter } + } +} + +#[pymethods] +impl PyNestedGenericIterator { + fn __iter__(slf: PyRef<'_, Self>) -> PyRef<'_, Self> { + slf + } + fn __next__(&mut self) -> Option { + self.iter.next() + } } diff --git a/raphtory/src/search/mod.rs b/raphtory/src/search/mod.rs new file mode 100644 index 0000000000..2dbd02387c --- /dev/null +++ b/raphtory/src/search/mod.rs @@ -0,0 +1,1123 @@ +// search goes here + +use std::{collections::HashSet, ops::Deref, sync::Arc}; + +use rayon::{prelude::ParallelIterator, slice::ParallelSlice}; +use tantivy::{ + collector::TopDocs, + schema::{Field, Schema, SchemaBuilder, FAST, INDEXED, STORED, TEXT}, + Document, Index, IndexReader, IndexSettings, IndexWriter, TantivyError, +}; + +use crate::{ + core::{ + entities::{vertices::vertex_ref::VertexRef, EID, VID}, + storage::timeindex::{AsTime, TimeIndexEntry}, + utils::errors::GraphError, + ArcStr, PropType, + }, + db::{ + api::{ + mutation::internal::InternalAdditionOps, + view::{ + internal::{DynamicGraph, InheritViewOps, IntoDynamic}, + EdgeViewInternalOps, + }, + }, + graph::{edge::EdgeView, vertex::VertexView}, + }, + prelude::*, +}; + +#[derive(Clone)] +pub struct IndexedGraph { + pub(crate) graph: G, + pub(crate) vertex_index: Arc, + pub(crate) edge_index: Arc, + pub(crate) reader: IndexReader, + pub(crate) edge_reader: 
IndexReader, +} + +impl Deref for IndexedGraph { + type Target = G; + + fn deref(&self) -> &Self::Target { + &self.graph + } +} + +impl IntoDynamic for IndexedGraph { + fn into_dynamic(self) -> DynamicGraph { + DynamicGraph::new(self) + } +} + +impl InheritViewOps for IndexedGraph {} + +pub(in crate::search) mod fields { + pub const TIME: &str = "time"; + pub const VERTEX_ID: &str = "vertex_id"; + pub const VERTEX_ID_REV: &str = "vertex_id_rev"; + pub const NAME: &str = "name"; + + // edges + // pub const SRC_ID: &str = "src_id"; + pub const SOURCE: &str = "from"; + // pub const DEST_ID: &str = "dest_id"; + pub const DESTINATION: &str = "to"; + pub const EDGE_ID: &str = "edge_id"; +} + +impl From for IndexedGraph { + fn from(graph: G) -> Self { + Self::from_graph(&graph).expect("failed to generate index from graph") + } +} + +impl IndexedGraph { + pub fn into_dynamic_indexed(self) -> IndexedGraph { + IndexedGraph { + graph: self.graph.into_dynamic(), + vertex_index: self.vertex_index, + edge_index: self.edge_index, + reader: self.reader, + edge_reader: self.edge_reader, + } + } +} + +impl IndexedGraph { + fn new_vertex_schema_builder() -> SchemaBuilder { + let mut schema = Schema::builder(); + + // we first add GID time, ID and ID_REV + // ensure time is part of the index + schema.add_i64_field(fields::TIME, INDEXED | STORED); + // ensure we add vertex_id as stored to get back the vertex id after the search + schema.add_u64_field(fields::VERTEX_ID, FAST | STORED); + // reverse to sort by it + schema.add_u64_field(fields::VERTEX_ID_REV, FAST | STORED); + // add name + schema.add_text_field(fields::NAME, TEXT); + schema + } + + fn new_edge_schema_builder() -> SchemaBuilder { + let mut schema = Schema::builder(); + // we first add GID time, ID and ID_REV + // ensure time is part of the index + schema.add_i64_field(fields::TIME, INDEXED | STORED); + // ensure we add vertex_id as stored to get back the vertex id after the search + schema.add_text_field(fields::SOURCE, 
TEXT); + schema.add_text_field(fields::DESTINATION, TEXT); + schema.add_u64_field(fields::EDGE_ID, FAST | STORED); + + schema + } + + fn schema_from_props, I: IntoIterator>(props: I) -> Schema { + let mut schema = Self::new_vertex_schema_builder(); + + for (prop_name, prop) in props.into_iter() { + match prop { + Prop::Str(_) => { + schema.add_text_field(prop_name.as_ref(), TEXT); + } + Prop::DTime(_) => { + schema.add_date_field(prop_name.as_ref(), INDEXED); + } + _ => todo!(), + } + } + + schema.build() + } + + fn set_schema_field_from_prop(schema: &mut SchemaBuilder, prop: &str, prop_value: Prop) { + match prop_value { + Prop::Str(_) => { + schema.add_text_field(prop, TEXT); + } + Prop::DTime(_) => { + schema.add_date_field(prop, INDEXED); + } + Prop::U8(_) => { + schema.add_u64_field(prop, INDEXED); + } + Prop::U16(_) => { + schema.add_u64_field(prop, INDEXED); + } + Prop::U64(_) => { + schema.add_u64_field(prop, INDEXED); + } + Prop::I64(_) => { + schema.add_i64_field(prop, INDEXED); + } + Prop::I32(_) => { + schema.add_i64_field(prop, INDEXED); + } + Prop::F64(_) => { + schema.add_f64_field(prop, INDEXED); + } + Prop::F32(_) => { + schema.add_f64_field(prop, INDEXED); + } + Prop::Bool(_) => { + schema.add_u64_field(prop, INDEXED); + } + _ => { + schema.add_text_field(prop, TEXT); + } + } + } + + // we need to check every vertex for the properties and add them + // to the schem depending on the type of the property + // + fn schema_for_vertex(g: &G) -> Schema { + let mut schema = Self::new_vertex_schema_builder(); + + // TODO: load all these from the graph at some point in the future + let mut prop_names_set = g + .vertex_meta() + .temporal_prop_meta() + .get_keys() + .into_iter() + .chain(g.vertex_meta().const_prop_meta().get_keys().into_iter()) + .collect::>(); + + for vertex in g.vertices() { + if prop_names_set.is_empty() { + break; + } + let mut found_props: HashSet = HashSet::default(); + found_props.insert("name".into()); + + for prop in 
prop_names_set.iter() { + // load temporal props + if let Some(prop_value) = vertex + .properties() + .temporal() + .get(prop) + .and_then(|p| p.latest()) + { + if found_props.contains(prop) { + continue; + } + Self::set_schema_field_from_prop(&mut schema, prop, prop_value); + found_props.insert(prop.clone()); + } + // load static props + if let Some(prop_value) = vertex.properties().constant().get(prop) { + if !found_props.contains(prop) { + Self::set_schema_field_from_prop(&mut schema, prop, prop_value); + found_props.insert(prop.clone()); + } + } + } + + for found_prop in found_props { + prop_names_set.remove(&found_prop); + } + } + + schema.build() + } + + // we need to check every vertex for the properties and add them + // to the schem depending on the type of the property + // + fn schema_for_edge(g: &G) -> Schema { + let mut schema = Self::new_edge_schema_builder(); + + // TODO: load all these from the graph at some point in the future + let mut prop_names_set = g + .edge_meta() + .temporal_prop_meta() + .get_keys() + .into_iter() + .chain(g.edge_meta().const_prop_meta().get_keys()) + .collect::>(); + + for edge in g.edges() { + if prop_names_set.is_empty() { + break; + } + let mut found_props: HashSet = HashSet::new(); + + for prop in prop_names_set.iter() { + // load temporal props + if let Some(prop_value) = edge + .properties() + .temporal() + .get(prop) + .and_then(|p| p.latest()) + { + if found_props.contains(prop) { + continue; + } + Self::set_schema_field_from_prop(&mut schema, prop, prop_value); + found_props.insert(prop.clone()); + } + // load static props + if let Some(prop_value) = edge.properties().constant().get(prop) { + if !found_props.contains(prop) { + Self::set_schema_field_from_prop(&mut schema, prop, prop_value); + found_props.insert(prop.clone()); + } + } + } + + for found_prop in found_props { + prop_names_set.remove(&found_prop); + } + } + + schema.build() + } + + fn index_prop_value(document: &mut Document, prop_field: Field, 
prop_value: Prop) { + match prop_value { + Prop::Str(prop_text) => { + // add the property to the document + document.add_text(prop_field, prop_text); + } + Prop::DTime(prop_time) => { + let time = + tantivy::DateTime::from_timestamp_nanos(prop_time.and_utc().timestamp_nanos()); + document.add_date(prop_field, time); + } + Prop::U8(prop_u8) => { + document.add_u64(prop_field, u64::from(prop_u8)); + } + Prop::U16(prop_u16) => { + document.add_u64(prop_field, u64::from(prop_u16)); + } + Prop::U64(prop_u64) => { + document.add_u64(prop_field, prop_u64); + } + Prop::I64(prop_i64) => { + document.add_i64(prop_field, prop_i64); + } + Prop::I32(prop_i32) => { + document.add_i64(prop_field, i64::from(prop_i32)); + } + Prop::F64(prop_f64) => { + document.add_f64(prop_field, prop_f64); + } + Prop::F32(prop_f32) => { + document.add_f64(prop_field, f64::from(prop_f32)); + } + Prop::Bool(prop_bool) => { + document.add_bool(prop_field, prop_bool); + } + prop => document.add_text(prop_field, prop.to_string()), + } + } + + fn index_vertices(g: &G) -> tantivy::Result<(Index, IndexReader)> { + let schema = Self::schema_for_vertex(g); + let (index, reader) = + Self::new_index(schema.clone(), Self::default_vertex_index_settings()); + + let time_field = schema.get_field(fields::TIME)?; + let vertex_id_field = schema.get_field(fields::VERTEX_ID)?; + let vertex_id_rev_field = schema.get_field(fields::VERTEX_ID_REV)?; + + let writer = Arc::new(parking_lot::RwLock::new(index.writer(100_000_000)?)); + + let v_ids = (0..g.count_vertices()).collect::>(); + + v_ids.par_chunks(128).try_for_each(|v_ids| { + let writer_lock = writer.clone(); + { + let writer_guard = writer_lock.read(); + for v_id in v_ids { + if let Some(vertex) = g.vertex(VertexRef::new((*v_id).into())) { + Self::index_vertex_view( + vertex, + &schema, + &writer_guard, + time_field, + vertex_id_field, + vertex_id_rev_field, + )?; + } + } + } + + let mut writer_guard = writer_lock.write(); + writer_guard.commit()?; + Ok::<(), 
TantivyError>(()) + })?; + + reader.reload()?; + Ok((index, reader)) + } + + pub fn from_graph(g: &G) -> tantivy::Result { + let (vertex_index, vertex_reader) = Self::index_vertices(g)?; + let (edge_index, edge_reader) = Self::index_edges(g)?; + + Ok(IndexedGraph { + graph: g.clone(), + vertex_index: Arc::new(vertex_index), + edge_index: Arc::new(edge_index), + reader: vertex_reader, + edge_reader, + }) + } + + fn index_vertex_view>( + vertex: VertexView, + schema: &Schema, + writer: &W, + time_field: Field, + vertex_id_field: Field, + vertex_id_rev_field: Field, + ) -> tantivy::Result<()> { + let vertex_id: u64 = usize::from(vertex.vertex) as u64; + + let mut document = Document::new(); + // add the vertex_id + document.add_u64(vertex_id_field, vertex_id); + document.add_u64(vertex_id_rev_field, u64::MAX - vertex_id); + + let name_field = schema.get_field("name")?; + document.add_text(name_field, vertex.name()); + + for (temp_prop_name, temp_prop_value) in vertex.properties().temporal() { + let prop_field = schema.get_field(&temp_prop_name)?; + for (time, prop_value) in temp_prop_value { + // add time to the document + document.add_i64(time_field, time); + + Self::index_prop_value(&mut document, prop_field, prop_value); + } + } + + for (prop_name, prop_value) in vertex.properties().constant() { + let prop_field = schema.get_field(&prop_name)?; + Self::index_prop_value(&mut document, prop_field, prop_value); + } + + writer.add_document(document)?; + Ok(()) + } + + fn index_edge_view>( + e_ref: EdgeView, + schema: &Schema, + writer: &W, + time_field: Field, + source_field: Field, + destination_field: Field, + edge_id_field: Field, + ) -> tantivy::Result<()> { + let edge_ref = e_ref.eref(); + + let src = e_ref.src(); + let dst = e_ref.dst(); + + let mut document = Document::new(); + let edge_id: u64 = Into::::into(edge_ref.pid()) as u64; + document.add_u64(edge_id_field, edge_id); + document.add_text(source_field, src.name()); + document.add_text(destination_field, 
dst.name()); + + // add all time events + for e in e_ref.explode() { + if let Some(t) = e.time() { + document.add_i64(time_field, t); + } + } + + for (temp_prop_name, temp_prop_value) in e_ref.properties().temporal() { + let prop_field = schema.get_field(&temp_prop_name)?; + for (time, prop_value) in temp_prop_value { + // add time to the document + document.add_i64(time_field, time); + Self::index_prop_value(&mut document, prop_field, prop_value); + } + } + + for (prop_name, prop_value) in e_ref.properties().constant() { + let prop_field = schema.get_field(&prop_name)?; + Self::index_prop_value(&mut document, prop_field, prop_value); + } + + writer.add_document(document)?; // add the edge itself + Ok(()) + } + + pub fn index_edges(g: &G) -> tantivy::Result<(Index, IndexReader)> { + let schema = Self::schema_for_edge(g); + let (index, reader) = Self::new_index(schema.clone(), Self::default_edge_index_settings()); + + let time_field = schema.get_field(fields::TIME)?; + let source_field = schema.get_field(fields::SOURCE)?; + let destination_field = schema.get_field(fields::DESTINATION)?; + let edge_id_field = schema.get_field(fields::EDGE_ID)?; + + let writer = Arc::new(parking_lot::RwLock::new(index.writer(100_000_000)?)); + + let e_ids = (0..g.count_edges()).collect::>(); + let edge_filter = g.edge_filter(); + e_ids.par_chunks(128).try_for_each(|e_ids| { + let writer_lock = writer.clone(); + { + let writer_guard = writer_lock.read(); + for e_id in e_ids { + if let Some(e_ref) = + g.find_edge_id((*e_id).into(), &g.layer_ids(), edge_filter.as_deref()) + { + let e_view = EdgeView::new(g.clone(), e_ref); + Self::index_edge_view( + e_view, + &schema, + &writer_guard, + time_field, + source_field, + destination_field, + edge_id_field, + )?; + } + } + } + + let mut writer_guard = writer_lock.write(); + writer_guard.commit()?; + Ok::<(), TantivyError>(()) + })?; + + reader.reload()?; + Ok((index, reader)) + } + + fn default_vertex_index_settings() -> IndexSettings { + 
IndexSettings::default() + } + + fn default_edge_index_settings() -> IndexSettings { + IndexSettings::default() + } + + fn new_index(schema: Schema, index_settings: IndexSettings) -> (Index, IndexReader) { + let index = Index::builder() + .settings(index_settings) + .schema(schema) + .create_in_ram() + .expect("failed to create index"); + + let reader = index + .reader_builder() + .reload_policy(tantivy::ReloadPolicy::Manual) + .try_into() + .unwrap(); + (index, reader) + } + + pub fn new(graph: G, vertex_props: I, edge_props: I2) -> Self + where + S: AsRef, + I: IntoIterator, + I2: IntoIterator, + { + let schema = Self::schema_from_props(vertex_props); + + let (index, reader) = Self::new_index(schema, Self::default_vertex_index_settings()); + + let schema = Self::schema_from_props(edge_props); + + let (edge_index, edge_reader) = + Self::new_index(schema, Self::default_edge_index_settings()); + + IndexedGraph { + graph, + vertex_index: Arc::new(index), + edge_index: Arc::new(edge_index), + reader, + edge_reader, + } + } + + pub fn reload(&self) -> Result<(), GraphError> { + self.reader.reload()?; + Ok(()) + } + + fn resolve_vertex_from_search_result( + &self, + vertex_id: Field, + doc: Document, + ) -> Option> { + let vertex_id: usize = doc + .get_first(vertex_id) + .and_then(|value| value.as_u64())? + .try_into() + .ok()?; + let vertex_id = VertexRef::Internal(vertex_id.into()); + self.graph.vertex(vertex_id) + } + + fn resolve_edge_from_search_result( + &self, + edge_id: Field, + doc: Document, + ) -> Option> { + let edge_id: usize = doc + .get_first(edge_id) + .and_then(|value| value.as_u64())? 
+ .try_into() + .ok()?; + let e_ref = self.graph.find_edge_id( + edge_id.into(), + &self.graph.layer_ids(), + self.graph.edge_filter().as_deref(), + )?; + let e_view = EdgeView::new(self.graph.clone(), e_ref); + Some(e_view) + } + + pub fn search( + &self, + q: &str, + limit: usize, + offset: usize, + ) -> Result>, GraphError> { + let searcher = self.reader.searcher(); + let query_parser = tantivy::query::QueryParser::for_index(&self.vertex_index, vec![]); + let query = query_parser.parse_query(q)?; + + let ranking = TopDocs::with_limit(limit).and_offset(offset); + + let top_docs = searcher.search(&query, &ranking)?; + + let vertex_id = self.vertex_index.schema().get_field(fields::VERTEX_ID)?; + + let results = top_docs + .into_iter() + .map(|(_, doc_address)| searcher.doc(doc_address)) + .filter_map(Result::ok) + .filter_map(|doc| self.resolve_vertex_from_search_result(vertex_id, doc)) + .collect::>(); + + Ok(results) + } + + pub fn search_edges( + &self, + q: &str, + limit: usize, + offset: usize, + ) -> Result>, GraphError> { + let searcher = self.edge_reader.searcher(); + let query_parser = tantivy::query::QueryParser::for_index(&self.edge_index, vec![]); + let query = query_parser.parse_query(q)?; + + let ranking = TopDocs::with_limit(limit).and_offset(offset); + + let top_docs = searcher.search(&query, &ranking)?; + + let edge_id = self.edge_index.schema().get_field(fields::EDGE_ID)?; + + let results = top_docs + .into_iter() + .map(|(_, doc_address)| searcher.doc(doc_address)) + .filter_map(Result::ok) + .filter_map(|doc| self.resolve_edge_from_search_result(edge_id, doc)) + .collect::>(); + + Ok(results) + } +} + +impl InternalAdditionOps for IndexedGraph { + #[inline] + fn next_event_id(&self) -> usize { + self.graph.next_event_id() + } + #[inline] + fn resolve_layer(&self, layer: Option<&str>) -> usize { + self.graph.resolve_layer(layer) + } + + #[inline] + fn resolve_vertex(&self, id: u64, name: Option<&str>) -> VID { + self.graph.resolve_vertex(id, 
name) + } + + #[inline] + fn resolve_graph_property(&self, prop: &str, is_static: bool) -> usize { + self.graph.resolve_graph_property(prop, is_static) + } + + #[inline] + fn resolve_vertex_property( + &self, + prop: &str, + dtype: PropType, + is_static: bool, + ) -> Result { + self.graph.resolve_vertex_property(prop, dtype, is_static) + } + + #[inline] + fn resolve_edge_property( + &self, + prop: &str, + dtype: PropType, + is_static: bool, + ) -> Result { + self.graph.resolve_edge_property(prop, dtype, is_static) + } + + #[inline] + fn process_prop_value(&self, prop: Prop) -> Prop { + self.graph.process_prop_value(prop) + } + + fn internal_add_vertex( + &self, + t: TimeIndexEntry, + v: VID, + props: Vec<(usize, Prop)>, + ) -> Result<(), GraphError> { + let mut document = Document::new(); + // add time to the document + let time = self.vertex_index.schema().get_field(fields::TIME)?; + document.add_i64(time, *t.t()); + // add name to the document + + let name = self.vertex_index.schema().get_field(fields::NAME)?; + document.add_text(name, self.graph.vertex_name(v)); + + // index all props that are declared in the schema + for (prop_id, prop) in props.iter() { + let prop_name = self.graph.vertex_meta().get_prop_name(*prop_id, false); + if let Ok(field) = self.vertex_index.schema().get_field(&prop_name) { + if let Prop::Str(s) = prop { + document.add_text(field, s) + } + } + } + // add the vertex id to the document + self.graph.internal_add_vertex(t, v, props)?; + // get the field from the index + let vertex_id = self.vertex_index.schema().get_field(fields::VERTEX_ID)?; + let vertex_id_rev = self + .vertex_index + .schema() + .get_field(fields::VERTEX_ID_REV)?; + let index_v_id: u64 = Into::::into(v) as u64; + + document.add_u64(vertex_id, index_v_id); + document.add_u64(vertex_id_rev, u64::MAX - index_v_id); + + let mut writer = self.vertex_index.writer(50_000_000)?; + + writer.add_document(document)?; + + writer.commit()?; + + Ok(()) + } + + fn internal_add_edge( + 
&self, + _t: TimeIndexEntry, + _src: VID, + _dst: VID, + _props: Vec<(usize, Prop)>, + _layer: usize, + ) -> Result { + todo!() + } +} + +#[cfg(test)] +mod test { + use std::time::SystemTime; + + use tantivy::{doc, DocAddress}; + + use super::*; + + #[test] + fn index_numeric_props() { + let graph = Graph::new(); + + graph + .add_vertex( + 1, + "Blerg", + [ + ("age".to_string(), Prop::U64(42)), + ("balance".to_string(), Prop::I64(-1234)), + ], + ) + .expect("failed to add vertex"); + + let ig: IndexedGraph = graph.into(); + + let results = ig + .search("age:42", 5, 0) + .expect("failed to search for vertex") + .into_iter() + .map(|v| v.name()) + .collect::>(); + + assert_eq!(results, vec!["Blerg"]); + } + + #[test] + #[ignore = "this test is for experiments with the jira graph"] + fn load_jira_graph() -> Result<(), GraphError> { + let graph = Graph::load_from_file("/tmp/graphs/jira").expect("failed to load graph"); + assert!(graph.count_vertices() > 0); + + let now = SystemTime::now(); + + let index_graph: IndexedGraph = graph.into(); + let elapsed = now.elapsed().unwrap().as_secs(); + println!("indexing took: {:?}", elapsed); + + let issues = index_graph.search("name:'DEV-1690'", 5, 0)?; + + assert!(!issues.is_empty()); + + let names = issues.into_iter().map(|v| v.name()).collect::>(); + println!("names: {:?}", names); + + Ok(()) + } + + #[test] + fn create_indexed_graph_from_existing_graph() { + let graph = Graph::new(); + + graph + .add_vertex(1, "Gandalf", [("kind".to_string(), Prop::str("Wizard"))]) + .expect("add vertex failed"); + + graph + .add_vertex( + 2, + "Frodo", + [ + ("kind".to_string(), Prop::str("Hobbit")), + ("has_ring".to_string(), Prop::str("yes")), + ], + ) + .expect("add vertex failed"); + + graph + .add_vertex(2, "Merry", [("kind".to_string(), Prop::str("Hobbit"))]) + .expect("add vertex failed"); + + graph + .add_vertex(4, "Gollum", [("kind".to_string(), Prop::str("Creature"))]) + .expect("add vertex failed"); + + graph + .add_vertex(9, 
"Gollum", [("has_ring".to_string(), Prop::str("yes"))]) + .expect("add vertex failed"); + + graph + .add_vertex(9, "Frodo", [("has_ring".to_string(), Prop::str("no"))]) + .expect("add vertex failed"); + + graph + .add_vertex(10, "Frodo", [("has_ring".to_string(), Prop::str("yes"))]) + .expect("add vertex failed"); + + graph + .add_vertex(10, "Gollum", [("has_ring".to_string(), Prop::str("no"))]) + .expect("add vertex failed"); + + let indexed_graph: IndexedGraph = + IndexedGraph::from_graph(&graph).expect("failed to generate index from graph"); + indexed_graph.reload().expect("failed to reload index"); + + let results = indexed_graph + .search("kind:hobbit", 10, 0) + .expect("search failed"); + let mut actual = results.into_iter().map(|v| v.name()).collect::>(); + let mut expected = vec!["Frodo", "Merry"]; + // FIXME: this is not deterministic + actual.sort(); + expected.sort(); + + assert_eq!(actual, expected); + + let results = indexed_graph + .search("kind:wizard", 10, 0) + .expect("search failed"); + let actual = results.into_iter().map(|v| v.name()).collect::>(); + let expected = vec!["Gandalf"]; + assert_eq!(actual, expected); + + let results = indexed_graph + .search("kind:creature", 10, 0) + .expect("search failed"); + let actual = results.into_iter().map(|v| v.name()).collect::>(); + let expected = vec!["Gollum"]; + assert_eq!(actual, expected); + + // search by name + let results = indexed_graph + .search("name:gollum", 10, 0) + .expect("search failed"); + let actual = results.into_iter().map(|v| v.name()).collect::>(); + let expected = vec!["Gollum"]; + assert_eq!(actual, expected); + } + + #[test] + fn add_vertex_search_by_name() { + let graph = IndexedGraph::new(Graph::new(), NO_PROPS, NO_PROPS); + + graph + .add_vertex(1, "Gandalf", NO_PROPS) + .expect("add vertex failed"); + + graph.reload().expect("reload failed"); + + let vertices = graph + .search(r#"name:gandalf"#, 10, 0) + .expect("search failed"); + + let actual = vertices.into_iter().map(|v| 
v.name()).collect::>(); + let expected = vec!["Gandalf"]; + + assert_eq!(actual, expected); + } + + #[test] + fn add_vertex_search_by_description() { + let graph = IndexedGraph::new(Graph::new(), [("description", Prop::str(""))], NO_PROPS); + + graph + .add_vertex( + 1, + "Bilbo", + [("description".to_string(), Prop::str("A hobbit"))], + ) + .expect("add vertex failed"); + + graph + .add_vertex( + 2, + "Gandalf", + [("description".to_string(), Prop::str("A wizard"))], + ) + .expect("add vertex failed"); + + graph.reload().expect("reload failed"); + // Find the Wizard + let vertices = graph + .search(r#"description:wizard"#, 10, 0) + .expect("search failed"); + let actual = vertices.into_iter().map(|v| v.name()).collect::>(); + let expected = vec!["Gandalf"]; + assert_eq!(actual, expected); + // Find the Hobbit + let vertices = graph + .search(r#"description:'hobbit'"#, 10, 0) + .expect("search failed"); + let actual = vertices.into_iter().map(|v| v.name()).collect::>(); + let expected = vec!["Bilbo"]; + assert_eq!(actual, expected); + } + + #[test] + fn add_vertex_search_by_description_and_time() { + let graph = IndexedGraph::new(Graph::new(), [("description", Prop::str(""))], NO_PROPS); + + graph + .add_vertex( + 1, + "Gandalf", + [("description".to_string(), Prop::str("The wizard"))], + ) + .expect("add vertex failed"); + + graph + .add_vertex( + 2, + "Saruman", + [("description".to_string(), Prop::str("Another wizard"))], + ) + .expect("add vertex failed"); + + graph.reload().expect("reload failed"); + // Find Saruman + let vertices = graph + .search(r#"description:wizard AND time:[2 TO 5]"#, 10, 0) + .expect("search failed"); + let actual = vertices.into_iter().map(|v| v.name()).collect::>(); + let expected = vec!["Saruman"]; + assert_eq!(actual, expected); + // Find Gandalf + let vertices = graph + .search(r#"description:'wizard' AND time:[1 TO 2}"#, 10, 0) + .expect("search failed"); + let actual = vertices.into_iter().map(|v| v.name()).collect::>(); + let 
expected = vec!["Gandalf"]; + assert_eq!(actual, expected); + // Find both wizards + let vertices = graph + .search(r#"description:'wizard' AND time:[1 TO 100]"#, 10, 0) + .expect("search failed"); + let mut actual = vertices.into_iter().map(|v| v.name()).collect::>(); + let mut expected = vec!["Gandalf", "Saruman"]; + + // FIXME: this is not deterministic + actual.sort(); + expected.sort(); + + assert_eq!(actual, expected); + } + + #[test] + fn search_by_edge_props() { + let g = Graph::new(); + + g.add_edge( + 1, + "Frodo", + "Gandalf", + [("type".to_string(), Prop::str("friends"))], + None, + ) + .expect("add edge failed"); + g.add_edge( + 1, + "Frodo", + "Gollum", + [("type".to_string(), Prop::str("enemies"))], + None, + ) + .expect("add edge failed"); + + let ig: IndexedGraph = g.into(); + + let results = ig + .search_edges(r#"type:friends"#, 10, 0) + .expect("search failed"); + let actual = results + .into_iter() + .map(|e| (e.src().name(), e.dst().name())) + .collect::>(); + let expected = vec![("Frodo".to_string(), "Gandalf".to_string())]; + + assert_eq!(actual, expected); + + let results = ig + .search_edges(r#"type:enemies"#, 10, 0) + .expect("search failed"); + let actual = results + .into_iter() + .map(|e| (e.src().name(), e.dst().name())) + .collect::>(); + let expected = vec![("Frodo".to_string(), "Gollum".to_string())]; + + assert_eq!(actual, expected); + } + + #[test] + fn search_by_edge_src_dst() { + let g = Graph::new(); + + g.add_edge(1, "Frodo", "Gandalf", NO_PROPS, None) + .expect("add edge failed"); + g.add_edge(1, "Frodo", "Gollum", NO_PROPS, None) + .expect("add edge failed"); + + let ig: IndexedGraph = g.into(); + + let results = ig + .search_edges(r#"from:Frodo"#, 10, 0) + .expect("search failed"); + let mut actual = results + .into_iter() + .map(|e| (e.src().name(), e.dst().name())) + .collect::>(); + let mut expected = vec![ + ("Frodo".to_string(), "Gandalf".to_string()), + ("Frodo".to_string(), "Gollum".to_string()), + ]; + + 
actual.sort(); + expected.sort(); + + assert_eq!(actual, expected); + + // search by destination + let results = ig.search_edges("to:gollum", 10, 0).expect("search failed"); + let actual = results + .into_iter() + .map(|e| (e.src().name(), e.dst().name())) + .collect::>(); + let expected = vec![("Frodo".to_string(), "Gollum".to_string())]; + + assert_eq!(actual, expected); + } + + #[test] + fn tantivy_101() { + let vertex_index_props = vec!["name"]; + + let mut schema = Schema::builder(); + + for prop in vertex_index_props { + schema.add_text_field(prop.as_ref(), TEXT); + } + + // ensure time is part of the index + schema.add_u64_field("time", INDEXED | STORED); + // ensure we add vertex_id as stored to get back the vertex id after the search + schema.add_text_field("vertex_id", FAST | STORED); + + let index = Index::create_in_ram(schema.build()); + + let reader = index + .reader_builder() + .reload_policy(tantivy::ReloadPolicy::OnCommit) + .try_into() + .unwrap(); + + { + let mut writer = index.writer(50_000_000).unwrap(); + + let name = index.schema().get_field("name").unwrap(); + let time = index.schema().get_field("time").unwrap(); + let vertex_id = index.schema().get_field("vertex_id").unwrap(); + + writer + .add_document(doc!(name => "Gandalf", time => 1u64, vertex_id => 0u64)) + .expect("add document failed"); + + writer.commit().expect("commit failed"); + } + + reader.reload().unwrap(); + + let searcher = reader.searcher(); + + let query_parser = tantivy::query::QueryParser::for_index(&index, vec![]); + let query = query_parser.parse_query(r#"name:"gandalf""#).unwrap(); + + let ranking = TopDocs::with_limit(10).order_by_u64_field(fields::VERTEX_ID.to_string()); + let top_docs: Vec<(u64, DocAddress)> = searcher.search(&query, &ranking).unwrap(); + + assert!(!top_docs.is_empty()); + } + + #[test] + fn property_name_on_vertex_does_not_crash() { + let g = Graph::new(); + g.add_vertex(0, "test", [("name", "test")]).unwrap(); + let gi: IndexedGraph<_> = g.into(); 
+ } +} diff --git a/raphtory/src/vectors/mod.rs b/raphtory/src/vectors/mod.rs new file mode 100644 index 0000000000..3ef1bd3aa2 --- /dev/null +++ b/raphtory/src/vectors/mod.rs @@ -0,0 +1,976 @@ +// use async_openai::types::{CreateEmbeddingRequest, EmbeddingInput}; +// use async_openai::Client; +use async_trait::async_trait; +use futures_util::future::{join_all, BoxFuture}; +// use futures_util::StreamExt; +use itertools::{chain, Itertools}; +use serde::{Deserialize, Serialize, Serializer}; +use std::{ + borrow::Borrow, + collections::{hash_map::DefaultHasher, HashMap, HashSet}, + convert::identity, + fmt::{Display, Formatter}, + fs::{create_dir_all, File}, + future::Future, + hash::{Hash, Hasher}, + io::{BufReader, BufWriter}, + path::Path, +}; + +// use crate::model::graph::edge::Edge; +// use numpy::PyArray2; +// use pyo3::{types::IntoPyDict, Python}; +use crate::{ + db::{ + api::view::internal::{DynamicGraph, IntoDynamic}, + graph::{edge::EdgeView, vertex::VertexView, views::window_graph::WindowedGraph}, + }, + prelude::{EdgeViewOps, GraphViewOps, Layer, LayerOps, TimeOps, VertexViewOps}, +}; + +// #[derive(Clone)] +// struct EdgeId { +// src: u64, +// dst: u64, +// } + +#[derive(Clone, Debug, Eq, PartialEq, Hash)] +enum EntityId { + Node { id: u64 }, + Edge { src: u64, dst: u64 }, +} + +impl EntityId { + fn as_node(&self) -> u64 { + match self { + EntityId::Node { id } => *id, + EntityId::Edge { .. 
} => panic!("edge id unwrapped as a node id"), + } + } +} + +impl From<&VertexView> for EntityId { + fn from(value: &VertexView) -> Self { + EntityId::Node { id: value.id() } + } +} + +impl From> for EntityId { + fn from(value: VertexView) -> Self { + EntityId::Node { id: value.id() } + } +} + +impl From<&EdgeView> for EntityId { + fn from(value: &EdgeView) -> Self { + EntityId::Edge { + src: value.src().id(), + dst: value.dst().id(), + } + } +} + +impl From> for EntityId { + fn from(value: EdgeView) -> Self { + EntityId::Edge { + src: value.src().id(), + dst: value.dst().id(), + } + } +} + +pub trait EmbeddingFunction: Send + Sync { + fn call(&self, texts: Vec) -> BoxFuture<'static, Vec>; +} + +impl EmbeddingFunction for T +where + T: Fn(Vec) -> F + Send + Sync, + F: Future> + Send + 'static, +{ + fn call(&self, texts: Vec) -> BoxFuture<'static, Vec> { + Box::pin(self(texts)) + } +} + +#[async_trait] +pub trait Vectorizable { + async fn vectorize( + &self, + embedding: Box, + cache_dir: &Path, + ) -> VectorizedGraph; + + async fn vectorize_with_templates( + &self, + embedding: Box, + cache_dir: &Path, + node_template: N, + edge_template: E, + // FIXME: I tried to put templates behind an option but didn't work and hadn't time to fix it + ) -> VectorizedGraph + where + N: Fn(&VertexView) -> String + Sync + Send + 'static, + E: Fn(&EdgeView) -> String + Sync + Send + 'static; +} + +#[async_trait] +impl Vectorizable for G { + async fn vectorize( + &self, + embedding: Box, + cache_dir: &Path, + ) -> VectorizedGraph { + let node_template = |vertex: &VertexView| default_node_template(vertex); + let edge_template = |edge: &EdgeView| default_edge_template(edge); + + self.vectorize_with_templates(embedding, cache_dir, node_template, edge_template) + .await + } + + async fn vectorize_with_templates( + &self, + embedding: Box, + cache_dir: &Path, + node_template: N, + edge_template: E, + ) -> VectorizedGraph + where + N: Fn(&VertexView) -> String + Sync + Send + 'static, + E: 
Fn(&EdgeView) -> String + Sync + Send + 'static, + { + create_dir_all(cache_dir).expect("Impossible to use cache dir"); + + let node_docs = self + .vertices() + .iter() + .map(|vertex| vertex.generate_doc(&node_template)); + let edge_docs = self.edges().map(|edge| edge.generate_doc(&edge_template)); + + let node_embeddings = generate_embeddings(node_docs, &embedding, cache_dir).await; + let edge_embeddings = generate_embeddings(edge_docs, &embedding, cache_dir).await; + + VectorizedGraph { + graph: self.clone(), + embedding, + node_embeddings, + edge_embeddings, + node_template: Box::new(node_template), + edge_template: Box::new(edge_template), + } + } +} + +fn default_node_template(vertex: &VertexView) -> String { + let name = vertex.name(); + let property_list = vertex.generate_property_list(&identity, vec![], vec![]); + format!("The entity {name} has the following details:\n{property_list}") +} + +#[allow(unstable_name_collisions)] // just update itertools when this is actually stabilised +fn default_edge_template(edge: &EdgeView) -> String { + let src = edge.src().name(); + let dst = edge.dst().name(); + // TODO: property list + + edge.layer_names() + .map(|layer| { + let times = edge + .layer(layer.clone()) + .unwrap() + .history() + .iter() + .join(", "); + match layer.as_ref() { + "_default" => format!("{src} interacted with {dst} at times: {times}"), + layer => format!("{src} {layer} {dst} at times: {times}"), + } + }) + .intersperse("\n".to_owned()) + .collect() +} + +pub struct VectorizedGraph { + graph: G, + embedding: Box, + node_embeddings: HashMap, + edge_embeddings: HashMap, + node_template: Box) -> String + Sync + Send>, + edge_template: Box) -> String + Sync + Send>, +} + +const CHUNK_SIZE: usize = 1000; + +impl VectorizedGraph { + // FIXME: this should return a Result + pub async fn similarity_search( + &self, + query: &str, + init: usize, + min_nodes: usize, + min_edges: usize, + limit: usize, + window_start: Option, + window_end: Option, + ) -> 
Vec { + let query_embedding = self.embedding.call(vec![query.to_owned()]).await.remove(0); + + let (graph, window_nodes, window_edges): ( + DynamicGraph, + Box>, + Box>, + ) = match (window_start, window_end) { + (None, None) => ( + self.graph.clone().into_dynamic(), + Box::new(self.node_embeddings.iter()), + Box::new(self.edge_embeddings.iter()), + ), + (start, end) => { + let start = start.unwrap_or(i64::MIN); + let end = end.unwrap_or(i64::MAX); + let window = self.graph.window(start, end); + let nodes = self.window_embeddings(&self.node_embeddings, &window); + let edges = self.window_embeddings(&self.edge_embeddings, &window); + ( + window.clone().into_dynamic(), + Box::new(nodes), + Box::new(edges), + ) + } + }; + + // FIRST STEP: ENTRY POINT SELECTION: + assert!( + min_nodes + min_edges <= init, + "min_nodes + min_edges needs to be less or equal to init" + ); + let generic_init = init - min_nodes - min_edges; + + let mut entry_point: Vec = vec![]; + + let scored_nodes = score_entities(&query_embedding, window_nodes); + let mut selected_nodes = find_top_k(scored_nodes, init); + + let scored_edges = score_entities(&query_embedding, window_edges); + let mut selected_edges = find_top_k(scored_edges, init); + + for _ in 0..min_nodes { + let (id, _) = selected_nodes.next().unwrap(); + entry_point.push(id.clone()); + } + for _ in 0..min_edges { + let (id, _) = selected_edges.next().unwrap(); + entry_point.push(id.clone()); + } + + let remaining_entities = find_top_k(chain!(selected_nodes, selected_edges), generic_init); + for (id, _distance) in remaining_entities { + entry_point.push(id.clone()); + } + + // SECONDS STEP: EXPANSION + let mut entity_ids = entry_point; + + while entity_ids.len() < limit { + let candidates = entity_ids.iter().flat_map(|id| match id { + EntityId::Node { id } => { + let edges = graph.vertex(*id).unwrap().edges(); + edges + .map(|edge| { + let edge_id = edge.into(); + let edge_embedding = self.edge_embeddings.get(&edge_id).unwrap(); + 
(edge_id, edge_embedding) + }) + .collect_vec() + } + EntityId::Edge { src, dst } => { + let edge = graph.edge(*src, *dst).unwrap(); + let src_id: EntityId = edge.src().into(); + let dst_id: EntityId = edge.dst().into(); + let src_embedding = self.node_embeddings.get(&src_id).unwrap(); + let dst_embedding = self.node_embeddings.get(&dst_id).unwrap(); + vec![(src_id, src_embedding), (dst_id, dst_embedding)] + } + }); + + let unique_candidates = candidates.unique_by(|(id, _)| id.clone()); + let valid_candidates = unique_candidates.filter(|(id, _)| !entity_ids.contains(id)); + let scored_candidates = score_entities(&query_embedding, valid_candidates); + let sorted_candidates = find_top_k(scored_candidates, usize::MAX); + let sorted_candidates_ids = sorted_candidates.map(|(id, _)| id).collect_vec(); + + if sorted_candidates_ids.is_empty() { + // TODO: use similarity search again with the whole graph with init + 1 !! + break; + } + + entity_ids.extend(sorted_candidates_ids); + } + + // FINAL STEP: REPRODUCE DOCUMENTS: + + entity_ids + .iter() + .take(limit) + .map(|id| match id { + EntityId::Node { id } => { + self.graph + .vertex(*id) + .unwrap() + .generate_doc(&self.node_template) + .content + } + EntityId::Edge { src, dst } => { + self.graph + .edge(*src, *dst) + .unwrap() + .generate_doc(&self.edge_template) + .content + } + }) + .collect_vec() + } + + fn window_embeddings<'a, I>( + &self, + embeddings: I, + window: &WindowedGraph, + ) -> impl Iterator + 'a + where + I: IntoIterator + 'a, + { + let window = window.clone(); + embeddings.into_iter().filter(move |(id, _)| match id { + EntityId::Node { id } => window.has_vertex(*id), + EntityId::Edge { src, dst } => window.has_edge(*src, *dst, Layer::All), + }) + } + + // pub async fn search_old( + // &self, + // query: &str, + // node_init: usize, + // edge_init: usize, + // limit: usize, + // ) -> Vec { + // let query_embedding = compute_embeddings(vec![query.to_owned()]).await.remove(0); + // + // let mut 
entry_point: Vec = vec![]; + // let selected_nodes = find_top_k(&query_embedding, &self.node_embeddings, node_init); + // let selected_edges = find_top_k(&query_embedding, &self.edge_embeddings, edge_init); + // for (id, distance) in chain!(selected_nodes, selected_edges) { + // println!(" - At {distance}: {id}"); + // entry_point.push(id.clone()); + // if let EntityId::Edge { src, dst } = id { + // entry_point.push(EntityId::Node { id: *src }); + // entry_point.push(EntityId::Node { id: *dst }); + // } + // } + // + // let mut entity_ids = entry_point; + // + // // it might happen that a node is include here twice, from two different paths in the graph + // // but that is not a problem because the entity_ids list is force to be unique + // let candidates: Vec = entity_ids + // .iter() + // .filter(|id| matches!(id, EntityId::Node { .. })) + // .flat_map(|id| self.get_candidates_from_node(&query_embedding, id)) + // .unique_by(|candidate| (candidate.node.clone(), candidate.edge.clone())) + // .collect_vec(); + // + // let mut sorted_candidates = SortedVec::from(candidates); + // + // println!("TODO: print sorted candidates"); + // + // while entity_ids.len() < limit && sorted_candidates.len() > 0 { + // let ExpandCandidate { node, edge, .. 
} = sorted_candidates.pop().unwrap(); + // // we could terminate the loop instead I guess + // + // if !entity_ids.contains(&node) { + // entity_ids.push(node.clone()); + // } + // if !entity_ids.contains(&edge) { + // entity_ids.push(edge); + // } + // + // for new_candidate in self.get_candidates_from_node(&query_embedding, &node) { + // let already_candidate = || { + // sorted_candidates + // .iter() + // .any(|candidate| candidate.edge == new_candidate.edge) + // }; + // let already_selected = || entity_ids.iter().any(|id| id == &new_candidate.edge); + // if !already_selected() && !already_candidate() { + // sorted_candidates.insert(new_candidate); + // } + // } + // } + // + // entity_ids + // .iter() + // .take(limit) + // .map(|id| match id { + // EntityId::Node { id } => { + // self.graph + // .vertex(*id) + // .unwrap() + // .generate_doc(&self.node_template) + // .content + // } + // EntityId::Edge { src, dst } => { + // self.graph + // .edge(*src, *dst) + // .unwrap() + // .generate_doc(&self.edge_template) + // .content + // } + // }) + // .collect_vec() + // } + + // returns an iterator of triplets: (node id, edge id, score) as candidates to be included in entity_ids + // fn get_candidates_from_node<'a>( + // &'a self, + // query: &'a Embedding, + // node_id: &EntityId, + // ) -> impl Iterator + 'a { + // let vertex = self.graph.vertex(node_id.as_node()).unwrap(); + // let in_edges = vertex.in_edges().map(move |edge| ExpandCandidate { + // node: (&edge.src()).into(), + // edge: (&edge).into(), + // score: self.score_pair(&query, edge.src(), edge), + // }); + // let out_edges = vertex.out_edges().map(move |edge| ExpandCandidate { + // node: (&edge.dst()).into(), + // edge: (&edge).into(), + // score: self.score_pair(&query, edge.dst(), edge), + // }); + // chain!(in_edges, out_edges) + // } + + // fn score_pair(&self, query: &Embedding, node: VertexView, edge: EdgeView) -> f32 { + // let node_vector = self.node_embeddings.get(&(&node).into()).unwrap(); 
+ // let node_similarity = cosine(query, node_vector); + // let edge_vector = self.edge_embeddings.get(&(&edge).into()).unwrap(); + // let edge_similarity = cosine(query, edge_vector); + // + // if node_similarity > edge_similarity { + // node_similarity + // } else { + // edge_similarity + // } + // } +} + +async fn generate_embeddings( + docs: I, + embedding: &Box, + cache_dir: &Path, +) -> HashMap +where + I: Iterator, +{ + // ----------------- SEQUENTIAL-ASYNC-VERSION ----------------- + // let mut embeddings = vec![]; + // let embedding_stream = stream! { + // for doc in docs { + // yield (doc.id, doc_to_vec(doc, cache_dir)) + // } + // }; + // pin_mut!(embedding_stream); + // while let Some(embedding) = embedding_stream.next() { + // embeddings.push(embedding); + // } + // ------------------------------------------------------------ + + let mut embeddings = HashMap::new(); + let mut misses = vec![]; + + for doc in docs { + match retrieve_embedding_from_cache(&doc, cache_dir) { + Some(embedding) => { + embeddings.insert(doc.id, embedding); + } + None => misses.push(doc), + } + } + + let embedding_tasks = misses + .chunks(CHUNK_SIZE) + .map(|chunk| compute_embeddings_with_cache(chunk.to_vec(), embedding, cache_dir)); + let computed_embeddings = join_all(embedding_tasks).await.into_iter().flatten(); + for (id, embedding) in computed_embeddings { + embeddings.insert(id, embedding); + } + + embeddings +} + +async fn compute_embeddings_with_cache( + docs: Vec, + embedding: &Box, + cache_dir: &Path, +) -> Vec<(EntityId, Embedding)> { + let texts = docs.iter().map(|doc| doc.content.clone()).collect_vec(); + let embeddings = embedding.call(texts).await; + docs.into_iter() + .zip(embeddings) + .map(|(doc, embedding)| { + let doc_hash = hash_doc(&doc); // FIXME: I'm hashing twice + let embedding_cache = EmbeddingCache { + doc_hash, + embedding, + }; + let doc_path = cache_dir.join(doc.id.to_string()); + let doc_file = + File::create(doc_path).expect("Couldn't create 
file to store embedding cache"); + let mut doc_writer = BufWriter::new(doc_file); + bincode::serialize_into(&mut doc_writer, &embedding_cache) + .expect("Couldn't serialize embedding cache"); + (doc.id, embedding_cache.embedding) + }) + .collect_vec() +} + +fn retrieve_embedding_from_cache(doc: &EntityDocument, cache_dir: &Path) -> Option { + let doc_path = cache_dir.join(doc.id.to_string()); + let doc_file = File::open(doc_path).ok()?; + let mut doc_reader = BufReader::new(doc_file); + let embedding_cache: EmbeddingCache = bincode::deserialize_from(&mut doc_reader).ok()?; + let doc_hash = hash_doc(doc); + if doc_hash == embedding_cache.doc_hash { + Some(embedding_cache.embedding) + } else { + None + } +} + +// fn find_top_k_old<'a>( +// query: &'a Embedding, +// entities: &'a HashMap, +// k: usize, +// ) -> impl Iterator { +// entities +// .iter() +// .map(|(id, embedding)| (id, cosine(query, embedding))) +// .sorted_by(|(_, d1), (_, d2)| d1.partial_cmp(d2).unwrap().reverse()) +// // We use reverse because default sorting is ascending but we want it descending +// .take(k) +// } + +fn score_entities<'a, I, E>( + query: &'a Embedding, + entities: I, +) -> impl Iterator + 'a +where + I: IntoIterator + 'a, + E: Borrow + 'a, +{ + entities + .into_iter() + .map(|(id, embedding)| (id, cosine(query, embedding))) +} + +/// Returns the top k nodes in descending order +fn find_top_k<'a, I, E>(entities: I, k: usize) -> impl Iterator + 'a +where + I: Iterator + 'a, + E: Borrow + 'a, +{ + entities + .sorted_by(|(_, d1), (_, d2)| d1.partial_cmp(d2).unwrap().reverse()) + // We use reverse because default sorting is ascending but we want it descending + .take(k) +} + +fn cosine(vector1: &Embedding, vector2: &Embedding) -> f32 { + assert_eq!(vector1.len(), vector2.len()); + + let dot_product: f32 = vector1.iter().zip(vector2.iter()).map(|(x, y)| x * y).sum(); + let x_length: f32 = vector1.iter().map(|x| x * x).sum(); + let y_length: f32 = vector2.iter().map(|y| y * y).sum(); + // 
TODO: store the length of the vector as well so we don't need to recompute it + // Vectors are already normalized for ada but nor for all the models: + // see: https://platform.openai.com/docs/guides/embeddings/which-distance-function-should-i-use + + dot_product / (x_length.sqrt() * y_length.sqrt()) + // dot_product + // TODO: assert that the result is between -1 and 1 +} + +#[derive(Clone)] +pub struct EntityDocument { + id: EntityId, + content: String, +} + +#[derive(Serialize, Deserialize)] +struct EmbeddingCache { + doc_hash: u64, + embedding: Embedding, +} + +pub type Embedding = Vec; + +// async fn compute_embeddings(texts: Vec) -> Vec { +// println!("computing embeddings for {} texts", texts.len()); +// Python::with_gil(|py| { +// let sentence_transformers = py.import("sentence_transformers")?; +// let locals = [("sentence_transformers", sentence_transformers)].into_py_dict(py); +// locals.set_item("texts", texts); +// +// let pyarray: &PyArray2 = py +// .eval( +// &format!( +// "sentence_transformers.SentenceTransformer('thenlper/gte-small').encode(texts)" +// ), +// Some(locals), +// None, +// )? 
+// .extract()?; +// +// let readonly = pyarray.readonly(); +// let chunks = readonly.as_slice().unwrap().chunks(384).into_iter(); +// let embeddings = chunks +// .map(|chunk| chunk.iter().copied().collect_vec()) +// .collect_vec(); +// +// Ok::>, Box>(embeddings) +// }) +// .unwrap() +// } + +fn hash_doc(doc: &EntityDocument) -> u64 { + let mut hasher = DefaultHasher::new(); + doc.content.hash(&mut hasher); + hasher.finish() +} + +impl Display for EntityId { + fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result { + match self { + EntityId::Node { id } => f.serialize_u64(*id), + EntityId::Edge { src, dst } => { + f.serialize_u64(*src) + .expect("src ID couldn't be serialized"); + f.write_str("-") + .expect("edge ID separator couldn't be serialized"); + f.serialize_u64(*dst) + } + } + } +} + +pub trait GraphEntity: Sized { + // fn entity_id(&self) -> EntityId; + fn generate_doc(&self, template: &T) -> EntityDocument + where + T: Fn(&Self) -> String; + + fn generate_property_list( + &self, + time_fmt: &F, + filter_out: Vec<&str>, + force_static: Vec<&str>, + ) -> String + where + F: Fn(i64) -> D, + D: Display; +} + +impl GraphEntity for VertexView { + #[allow(unstable_name_collisions)] // just update itertools when this is actually stabilised + fn generate_property_list( + &self, + time_fmt: &F, + filter_out: Vec<&str>, + force_static: Vec<&str>, + ) -> String + where + F: Fn(i64) -> D, + D: Display, + { + let time_fmt = |time: i64| time_fmt(time).to_string(); + let missing = || "missing".to_owned(); + let min_time_fmt = self.earliest_time().map(time_fmt).unwrap_or_else(missing); + let min_time = format!("earliest activity: {}", min_time_fmt); + let max_time_fmt = self.latest_time().map(time_fmt).unwrap_or_else(missing); + let max_time = format!("latest activity: {}", max_time_fmt); + + let temporal_props = self + .properties() + .temporal() + .iter() + .filter(|(key, _)| !filter_out.contains(&key.as_ref())) + .filter(|(key, _)| 
!force_static.contains(&key.as_ref())) + .filter(|(_, v)| { + // the history of the temporal prop has more than one value + v.values() + .into_iter() + .map(|prop| prop.to_string()) + .unique() + .collect_vec() + .len() + > 1 + }) + .collect_vec(); + + let temporal_keys: HashSet<_> = temporal_props.iter().map(|(key, _)| key).collect(); + let temporal_props = temporal_props.iter().map(|(key, value)| { + let time_value_pairs = value.iter().map(|(k, v)| (k, v.to_string())); + time_value_pairs + .unique_by(|(_, value)| value.clone()) + .map(|(time, value)| { + let time = time_fmt(time); + format!("{key} changed to {value} at {time}") + }) + .intersperse("\n".to_owned()) + .collect() + }); + + let prop_storage = self.properties(); + + let static_props = prop_storage + .keys() + .filter(|key| !filter_out.contains(&key.as_ref())) + .filter(|key| !temporal_keys.contains(key)) + .map(|key| { + let prop = prop_storage.get(&key).unwrap().to_string(); + let key = key.to_string(); + format!("{key}: {prop}") + }); + + let props = chain!(static_props, temporal_props).sorted_by(|a, b| a.len().cmp(&b.len())); + // We sort by length so when cutting out the tail of the document we don't remove small properties + + let lines = chain!([min_time, max_time], props); + lines.intersperse("\n".to_owned()).collect() + } + + fn generate_doc(&self, template: &T) -> EntityDocument + where + T: Fn(&Self) -> String, + { + let raw_content = template(self); + let content = match raw_content.char_indices().nth(1000) { + Some((index, _)) => (&raw_content[..index]).to_owned(), + None => raw_content, + }; + // TODO: allow multi document entities !!!!! 
+ // shortened to 1000 (around 250 tokens) to avoid exceeding the max number of tokens, + // when embedding but also when inserting documents into prompts + + EntityDocument { + id: EntityId::Node { id: self.id() }, + content, + } + } +} + +impl GraphEntity for EdgeView { + fn generate_property_list( + &self, + _time_fmt: &F, + _filter_out: Vec<&str>, + _force_static: Vec<&str>, + ) -> String + where + F: Fn(i64) -> D, + D: Display, + { + // TODO: not needed yet + "".to_owned() + } + fn generate_doc(&self, template: &T) -> EntityDocument + where + T: Fn(&Self) -> String, + { + let content = template(self); + EntityDocument { + id: EntityId::Edge { + src: self.src().id(), + dst: self.dst().id(), + }, + content, + } + } +} + +// TODO: re-enable +// #[cfg(test)] +// mod vector_tests { +// use super::*; +// use crate::{ +// core::Prop, +// prelude::{AdditionOps, Graph}, +// }; +// use std::path::PathBuf; +// +// const NO_PROPS: [(&str, Prop); 0] = []; +// +// fn format_time(time: i64) -> String { +// format!("line {time}") +// } +// +// fn node_template(vertex: &VertexView) -> String { +// let name = vertex.name(); +// let node_type = vertex.properties().get("type").unwrap().to_string(); +// let property_list = +// vertex.generate_property_list(&format_time, vec!["type", "_id"], vec![]); +// format!("{name} is a {node_type} with the following details:\n{property_list}") +// } +// +// fn edge_template(edge: &EdgeView) -> String { +// let src = edge.src().name(); +// let dst = edge.dst().name(); +// let lines = edge.history().iter().join(","); +// format!("{src} appeared with {dst} in lines: {lines}") +// } +// +// // TODO: test default templates +// +// #[test] +// fn test_node_into_doc() { +// let g = Graph::new(); +// g.add_vertex( +// 0, +// "Frodo", +// [ +// ("type".to_string(), Prop::str("hobbit")), +// ("age".to_string(), Prop::str("30")), +// ], +// ) +// .unwrap(); +// +// let doc = g +// .vertex("Frodo") +// .unwrap() +// .generate_doc(&node_template) +// 
.content; +// let expected_doc = r###"Frodo is a hobbit with the following details: +// earliest activity: line 0 +// latest activity: line 0 +// age: 30"###; +// assert_eq!(doc, expected_doc); +// } +// +// #[test] +// fn test_edge_into_doc() { +// let g = Graph::new(); +// g.add_edge(0, "Frodo", "Gandalf", NO_PROPS, Some("talk to")) +// .unwrap(); +// +// let doc = g +// .edge("Frodo", "Gandalf") +// .unwrap() +// .generate_doc(&edge_template) +// .content; +// let expected_doc = "Frodo appeared with Gandalf in lines: 0"; +// assert_eq!(doc, expected_doc); +// } +// +// #[tokio::test] +// async fn test_vector_store() { +// let g = Graph::new(); +// g.add_vertex( +// 0, +// "Gandalf", +// [ +// ("type".to_string(), Prop::str("wizard")), +// ("age".to_string(), Prop::str("120")), +// ], +// ) +// .unwrap(); +// g.add_vertex( +// 0, +// "Frodo", +// [ +// ("type".to_string(), Prop::str("hobbit")), +// ("age".to_string(), Prop::str("30")), +// ], +// ) +// .unwrap(); +// g.add_edge(0, "Frodo", "Gandalf", NO_PROPS, Some("talk to")) +// .unwrap(); +// g.add_vertex( +// 2, +// "Aragorn", +// [ +// ("type".to_string(), Prop::str("human")), +// ("age".to_string(), Prop::str("40")), +// ], +// ) +// .unwrap(); +// +// dotenv().ok(); +// let vec_store = VectorStore::load_graph( +// g, +// &PathBuf::from("/tmp/raphtory/vector-cache-lotr-test"), +// Some(Box::new(node_template)), +// Some(Box::new(edge_template)), +// ) +// .await; +// +// let docs = vec_store +// .search("Find a magician", 1, 0, 0, 1, None, None) +// .await; +// assert!(docs[0].contains("Gandalf is a wizard")); +// +// let docs = vec_store +// .search("Find a young person", 1, 0, 0, 1, None, None) +// .await; +// assert!(docs[0].contains("Frodo is a hobbit")); // this fails when using gte-small +// +// // with window! 
+// let docs = vec_store +// .search("Find a young person", 1, 0, 0, 1, Some(1), Some(3)) +// .await; +// assert!(!docs[0].contains("Frodo is a hobbit")); // this fails when using gte-small +// +// let docs = vec_store +// .search( +// "Has anyone appeared with anyone else?", +// 1, +// 0, +// 0, +// 1, +// None, +// None, +// ) +// .await; +// assert!(docs[0].contains("Frodo appeared with Gandalf")); +// } +// +// fn average_vectors(vec1: &Embedding, vec2: &Embedding) -> Embedding { +// vec1.iter() +// .zip(vec2) +// .map(|(a, b)| (a + b) / 2.0) +// .collect_vec() +// } +// +// #[tokio::test] +// async fn test_combinations() { +// dotenv().ok(); +// // I want to test if a document tuple node-edge can rank higher than +// +// let ticket = "DEV-1303 is an issue created by the Pometry team with the following details:\nearliest activity: 1667924841177\nlatest activity: 1676301689177\n_id: DEV-1303\nname: DEV-1303\njira_id: 12212\npriority: Medium\nresolution: Done\nstatus: CANCELLED\njira_url: https://pometry.atlassian.net/rest/agile/1.0/issue/12212\nsummary: Build ReadTheDocs during CI/CD as a Test to ensure it still works\ndescription: {panel:bgColor=#eae6ff}\nRemove me and Insert *what* needs to be done and *why* it needs to be done\n{panel}\n\nThis must replicate the read the docs build process. 
"; +// let edge = +// "Pedro Rico Pinazo was assigned to work on issue DEV-1303 at time: 2022-06-29 12:34:15"; +// let question = "tell me about someone that has been working on documentation"; +// +// let ticket_embedding = compute_embeddings(vec![ticket.to_owned()]).await.remove(0); +// let edge_embedding = compute_embeddings(vec![edge.to_owned()]).await.remove(0); +// let question_embedding = compute_embeddings(vec![question.to_owned()]) +// .await +// .remove(0); +// let comb_embedding = average_vectors(&ticket_embedding, &edge_embedding); +// +// let ticket_score = cosine(&question_embedding, &ticket_embedding); +// let edge_score = cosine(&question_embedding, &edge_embedding); +// let comb_score = cosine(&question_embedding, &comb_embedding); +// +// dbg!(ticket_score); +// dbg!(edge_score); +// dbg!(comb_score); +// } +// } diff --git a/resource/graphql-demo.jpg b/resource/graphql-demo.jpg new file mode 100644 index 0000000000..3049a045e3 Binary files /dev/null and b/resource/graphql-demo.jpg differ