diff --git a/.github/CODEOWNERS b/.github/CODEOWNERS
new file mode 100644
index 00000000..1f3ae27a
--- /dev/null
+++ b/.github/CODEOWNERS
@@ -0,0 +1 @@
+* @eroux @10zinten
diff --git a/.github/workflows/publish.yaml b/.github/workflows/publish.yaml
index ac463096..f205f4e6 100644
--- a/.github/workflows/publish.yaml
+++ b/.github/workflows/publish.yaml
@@ -14,66 +14,38 @@ jobs:
python-version: [3.8]
steps:
- - uses: actions/checkout@v1
+ - uses: actions/checkout@v1
- - name: Set up Python ${{ matrix.python-version }}
- uses: actions/setup-python@v1
- with:
- python-version: ${{ matrix.python-version }}
-
- - name: Install dependencies
- run: |
- python -m pip install --upgrade pip
- pip install -r requirements-dev.txt
- pip install -e .
+ - name: Set up Python ${{ matrix.python-version }}
+ uses: actions/setup-python@v1
+ with:
+ python-version: ${{ matrix.python-version }}
- - name: Run Test
- env:
- GITHUB_ORG: ${{ secrets.GH_ORG }}
- GITHUB_TOKEN: ${{ secrets.ADMIN_GITHUB_TOKEN }}
- run: |
- pytest tests/
+ - name: Install dependencies
+ run: |
+ python -m pip install --upgrade pip
+ pip install -r requirements-dev.txt
+ pip install -e .
+
+ - name: Run Test
+ env:
+ GITHUB_ORG: ${{ secrets.GH_ORG }}
+ GITHUB_TOKEN: ${{ secrets.ADMIN_GITHUB_TOKEN }}
+ run: |
+ PYTHONPATH=./docs_src pytest
publish:
needs: test
runs-on: ubuntu-latest
steps:
- - uses: actions/checkout@v2
- with:
- fetch-depth: 0
- token: ${{ secrets.ADMIN_GITHUB_TOKEN }}
-
- - name: Python Semantic Release
- uses: relekang/python-semantic-release@master
- with:
- github_token: ${{ secrets.ADMIN_GITHUB_TOKEN }}
- pypi_token: ${{ secrets.PYPI_PASSWORD }}
-
- docs:
- name: Deploy docs
- runs-on: ubuntu-latest
- steps:
- - name: Checkout main
- uses: actions/checkout@v2
-
- - uses: actions/setup-python@v4
+ - uses: actions/checkout@v2
with:
- python-version: '3.8'
+ fetch-depth: 0
+ token: ${{ secrets.ADMIN_GITHUB_TOKEN }}
- - name: setup workspace
- run: |
- pip install -r requirements-docs.txt
- echo docs.openpecha.org > "${GITHUB_WORKSPACE}/docs/docs/CNAME"
- remote_repo="https://x-access-token:${GITHUB_TOKEN}@${GITHUB_DOMAIN:-"github.com"}/${GITHUB_REPOSITORY}.git"
- git config --global --add safe.directory "$GITHUB_WORKSPACE"
- git config --global user.name "${GITHUB_ACTOR}"
- git config --global user.email "${GITHUB_ACTOR}@users.noreply.${GITHUB_DOMAIN:-"github.com"}"
- git remote rm origin
- git remote add origin "${remote_repo}"
-
- - name: deploy
- run: |
- cd docs
- mkdocs gh-deploy --force
-
+ - name: Python Semantic Release
+ uses: python-semantic-release/python-semantic-release@v7.34.6
+ with:
+ github_token: ${{ secrets.ADMIN_GITHUB_TOKEN }}
+ pypi_token: ${{ secrets.PYPI_PASSWORD }}
diff --git a/.github/workflows/test-coverage.yaml b/.github/workflows/test-coverage.yaml
index 0dae8e4e..15a81fbb 100644
--- a/.github/workflows/test-coverage.yaml
+++ b/.github/workflows/test-coverage.yaml
@@ -37,5 +37,5 @@ jobs:
GITHUB_ORG: ${{ secrets.GH_ORG }}
GITHUB_TOKEN: ${{ secrets.ADMIN_GITHUB_TOKEN }}
run: |
- coverage run -m pytest tests/
+ PYTHONPATH=./docs_src coverage run -m pytest
coverage report
diff --git a/.github/workflows/test.yml b/.github/workflows/test.yml
index a1ca59bd..2338c286 100644
--- a/.github/workflows/test.yml
+++ b/.github/workflows/test.yml
@@ -37,4 +37,4 @@ jobs:
env:
GITHUB_ORG: ${{ secrets.GH_ORG }}
GITHUB_TOKEN: ${{ secrets.ADMIN_GITHUB_TOKEN }}
- run: pytest -vv
+ run: PYTHONPATH=./docs_src pytest -vv
diff --git a/CHANGELOG.md b/CHANGELOG.md
index 0ff616e4..d91997aa 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -2,6 +2,217 @@
+## v0.11.13 (2024-06-05)
+
+### Fix
+
+* **ocr:** Another fix for #274 ([`2a7b401`](https://github.com/OpenPecha/Toolkit/commit/2a7b4016edd7a94cb026bc81e5ebd2fef043d06c))
+
+## v0.11.12 (2024-06-05)
+
+### Fix
+
+* PYPI email verification error for new release ([`545d8ea`](https://github.com/OpenPecha/Toolkit/commit/545d8eacb9aa1fd3b267304b902f40daf07fd738))
+
+## v0.11.11 (2024-06-05)
+
+### Fix
+
+* Trigger release ([`d0573a5`](https://github.com/OpenPecha/Toolkit/commit/d0573a59f22a3faf63aa688d2f99510873ec4043))
+
+## v0.11.10 (2024-02-22)
+
+### Fix
+
+* **OCRFormatter:** Add same_line_ratio_threshold class variable ([#272](https://github.com/OpenPecha/Toolkit/issues/272)) ([`5b47b77`](https://github.com/OpenPecha/Toolkit/commit/5b47b778dc53fbfc3710825638e54a7f3338ccaa))
+
+## v0.11.9 (2023-12-21)
+
+### Fix
+
+* **ocr:** Checking the abnormal post correction feature added ([#264](https://github.com/OpenPecha/Toolkit/issues/264)) ([`e94d65d`](https://github.com/OpenPecha/Toolkit/commit/e94d65dae8dce63eaf415eb62300e46eab9d9796))
+
+### Documentation
+
+* Remove openpecha.org docs ([`3b2e2f1`](https://github.com/OpenPecha/Toolkit/commit/3b2e2f124cc769725e39bcd96ad70eff94c7baac))
+
+## v0.11.8 (2023-10-05)
+
+### Fix
+
+* **ci:** Pin python-semantic-release version ([`a10c298`](https://github.com/OpenPecha/Toolkit/commit/a10c298e7c7a8d09cda0d7a2addae39b033a4d6b))
+* **dependency:** Make commit parser happy ([`6c6eae1`](https://github.com/OpenPecha/Toolkit/commit/6c6eae177ebedcfe19cf5ebbf3332d679b1173c6))
+
+## v0.11.7 (2023-05-29)
+### Fix
+
+* **github-storage:** Set current checkout branch as default ([`e2d6318`](https://github.com/OpenPecha/Toolkit/commit/e2d631876b21601f1afdf9b84a6daa0adbbf0246))
+
+## v0.11.6 (2023-05-17)
+### Fix
+* **elan:** Indent ANNOTATION_VALUE tag ([`946d45d`](https://github.com/OpenPecha/Toolkit/commit/946d45db0e327cfe892489996e1de092a2d1776e))
+* **elan:** Put end_payload in the end ([`adb9848`](https://github.com/OpenPecha/Toolkit/commit/adb98482112f8cc5eb1898eb4e0dd7557286d63c))
+
+## v0.11.5 (2023-05-03)
+### Fix
+* **ocr:** Handle case where pecha_id is None ([`8740f22`](https://github.com/OpenPecha/Toolkit/commit/8740f22447a2f9e101eddb7b798833c83f5dffae))
+
+## v0.11.4 (2023-03-31)
+### Fix
+* **utils:** Download private pecha ([`5ce7113`](https://github.com/OpenPecha/Toolkit/commit/5ce71136969d328be01e92f56ce793d1c5e2f992))
+* **storage:** Generate auth remote url ([`5172865`](https://github.com/OpenPecha/Toolkit/commit/5172865c010cda2759fd302c76c83a3bb247b5b4))
+
+## v0.11.3 (2023-03-29)
+### Fix
+* **core/pecha:** Add base_names_list prop to pecha ([`58e7135`](https://github.com/OpenPecha/Toolkit/commit/58e7135f08afab18faffdea8cce0d19964636abf))
+* **core/pecha:** Pecha publish method accepts branch ([`5c599ca`](https://github.com/OpenPecha/Toolkit/commit/5c599ca3b1ed6cba85b02595f96c0d2d35050cde))
+
+## v0.11.2 (2023-03-21)
+### Fix
+* **core/pecha:** Overwriting bases in metadata ([`f9033eb`](https://github.com/OpenPecha/Toolkit/commit/f9033eb066268047fe2e146d58f685d91ba00038))
+
+## v0.11.1 (2023-03-21)
+### Fix
+* **core/pecha:** Make arg optional ([`67fd90b`](https://github.com/OpenPecha/Toolkit/commit/67fd90bffeab0a44abb0ff488998867c560be08c))
+
+## v0.11.0 (2023-03-17)
+### Feature
+* **elan:** Initial implementation of elan serializer ([`3f8cd41`](https://github.com/OpenPecha/Toolkit/commit/3f8cd41a115e8b9cff667e0e94b2dc02a8b6032f))
+
+### Fix
+* **elan:** Get media_url from TranscriptionTimeSpanLayer ([`d060818`](https://github.com/OpenPecha/Toolkit/commit/d060818109304ef418e42b0d9cc24d91f017b039))
+* **pecha:** Create meta.bases only if it doesn't exist ([`38e8d7e`](https://github.com/OpenPecha/Toolkit/commit/38e8d7e0b02a4cf1479a763d9e1badae6a1795f4))
+
+## v0.10.0 (2023-03-15)
+### Feature
+* **otranscribe:** Initial implementation for oTranscribe formatter ([`13e2c83`](https://github.com/OpenPecha/Toolkit/commit/13e2c8307fd6f9df9011ba2023119515602fa97b))
+* Add TranscriptionTimeSpanLayer ([`096f8ff`](https://github.com/OpenPecha/Toolkit/commit/096f8ff2dcff8ffa21960dff69fc1057b82c78fa))
+* Add a Layer for transcription ([`454a304`](https://github.com/OpenPecha/Toolkit/commit/454a3043ff22065c615643baeb4a5dae48203185))
+* Add annotation for transcription ([`ee669a3`](https://github.com/OpenPecha/Toolkit/commit/ee669a3685c1bd6cb8ae0268d2d8784047ff4c96))
+
+### Fix
+* **otranscribe:** Take directory as an input path ([`9e1e9b5`](https://github.com/OpenPecha/Toolkit/commit/9e1e9b50202373ca958f3c0ee41a194c7400298c))
+* **core/pecha:** Pass LayerEnum obj instead of str ([`bba5d1f`](https://github.com/OpenPecha/Toolkit/commit/bba5d1f9a34d39436862a9b5a57b4ccad17a9762))
+* **otranscribe:** Add test data for oTranscribe formatter ([`acd9a22`](https://github.com/OpenPecha/Toolkit/commit/acd9a22a1dc5c8ef6e6dd03434cc74a6facdf225))
+* Read_layers_file file, get_base_metadata, about ([`14200c8`](https://github.com/OpenPecha/Toolkit/commit/14200c800a437f28bcb08cb8b7a06c077cc81bd3))
+
+## v0.9.25 (2023-03-14)
+### Fix
+* **po-exporter:** Test case has been updated ([`267b8b3`](https://github.com/OpenPecha/Toolkit/commit/267b8b396ffb64ddb5dee67f88cf4f937fde0f48))
+
+## v0.9.24 (2023-02-13)
+### Fix
+* **core:** Check existence before unlink ([`190147e`](https://github.com/OpenPecha/Toolkit/commit/190147e32d97f58b795f9e6e6442164765a32976))
+
+## v0.9.23 (2023-01-23)
+### Fix
+* **google_vision:** Fix rare case in Google Vision json output ([#236](https://github.com/OpenPecha/Toolkit/issues/236)) ([`90b5dd6`](https://github.com/OpenPecha/Toolkit/commit/90b5dd6cbf37aef0f621a569eea8fd66d96b29c9))
+
+## v0.9.22 (2023-01-20)
+### Fix
+* **baregit:** Fix access to non existing layer ([`7ab4d0b`](https://github.com/OpenPecha/Toolkit/commit/7ab4d0b6167e6456d294330ac58cf46e311c75d2))
+
+## v0.9.21 (2023-01-19)
+### Fix
+* **rdf:** Better RDF export for NorbuKetaka texts ([`b4e3013`](https://github.com/OpenPecha/Toolkit/commit/b4e3013e8b8b7e8ba64b72952bbf65b976e280a2))
+
+## v0.9.20 (2023-01-05)
+### Fix
+* **alignment:** All test passed for alignment ([`eb56db6`](https://github.com/OpenPecha/Toolkit/commit/eb56db66cb459fdd5791d08c5d0dae7763114be6))
+* **alignment:** Updated from OpenpechaFs to OpenpechaGitRepo ([`2a6bcb7`](https://github.com/OpenPecha/Toolkit/commit/2a6bcb7fec6480f3aa56542ebf9d7fdd3aebc6aa))
+* **alignment:** Pecha publish updated to upload the assets ([`3e5e032`](https://github.com/OpenPecha/Toolkit/commit/3e5e0323b0236e1d57bb5c0b7c0b218eff0e0584))
+* **alignment:** Fix sentence segmenter ([`a3b0977`](https://github.com/OpenPecha/Toolkit/commit/a3b09773395e466c7c2e546bce5223d6b9752db6))
+* **alignment:** Changed back the update_alignment in tmx ([`e6a0bee`](https://github.com/OpenPecha/Toolkit/commit/e6a0bee387986338d0f7b4500f6f20c4d51bfa13))
+* **alignment:** All test passed ([`e42d9c5`](https://github.com/OpenPecha/Toolkit/commit/e42d9c5bb8be87ee0117eb03a9be3eb61967a911))
+* **alignment:** Updated other tests ([`c32dbf1`](https://github.com/OpenPecha/Toolkit/commit/c32dbf12d76417b1a55b61485eadcd929c8e74fe))
+* **alignment:** Updated test and tmx ([`32c0c88`](https://github.com/OpenPecha/Toolkit/commit/32c0c889a7388890c25009efef68286294b285d3))
+* **alignment:** Tmx alignment reformat ([`2c26bd7`](https://github.com/OpenPecha/Toolkit/commit/2c26bd735b072e1d3db1610fba310b011ab954e4))
+* **alignment:** Updated create_opf of alignment ([`092b9ca`](https://github.com/OpenPecha/Toolkit/commit/092b9caec4a640e7847cf881846c63ba2ac777f4))
+
+## v0.9.19 (2022-12-30)
+### Fix
+* **hotfix:** Option to not use blupdate ([`418aa36`](https://github.com/OpenPecha/Toolkit/commit/418aa3694408080a78aae63af1eadba1378e8b2b))
+
+## v0.9.18 (2022-12-21)
+### Fix
+* **pecha:** Add storage attr to OpenPechaGitRepo ([`186b307`](https://github.com/OpenPecha/Toolkit/commit/186b3074604a175166f35bb9c61226b748bd5d3e))
+
+## v0.9.17 (2022-12-17)
+### Fix
+* **core:** Create OpenPechaGitRepo ([`ebf9c19`](https://github.com/OpenPecha/Toolkit/commit/ebf9c19781a8c083a4be727fb4e1e6a8b7cd2130))
+
+## v0.9.16 (2022-12-12)
+### Fix
+* **test-formatter:** Updated formatter test to use remove duplicates option ([`be796bd`](https://github.com/OpenPecha/Toolkit/commit/be796bddf2948616b46de17c199f3e72c571039b))
+
+## v0.9.15 (2022-12-12)
+### Fix
+* **tests:** Tests pass, do not use option in other tests ([`411ef5b`](https://github.com/OpenPecha/Toolkit/commit/411ef5ba7a46a1315a56be0d818270a38836139f))
+* **ocr:** Option to remove duplicate symbols, #220 ([`a4c7fe0`](https://github.com/OpenPecha/Toolkit/commit/a4c7fe0e4f64f596bb2fabfa1d061a8f0905b67c))
+* **formatter-ocr:** Checks if bbox overlaps more than 60% ([`c081ef3`](https://github.com/OpenPecha/Toolkit/commit/c081ef37d2c3f6b99e1edabf11ee4cb63ebab0d2))
+* **formatter-ocr:** Added remove duplicates and overlap ([`cf11570`](https://github.com/OpenPecha/Toolkit/commit/cf11570653e9dcec0a4b0db39ed62cbf94c6d206))
+
+## v0.9.14 (2022-11-30)
+### Fix
+* Replace AnnType with LayerEnum ([`6a995fc`](https://github.com/OpenPecha/Toolkit/commit/6a995fc2db40c6f9a7714c3c19523bab84955bc6))
+
+## v0.9.13 (2022-11-30)
+### Fix
+* Replace AnnType with LayerEnum ([`e0feb81`](https://github.com/OpenPecha/Toolkit/commit/e0feb817c3c3f90b02aa3253adabb875c6a8f5e9))
+
+## v0.9.12 (2022-11-28)
+### Fix
+* Remove AnnType dependency which is redundant ([`fce9d7d`](https://github.com/OpenPecha/Toolkit/commit/fce9d7ddb9f13ca12072a72fc5a1d3ce1759d8b4))
+
+## v0.9.11 (2022-11-28)
+### Fix
+* Circular import ([`4577a7d`](https://github.com/OpenPecha/Toolkit/commit/4577a7df2bf4b7085ee1cc9406cd59363f49d7b0))
+
+### Documentation
+* Switch to mkdocs-material insiders ([`e1c0a45`](https://github.com/OpenPecha/Toolkit/commit/e1c0a45f294287f65e51e52489e4f21c08cd1486))
+
+## v0.9.10 (2022-11-23)
+### Fix
+* **hocr-formatter:** Removed the update for empty volume bugs ([`9193669`](https://github.com/OpenPecha/Toolkit/commit/91936697e7c5a908cc1a1d376d2bcdc9f256ca04))
+* **hocr-formatter:** Unzip html.zip and read html ([`9791dce`](https://github.com/OpenPecha/Toolkit/commit/9791dce0cabcb2e7953854e318393d4e5062c36f))
+
+## v0.9.9 (2022-11-22)
+### Fix
+* **pecha:** Fix BUDA API ([`ace0d31`](https://github.com/OpenPecha/Toolkit/commit/ace0d31e171ba01e40d45ea68258b2b39ea0d824))
+
+## v0.9.8 (2022-11-07)
+### Fix
+* **pecha:** Handle box rotation ([`182c674`](https://github.com/OpenPecha/Toolkit/commit/182c6749464f2db15e5b2a1ec648f09816db2e53))
+
+## v0.9.7 (2022-10-20)
+### Fix
+* **test_cli:** Remove full path assert in download_pecha ([`5bd01af`](https://github.com/OpenPecha/Toolkit/commit/5bd01af5625eb56054320c329d2e91d68de99604))
+* **cli:** Downgrade click version and add cli test ([`a82f153`](https://github.com/OpenPecha/Toolkit/commit/a82f153c8b3ff7d277f5ceed939ed294ec04e730))
+
+## v0.9.6 (2022-10-20)
+### Fix
+* Disable git rebase when downloading pecha ([`d1c87c6`](https://github.com/OpenPecha/Toolkit/commit/d1c87c64cacfd45c5379cd01929944b52e9c06a2))
+
+## v0.9.5 (2022-10-14)
+### Fix
+* **cli:** Add batch download command ([`ef5a7d8`](https://github.com/OpenPecha/Toolkit/commit/ef5a7d80904f75c5450887aadb877e6bb59295cc))
+* **cli:** Download cmd now only download single pecha ([`5ee31c9`](https://github.com/OpenPecha/Toolkit/commit/5ee31c92a8f8c80caf79a9fc3f81d966656aca67))
+
+## v0.9.4 (2022-10-14)
+### Fix
+* **pecha:** Update is private with geo restriction availability ([`3e9b3c2`](https://github.com/OpenPecha/Toolkit/commit/3e9b3c2142d4a619c1f968095990f837238fe97d))
+* **pecha:** Used storage object to get org name and token. update pecha about ([`66696f2`](https://github.com/OpenPecha/Toolkit/commit/66696f25171cf2b27b5f921e65bf304ea31b9d85))
+* **google-vision:** Return none and o for get_bboxes_for_page if page is empty ([`a6e01e8`](https://github.com/OpenPecha/Toolkit/commit/a6e01e8a2f42569bb706250c744a48fb6e632a03))
+* **google-vision:** Check first char for unicode category ([`3deaaa2`](https://github.com/OpenPecha/Toolkit/commit/3deaaa2903b60c0fc696904bdda7d4571a7a235c))
+* **ocr:** Get bdrc_scan_id from data provider ([`85aa344`](https://github.com/OpenPecha/Toolkit/commit/85aa344c843cdf6b9a1682ca651b4974be4dc971))
+* **catalog-manager:** Updated create_opf to the new format and add data_provider ([`4f492ad`](https://github.com/OpenPecha/Toolkit/commit/4f492ad6245e0e530d6008a5bdc9f1f9831f1965))
+* **test:** Assert annotation object updated ([`3c44292`](https://github.com/OpenPecha/Toolkit/commit/3c44292ab264db78a128ad28e1173204f36debb9))
+* **ocr:** Add pecha id default as none ([`a7cc7ad`](https://github.com/OpenPecha/Toolkit/commit/a7cc7adc6f8f160c1a0165a0492f95ea6da0d909))
+* **pecha:** Update pecha about and add is private to pecha ([`54428a5`](https://github.com/OpenPecha/Toolkit/commit/54428a5c19a83779bdcd6824ac4eb1e1968571bb))
+* **pecha:** Publish existing pecha with changes ([`99af8b0`](https://github.com/OpenPecha/Toolkit/commit/99af8b0d7fbdcc15b58cdd7a9a916d29c0fbaa0d))
+* **pecha:** Publish asset in release with pecha ([`efad1ba`](https://github.com/OpenPecha/Toolkit/commit/efad1ba981a61dc0a3a6785e81503dc4b159fdbe))
+* **storages:** Add check geo_restriction in meta for private repo ([`09b1162`](https://github.com/OpenPecha/Toolkit/commit/09b1162fea2d3b3d13e4267222b07db67526f72a))
+
## v0.9.3 (2022-10-07)
### Fix
* **utils:** Add download release ([`1b93132`](https://github.com/OpenPecha/Toolkit/commit/1b9313255341bf1d4f7e054353fa8da5cd575421))
diff --git a/README.md b/README.md
index ecd1c04d..1985b325 100644
--- a/README.md
+++ b/README.md
@@ -4,6 +4,7 @@
+