Skip to content

Commit

Permalink
tesseract(3,4): Remove autoupdate
Browse files Browse the repository at this point in the history
  • Loading branch information
issaclin32 committed Jun 19, 2022
1 parent 17e4e95 commit 790c866
Show file tree
Hide file tree
Showing 4 changed files with 40 additions and 74 deletions.
22 changes: 7 additions & 15 deletions bucket/tesseract3-languages.json
Original file line number Diff line number Diff line change
@@ -1,8 +1,13 @@
{
"version": "3.04.00",
"description": "Trained models for the Tesseract Open Source OCR Engine (version 3)",
"homepage": "https://github.com/tesseract-ocr/tessdata_fast",
"license": "Apache-2.0",
"description": "Trained models for the Tesseract Open Source OCR Engine",
"version": "3.04.00",
"notes": [
"This packages has overwritten the 'TESSDATA_PREFIX' environment variable with \"$dir\".",
"After updating \"tesseract3\" please run \"scoop reset tesseract3-languages\" to update the environment variable!"
],
"depends": "versions/tesseract3",
"url": [
"https://github.com/tesseract-ocr/tessdata/archive/3.04.00.zip",
"https://raw.githubusercontent.com/USCDataScience/counterfeit-electronics-tesseract/319a6eeacff181dad5c02f3e7a3aff804eaadeca/Training%20Tesseract/snum.traineddata"
Expand All @@ -12,20 +17,7 @@
"36f772980ff17c66a767f584a0d80bf2302a1afa585c01a226c1863afcea1392"
],
"extract_dir": "tessdata-3.04.00",
"notes": [
"This packages has overwritten the 'TESSDATA_PREFIX' environment variable with \"$dir\".",
"After updating \"tesseract3\" please run \"scoop reset tesseract3-languages\" to update the environment variable!"
],
"depends": "tesseract3",
"env_set": {
"TESSDATA_PREFIX": "$dir"
},
"checkver": {
"url": "https://api.github.com/repos/tesseract-ocr/tessdata/releases",
"regex": "\"(3[\\d.]+)\""
},
"autoupdate": {
"url": "https://github.com/tesseract-ocr/tessdata/archive/$version.zip",
"extract_dir": "tessdata-$version"
}
}
27 changes: 10 additions & 17 deletions bucket/tesseract3.json
Original file line number Diff line number Diff line change
@@ -1,8 +1,15 @@
{
"version": "3.05.02-20180621",
"description": "Tesseract. An open-source OCR Engine (version 3)",
"homepage": "https://github.com/UB-Mannheim/tesseract/wiki",
"license": "Apache-2.0",
"version": "3.05.02-20180621",
"description": "Open Source OCR Engine",
"notes": [
"Recognition data files can be installed via \"scoop install tesseract3-languages\"",
"or downloaded manually from https://github.com/tesseract-ocr/tessdata"
],
"suggest": {
"tesseract-languages": "tesseract3-languages"
},
"url": "https://digi.bib.uni-mannheim.de/tesseract/tesseract-ocr-setup-3.05.02-20180621.exe#/dl.7z",
"hash": "26bd9ab1fadf0334a6fb60a45269d87e8a60824df82b7cc74c6d665c0fc1ec0c",
"bin": [
Expand All @@ -28,19 +35,5 @@
"if (Test-Path $langdir) {",
" env \"TESSDATA_PREFIX\" $global $langdir",
"}"
],
"notes": [
"Recognition data files can be installed via \"scoop install tesseract3-languages\"",
"or downloaded manually from https://github.com/tesseract-ocr/tessdata"
],
"suggest": {
"tesseract-languages": "tesseract3-languages"
},
"checkver": {
"url": "https://digi.bib.uni-mannheim.de/tesseract/?C=M;O=D",
"regex": "tesseract-ocr-setup-(3.[\\d\\w.-]+)\\.exe"
},
"autoupdate": {
"url": "https://digi.bib.uni-mannheim.de/tesseract/tesseract-ocr-setup-$version.exe#/dl.7z"
}
]
}
19 changes: 7 additions & 12 deletions bucket/tesseract4-languages.json
Original file line number Diff line number Diff line change
@@ -1,8 +1,13 @@
{
"version": "4.1.0",
"description": "Fast integer versions of trained models for the Tesseract Open Source OCR Engine (version 4)",
"homepage": "https://github.com/tesseract-ocr/tessdata_fast",
"license": "Apache-2.0",
"description": "Fast integer versions of trained models for the Tesseract Open Source OCR Engine",
"version": "4.1.0",
"notes": [
"This packages has overwritten the 'TESSDATA_PREFIX' environment variable with \"$dir\".",
"After updating \"tesseract4\" please run \"scoop reset tesseract4-languages\" to update the environment variable!"
],
"depends": "versions/tesseract4",
"url": [
"https://github.com/tesseract-ocr/tessdata_fast/archive/4.1.0.zip",
"https://raw.githubusercontent.com/tesseract-ocr/tessdata/d87b3cbc75555bd3282e0cadab5e159e2d468396/equ.traineddata",
Expand All @@ -14,17 +19,7 @@
"36f772980ff17c66a767f584a0d80bf2302a1afa585c01a226c1863afcea1392"
],
"extract_dir": "tessdata_fast-4.1.0",
"notes": [
"This packages has overwritten the 'TESSDATA_PREFIX' environment variable with \"$dir\".",
"After updating \"tesseract4\" please run \"scoop reset tesseract4-languages\" to update the environment variable!"
],
"depends": "tesseract4",
"env_set": {
"TESSDATA_PREFIX": "$dir"
},
"checkver": "github",
"autoupdate": {
"url": "https://github.com/tesseract-ocr/tessdata_fast/archive/$version.zip",
"extract_dir": "tessdata_fast-$version"
}
}
46 changes: 16 additions & 30 deletions bucket/tesseract4.json
Original file line number Diff line number Diff line change
@@ -1,8 +1,15 @@
{
"version": "4.1.0-elag2019",
"description": "Tesseract. An open-source OCR Engine (version 4)",
"homepage": "https://github.com/UB-Mannheim/tesseract/wiki",
"license": "Apache-2.0",
"version": "4.1.0-elag2019",
"description": "Open Source OCR Engine",
"notes": [
"Recognition data files can be installed via \"scoop install tesseract4-languages\"",
"or downloaded manually from https://github.com/tesseract-ocr/tessdata_fast"
],
"suggest": {
"tesseract-languages": "tesseract4-languages"
},
"architecture": {
"64bit": {
"url": "https://digi.bib.uni-mannheim.de/tesseract/tesseract-ocr-w64-setup-v4.1.0-elag2019.exe#/dl.7z",
Expand All @@ -13,6 +20,12 @@
"hash": "082cd4b852f512cff544721df109721188667f84c383782d6828e6cba844db4b"
}
},
"post_install": [
"$langdir = versiondir tesseract4-languages current $global",
"if (Test-Path $langdir) {",
" env \"TESSDATA_PREFIX\" $global $langdir",
"}"
],
"bin": [
"ambiguous_words.exe",
"classifier_tester.exe",
Expand All @@ -34,32 +47,5 @@
"env_set": {
"TESSDATA_PREFIX": "$persist_dir\\tessdata"
},
"persist": "tessdata",
"post_install": [
"$langdir = versiondir tesseract4-languages current $global",
"if (Test-Path $langdir) {",
" env \"TESSDATA_PREFIX\" $global $langdir",
"}"
],
"notes": [
"Recognition data files can be installed via \"scoop install tesseract4-languages\"",
"or downloaded manually from https://github.com/tesseract-ocr/tessdata_fast"
],
"suggest": {
"tesseract-languages": "tesseract4-languages"
},
"checkver": {
"url": "https://digi.bib.uni-mannheim.de/tesseract/?C=M;O=D",
"regex": "tesseract-ocr-w32-setup-v(4.[\\d\\w.-]+)\\.exe"
},
"autoupdate": {
"architecture": {
"64bit": {
"url": "https://digi.bib.uni-mannheim.de/tesseract/tesseract-ocr-w64-setup-v$version.exe#/dl.7z"
},
"32bit": {
"url": "https://digi.bib.uni-mannheim.de/tesseract/tesseract-ocr-w32-setup-v$version.exe#/dl.7z"
}
}
}
"persist": "tessdata"
}

0 comments on commit 790c866

Please sign in to comment.