beimingmaster
diff --git a/‎.github/dependabot.yml‎
Lines changed: 7 additions & 0 deletions b/‎.github/dependabot.yml‎
Lines changed: 7 additions & 0 deletions
diff --git a/‎.travis.yml‎
Lines changed: 4 additions & 6 deletions b/‎.travis.yml‎
Lines changed: 4 additions & 6 deletions
diff --git a/‎README.md‎
Lines changed: 69 additions & 30 deletions b/‎README.md‎
Lines changed: 69 additions & 30 deletions
diff --git a/‎appveyor.yml‎
Lines changed: 21 additions & 0 deletions b/‎appveyor.yml‎
Lines changed: 21 additions & 0 deletions
diff --git a/‎jbang-catalog.json‎
Lines changed: 8 additions & 0 deletions b/‎jbang-catalog.json‎
Lines changed: 8 additions & 0 deletions
@@ -0,0 +1,7 @@
+version: 2
+updates:
+  - package-ecosystem: "maven"  # dependency ecosystem Dependabot should watch
+    directory: "/"  # where to look for the manifest, relative to the repository root
+    schedule:
+      interval: "daily"
+    open-pull-requests-limit: 10  # cap on simultaneously open Dependabot pull requests
@@ -2,10 +2,8 @@ language: java
 install: mvn install -DskipTests=true -Dmaven.javadoc.skip=true -Dgpg.skip=true -B -V
 script: mvn test -Dgpg.skip=true
 jdk:
-  - oraclejdk7
-  - openjdk7
-  - oraclejdk8
+  - openjdk8  # lowest JDK left in the matrix; the JDK 7 and Oracle JDK 8 entries are dropped
+  - openjdk9
+  - openjdk10
+  - openjdk11  # highest JDK in the matrix
 sudo: false
-
-
-
@@ -1,11 +1,9 @@
-tabula-java [![Build Status](https://travis-ci.org/tabulapdf/tabula-java.svg?branch=master)](https://travis-ci.org/tabulapdf/tabula-java) [![Join the chat at https://gitter.im/tabulapdf/tabula-java](https://badges.gitter.im/Join%20Chat.svg)](https://gitter.im/tabulapdf/tabula-java?utm_source=badge&utm_medium=badge&utm_campaign=pr-badge&utm_content=badge)
+tabula-java [![Build Status](https://travis-ci.org/tabulapdf/tabula-java.svg?branch=master)](https://travis-ci.org/tabulapdf/tabula-java) [![Build status](https://ci.appveyor.com/api/projects/status/l5gym1mjhrd2v8yn?svg=true)](https://ci.appveyor.com/project/jazzido/tabula-java)
 ===========
 
-`tabula-java` is a library for extracting tables from PDF files — it is the table extraction engine that used to power [Tabula](http://tabula.technology/) ([repo](http://github.com/tabulapdf/tabula)). You can use `tabula-java` as a command-line tool to programmatically extract tables from PDFs.
+`tabula-java` is a library for extracting tables from PDF files — it is the table extraction engine that powers [Tabula](http://tabula.technology/) ([repo](http://github.com/tabulapdf/tabula)). You can use `tabula-java` as a command-line tool to programmatically extract tables from PDFs.
 
-(This is the new version of the extraction engine; the previous code can be found at [`tabula-extractor`](http://github.com/tabulapdf/tabula-extractor).)
-
-© 2014-2016 Manuel Aristarán. Available under MIT License. See [`LICENSE`](LICENSE).
+© 2014-2020 Manuel Aristarán. Available under MIT License. See [`LICENSE`](LICENSE).
 
 ## Download
 
@@ -16,58 +14,72 @@ Download a version of the tabula-java's jar, with all dependencies included, tha
 `tabula-java` provides a command line application:
 
 ```
-$ java -jar ./target/tabula-0.9.1-jar-with-dependencies.jar --help
-
-usage: tabula [-a <AREA>] [-b <DIRECTORY>] [-c <COLUMNS>] [-d] [-f <FORMAT>] [-g] [-h] [-i]
-       [-n] [-o <OUTFILE>] [-p <PAGES>] [-r] [-s <PASSWORD>] [-u] [-v]
+$ java -jar target/tabula-1.0.5-jar-with-dependencies.jar --help
+usage: tabula [-a <AREA>] [-b <DIRECTORY>] [-c <COLUMNS>] [-f <FORMAT>]
+       [-g] [-h] [-i] [-l] [-n] [-o <OUTFILE>] [-p <PAGES>] [-r] [-s
+       <PASSWORD>] [-t] [-u] [-v]
 
 Tabula helps you extract tables from PDFs
- -a,--area <AREA>           Portion of the page to analyze
-                            (top,left,bottom,right). Example: --area
-                            269.875,12.75,790.5,561. Default is entire
-                            page
- -c,--columns <COLUMNS>     X coordinates of column boundaries. Example
-                            --columns 10.1,20.2,30.3
- -d,--debug                 Print detected table areas instead of
-                            processing.
- -b,--batch <DIRECTORY>     Convert all .pdfs in the provided directory
 
+ -a,--area <AREA>           -a/--area = Portion of the page to analyze.
+                            Example: --area 269.875,12.75,790.5,561.
+                            Accepts top,left,bottom,right i.e. y1,x1,y2,x2
+                            where all values are in points relative to the
+                            top left corner. If all values are between
+                            0-100 (inclusive) and preceded by '%', input
+                            will be taken as % of actual height or width
+                            of the page. Example: --area %0,0,100,50. To
+                            specify multiple areas, -a option should be
+                            repeated. Default is entire page
+ -b,--batch <DIRECTORY>     Convert all .pdfs in the provided directory.
+ -c,--columns <COLUMNS>     X coordinates of column boundaries. Example
+                            --columns 10.1,20.2,30.3. If all values are
+                            between 0-100 (inclusive) and preceded by '%',
+                            input will be taken as % of actual width of
+                            the page. Example: --columns %25,50,80.6
  -f,--format <FORMAT>       Output format: (CSV,TSV,JSON). Default: CSV
  -g,--guess                 Guess the portion of the page to analyze per
                             page.
  -h,--help                  Print this help text.
  -i,--silent                Suppress all stderr output.
- -n,--no-spreadsheet        Force PDF not to be extracted using
-                            spreadsheet-style extraction (if there are
-                            ruling lines separating each cell, as in a PDF
-                            of an Excel spreadsheet)
+ -l,--lattice               Force PDF to be extracted using lattice-mode
+                            extraction (if there are ruling lines
+                            separating each cell, as in a PDF of an Excel
+                            spreadsheet)
+ -n,--no-spreadsheet        [Deprecated in favor of -t/--stream] Force PDF
+                            not to be extracted using spreadsheet-style
+                            extraction (if there are no ruling lines
+                            separating each cell)
  -o,--outfile <OUTFILE>     Write output to <file> instead of STDOUT.
                             Default: -
  -p,--pages <PAGES>         Comma separated list of ranges, or all.
                             Examples: --pages 1-3,5-7, --pages 3 or
                             --pages all. Default is --pages 1
- -r,--spreadsheet           Force PDF to be extracted using
-                            spreadsheet-style extraction (if there are
-                            ruling lines separating each cell, as in a PDF
-                            of an Excel spreadsheet)
+ -r,--spreadsheet           [Deprecated in favor of -l/--lattice] Force
+                            PDF to be extracted using spreadsheet-style
+                            extraction (if there are ruling lines
+                            separating each cell, as in a PDF of an Excel
+                            spreadsheet)
  -s,--password <PASSWORD>   Password to decrypt document. Default is empty
+ -t,--stream                Force PDF to be extracted using stream-mode
+                            extraction (if there are no ruling lines
+                            separating each cell)
  -u,--use-line-returns      Use embedded line returns in cells. (Only in
                             spreadsheet mode.)
  -v,--version               Print version and exit.
-
 ```
 
-It also includes a debugging tool, run `java -cp ./target/tabula-0.9.1-jar-with-dependencies.jar technology.tabula.debug.Debug -h` for the available options.
+It also includes a debugging tool; run `java -cp ./target/tabula-1.0.5-jar-with-dependencies.jar technology.tabula.debug.Debug -h` for the available options.
 
 You can also integrate `tabula-java` with any JVM language. For Java examples, see the [`tests`](src/test/java/technology/tabula/) folder.
 
 JVM start-up time is a lot of the cost of the `tabula` command, so if you're trying to extract many tables from PDFs, you have a few options for speeding it up:
 
  - the -b option, which allows you to convert all pdfs in a given directory
  - the [drip](https://github.com/ninjudd/drip) utility
- - the [Ruby](http://github.com/tabulapdf/tabula-extractor), [R](https://github.com/leeper/tabulizer), and [Node.js](https://github.com/ezodude/tabula-js) bindings
+ - the [Ruby](http://github.com/tabulapdf/tabula-extractor), [Python](https://github.com/chezou/tabula-py), [R](https://github.com/leeper/tabulizer), and [Node.js](https://github.com/ezodude/tabula-js) bindings
  - writing your own program in any JVM language (Java, JRuby, Scala) that imports tabula-java.
- - waiting for us to implement an API/server-style system (it's on the roadmap)
+ - waiting for us to implement an API/server-style system (it's on the [roadmap](https://github.com/tabulapdf/tabula-api))
 
 ## Building from Source
 
@@ -76,3 +88,30 @@ Clone this repo and run:
 ```
 mvn clean compile assembly:single
 ```
+
+## Contributing
+
+Interested in helping out? We'd love to have your help!
+
+You can help by:
+
+- [Reporting a bug](https://github.com/tabulapdf/tabula-java/issues).
+- Adding or editing documentation.
+- Contributing code via a Pull Request.
+- Spreading the word about `tabula-java` to people who might be able to benefit from using it.
+
+### Backers
+
+You can also support our continued work on `tabula-java` with a one-time or monthly donation [on OpenCollective](https://opencollective.com/tabulapdf#support). Organizations that use `tabula-java` can also [sponsor the project](https://opencollective.com/tabulapdf#support) for acknowledgement on [our official site](http://tabula.technology/) and in this README.
+
+Special thanks to the following users and organizations for generously supporting Tabula with donations and grants:
+
+<a href="https://opencollective.com/tabulapdf/backer/0/website" target="_blank"><img src="https://opencollective.com/tabulapdf/backer/0/avatar"></a>
+<a href="https://opencollective.com/tabulapdf/backer/1/website" target="_blank"><img src="https://opencollective.com/tabulapdf/backer/1/avatar"></a>
+<a href="https://opencollective.com/tabulapdf/backer/2/website" target="_blank"><img src="https://opencollective.com/tabulapdf/backer/2/avatar"></a>
+<a href="https://opencollective.com/tabulapdf/backer/3/website" target="_blank"><img src="https://opencollective.com/tabulapdf/backer/3/avatar"></a>
+<a href="https://opencollective.com/tabulapdf/backer/4/website" target="_blank"><img src="https://opencollective.com/tabulapdf/backer/4/avatar"></a>
+<a href="https://opencollective.com/tabulapdf/backer/5/website" target="_blank"><img src="https://opencollective.com/tabulapdf/backer/5/avatar"></a>
+
+<a title="The John S. and James L. Knight Foundation" href="http://www.knightfoundation.org/" target="_blank"><img alt="The John S. and James L. Knight Foundation" src="https://knightfoundation.org/wp-content/uploads/2019/10/KF_Logotype_Icon-and-Stacked-Name.png" width="300"></a>
+<a title="The Shuttleworth Foundation" href="https://shuttleworthfoundation.org/" target="_blank"><img width="200" alt="The Shuttleworth Foundation" src="https://raw.githubusercontent.com/tabulapdf/tabula/gh-pages/shuttleworth.jpg"></a>
@@ -0,0 +1,21 @@
+version: '{build}'
+install:  # provision Maven 3.5.4 under C:\maven, then set PATH and JVM memory options
+  - ps: |  # download is skipped when C:\maven\apache-maven-3.5.4 already exists; fetched over HTTPS from archive.apache.org, which keeps past Maven releases
+      Add-Type -AssemblyName System.IO.Compression.FileSystem
+      if (!(Test-Path -Path "C:\maven\apache-maven-3.5.4" )) {
+        (new-object System.Net.WebClient).DownloadFile(
+          'https://archive.apache.org/dist/maven/maven-3/3.5.4/binaries/apache-maven-3.5.4-bin.zip',
+          'C:\maven-bin.zip'
+        )
+        [System.IO.Compression.ZipFile]::ExtractToDirectory("C:\maven-bin.zip", "C:\maven")
+      }
+  - cmd: SET PATH=C:\maven\apache-maven-3.5.4\bin;%JAVA_HOME%\bin;%PATH%
+  - cmd: SET MAVEN_OPTS=-Xmx2g
+  - cmd: SET JAVA_OPTS=-Xmx2g
+build_script:  # package in batch mode without running tests or building javadoc
+  - mvn clean package -B -DskipTests -Dmaven.javadoc.skip=true
+test_script:  # full install including tests; javadoc and GPG signing are skipped
+  - mvn install -B -Dmaven.javadoc.skip=true -Dgpg.skip
+cache:  # "-> appveyor.yml" invalidates each cached directory when this file changes
+  - C:\maven -> appveyor.yml
+  - C:\Users\appveyor\.m2 -> appveyor.yml
@@ -0,0 +1,8 @@
+{
+  "catalogs": {},
+  "aliases": {
+    "tabula": {
+      "script-ref": "https://github.com/tabulapdf/tabula-java/releases/download/v1.0.4/tabula-1.0.4-jar-with-dependencies.jar"
+    }
+  }
+}