Skip to content

Commit

Permalink
Updated test and readme
Browse files — browse the repository at this point in the history
  • Loading branch information
mykolamelnykml committed Dec 6, 2024
1 parent 0e85058 commit 3906b5a
Show file tree
Hide file tree
Showing 2 changed files with 3 additions and 0 deletions.
2 changes: 2 additions & 0 deletions README.md
Original file line number Diff line number Diff line change
Expand Up @@ -143,6 +143,7 @@ val df = spark.read.format("pdf")
.option("resolution", "200")
.option("pagePerPartition", "2")
.option("reader", "pdfBox")
.option("ocrConfig", "psm=11")
.load("path to the pdf file(s)")

df.select("path", "document").show()
Expand All @@ -164,6 +165,7 @@ df = spark.read.format("pdf") \
.option("resolution", "200") \
.option("pagePerPartition", "2") \
.option("reader", "pdfBox") \
.option("ocrConfig", "psm=11") \
.load("path to the pdf file(s)")

df.select("path", "document").show()
Expand Down
1 change: 1 addition & 0 deletions src/test/scala/PdfDatasourceSuite.scala
Original file line number Diff line number Diff line change
Expand Up @@ -86,6 +86,7 @@ class PdfDatasourceSuite extends AnyFunSuite with BeforeAndAfterEach {
.option("resolution", "200")
.option("pagePerPartition", "2")
.option("reader", reader)
.option("ocrConfig", "psm=11")
.load(pdfPath)
(filePath, fileName, pdfDF)
}
Expand Down

0 comments on commit 3906b5a

Please sign in to comment.