BobLd
diff --git a/‎README.md‎
Lines changed: 1 addition & 5 deletions b/‎README.md‎
Lines changed: 1 addition & 5 deletions
diff --git a/‎Tabula.Csv/Tabula.Csv.csproj‎
Lines changed: 3 additions & 3 deletions b/‎Tabula.Csv/Tabula.Csv.csproj‎
Lines changed: 3 additions & 3 deletions
diff --git a/‎Tabula.Json/Tabula.Json.csproj‎
Lines changed: 3 additions & 3 deletions b/‎Tabula.Json/Tabula.Json.csproj‎
Lines changed: 3 additions & 3 deletions
diff --git a/‎Tabula.Tests/PdfPigExtensionsTests.cs‎
Lines changed: 462 additions & 0 deletions b/‎Tabula.Tests/PdfPigExtensionsTests.cs‎
Lines changed: 462 additions & 0 deletions
diff --git a/‎Tabula.Tests/Tabula.Tests.csproj‎
Lines changed: 12 additions & 6 deletions b/‎Tabula.Tests/Tabula.Tests.csproj‎
Lines changed: 12 additions & 6 deletions
diff --git a/‎Tabula.Tests/TestObjectExtractor.cs‎
Lines changed: 9 additions & 20 deletions b/‎Tabula.Tests/TestObjectExtractor.cs‎
Lines changed: 9 additions & 20 deletions
diff --git a/‎Tabula.Tests/TestSpreadsheetExtractor.cs‎
Lines changed: 14 additions & 14 deletions b/‎Tabula.Tests/TestSpreadsheetExtractor.cs‎
Lines changed: 14 additions & 14 deletions
diff --git a/‎Tabula.Tests/TestTableDetection.cs‎
Lines changed: 1 addition & 1 deletion b/‎Tabula.Tests/TestTableDetection.cs‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎Tabula.Tests/TestWriters.cs‎
Lines changed: 3 additions & 3 deletions b/‎Tabula.Tests/TestWriters.cs‎
Lines changed: 3 additions & 3 deletions
diff --git a/‎Tabula.Tests/TestsIcdar2013.cs‎
Lines changed: 1 addition & 2 deletions b/‎Tabula.Tests/TestsIcdar2013.cs‎
Lines changed: 1 addition & 2 deletions
@@ -5,7 +5,7 @@
 ![Linux](https://github.com/BobLd/tabula-sharp/workflows/Linux/badge.svg)
 ![Mac OS](https://github.com/BobLd/tabula-sharp/workflows/Mac%20OS/badge.svg)
 
-- Supports .NET 5, .NET Core 3.1, .NET Standard 2.0, .NET Framework 4.5, 4.51, 4.52, 4.6, 4.61, 4.62, 4.7
+- Supports .NET 6, .NET Core 3.1, .NET Standard 2.0, .NET Framework 4.52, 4.6, 4.61, 4.62, 4.7
 - No java bindings
 
 NuGet packages available on the [releases](https://github.com/BobLd/tabula-sharp/releases) page and on www.nuget.org:
@@ -56,7 +56,3 @@ using (PdfDocument document = PdfDocument.Open("doc.pdf", new ParsingOptions() {
 ![example](images/stream-us-018.png)
 ## Lattice mode - SpreadsheetExtractionAlgorithm
 ![example](images/lattice-eu-004.png)
-
-# HELP WANTED
-- The original java implementation uses STR trees in [`RectangleSpatialIndex`](https://github.com/tabulapdf/tabula-java/blob/master/src/main/java/technology/tabula/RectangleSpatialIndex.java). This is not the case here so it might be a bit slower. Any help implementing a similar approach is welcome.
-
@@ -1,10 +1,10 @@
 <Project Sdk="Microsoft.NET.Sdk">
 
   <PropertyGroup>
-    <TargetFrameworks>netcoreapp3.1;netstandard2.0;net452;net46;net461;net462;net47;net5.0;net6.0</TargetFrameworks>
+    <TargetFrameworks>netcoreapp3.1;netstandard2.0;net452;net46;net461;net462;net47;net6.0</TargetFrameworks>
     <Description>Extract tables from PDF files (port of tabula-java using PdfPig). Csv and Tsv writers.</Description>
     <PackageProjectUrl>https://github.com/BobLd/tabula-sharp</PackageProjectUrl>
-    <Version>0.1.3</Version>
+    <Version>0.1.4-alpha001</Version>
     <Authors>BobLd</Authors>
     <PackageTags>pdf, extract, table, tabula, pdfpig, parse, extraction, csv, tsv, excel, export</PackageTags>
     <PackageLicenseExpression>MIT</PackageLicenseExpression>
@@ -22,7 +22,7 @@
   </ItemGroup>
 
   <ItemGroup>
-    <PackageReference Include="CsvHelper" Version="27.2.1" />
+    <PackageReference Include="CsvHelper" Version="30.0.1" />
   </ItemGroup>
 
   <ItemGroup>
 
@@ -1,10 +1,10 @@
 <Project Sdk="Microsoft.NET.Sdk">
 
   <PropertyGroup>
-    <TargetFrameworks>netcoreapp3.1;netstandard2.0;net452;net46;net461;net462;net47;net5.0;net6.0</TargetFrameworks>
+    <TargetFrameworks>netcoreapp3.1;netstandard2.0;net452;net46;net461;net462;net47;net6.0</TargetFrameworks>
     <Description>Extract tables from PDF files (port of tabula-java using PdfPig). Json writer.</Description>
     <PackageProjectUrl>https://github.com/BobLd/tabula-sharp</PackageProjectUrl>
-    <Version>0.1.3</Version>
+    <Version>0.1.4-alpha001</Version>
     <Company>BobLd</Company>
     <Authors>BobLd</Authors>
     <PackageTags>pdf, extract, table, tabula, pdfpig, parse, extraction, json, export</PackageTags>
@@ -22,7 +22,7 @@
   </ItemGroup>
 
   <ItemGroup>
-    <PackageReference Include="Newtonsoft.Json" Version="13.0.1" />
+    <PackageReference Include="Newtonsoft.Json" Version="13.0.3" />
   </ItemGroup>
 
   <ItemGroup>
 
@@ -9,12 +9,18 @@
   </PropertyGroup>
 
   <ItemGroup>
-    <PackageReference Include="CsvHelper" Version="27.2.1" />
-    <PackageReference Include="Microsoft.NET.Test.Sdk" Version="16.5.0" />
-    <PackageReference Include="Newtonsoft.Json" Version="13.0.1" />
-    <PackageReference Include="xunit" Version="2.4.0" />
-    <PackageReference Include="xunit.runner.visualstudio" Version="2.4.0" />
-    <PackageReference Include="coverlet.collector" Version="1.2.0" />
+    <PackageReference Include="CsvHelper" Version="30.0.1" />
+    <PackageReference Include="Microsoft.NET.Test.Sdk" Version="17.6.2" />
+    <PackageReference Include="Newtonsoft.Json" Version="13.0.3" />
+    <PackageReference Include="xunit" Version="2.4.2" />
+    <PackageReference Include="xunit.runner.visualstudio" Version="2.4.5">
+      <PrivateAssets>all</PrivateAssets>
+      <IncludeAssets>runtime; build; native; contentfiles; analyzers; buildtransitive</IncludeAssets>
+    </PackageReference>
+    <PackageReference Include="coverlet.collector" Version="6.0.0">
+      <PrivateAssets>all</PrivateAssets>
+      <IncludeAssets>runtime; build; native; contentfiles; analyzers; buildtransitive</IncludeAssets>
+    </PackageReference>
   </ItemGroup>
 
   <ItemGroup>
 
@@ -23,8 +23,7 @@ public void TestCanReadPDFWithOwnerEncryption()
         {
             using (PdfDocument pdf_document = PdfDocument.Open("Resources/S2MNCEbirdisland.pdf"))
             {
-                ObjectExtractor oe = new ObjectExtractor(pdf_document);
-                PageIterator pi = oe.Extract();
+                PageIterator pi = ObjectExtractor.Extract(pdf_document);
                 int i = 0;
                 while (pi.MoveNext())
                 {
@@ -39,9 +38,8 @@ public void TestGoodPassword()
         {
             using (PdfDocument pdf_document = PdfDocument.Open("Resources/encrypted.pdf", new ParsingOptions() { Password = "userpassword" }))
             {
-                ObjectExtractor oe = new ObjectExtractor(pdf_document);
                 List<PageArea> pages = new List<PageArea>();
-                PageIterator pi = oe.Extract();
+                PageIterator pi = ObjectExtractor.Extract(pdf_document);
                 while (pi.MoveNext())
                 {
                     pages.Add(pi.Current);
@@ -55,8 +53,7 @@ public void TestTextExtractionDoesNotRaise()
         {
             using (PdfDocument pdf_document = PdfDocument.Open("Resources/rotated_page.pdf", new ParsingOptions() { ClipPaths = true }))
             {
-                ObjectExtractor oe = new ObjectExtractor(pdf_document);
-                PageIterator pi = oe.Extract();
+                PageIterator pi = ObjectExtractor.Extract(pdf_document);
 
                 Assert.True(pi.MoveNext());
                 Assert.NotNull(pi.Current);
@@ -69,8 +66,7 @@ public void TestShouldDetectRulings()
         {
             using (PdfDocument pdf_document = PdfDocument.Open("Resources/should_detect_rulings.pdf", new ParsingOptions() { ClipPaths = true }))
             {
-                ObjectExtractor oe = new ObjectExtractor(pdf_document);
-                PageIterator pi = oe.Extract();
+                PageIterator pi = ObjectExtractor.Extract(pdf_document);
 
                 PageArea page = pi.Next();
                 IReadOnlyList<Ruling> rulings = page.GetRulings();
@@ -87,8 +83,7 @@ public void TestDontThrowNPEInShfill()
         {
             using (PdfDocument pdf_document = PdfDocument.Open("Resources/labor.pdf", new ParsingOptions() { ClipPaths = true }))
             {
-                ObjectExtractor oe = new ObjectExtractor(pdf_document);
-                PageIterator pi = oe.Extract();
+                PageIterator pi = ObjectExtractor.Extract(pdf_document);
                 Assert.True(pi.MoveNext());
 
                 PageArea p = pi.Current;
@@ -103,8 +98,7 @@ public void TestExtractOnePage()
             {
                 Assert.Equal(2, pdf_document.NumberOfPages);
 
-                ObjectExtractor oe = new ObjectExtractor(pdf_document);
-                PageArea page = oe.Extract(2);
+                PageArea page = ObjectExtractor.Extract(pdf_document, 2);
 
                 Assert.NotNull(page);
             }
@@ -117,8 +111,7 @@ public void TestExtractWrongPageNumber()// throws IOException
             {
                 Assert.Equal(2, pdf_document.NumberOfPages);
 
-                ObjectExtractor oe = new ObjectExtractor(pdf_document);
-                Assert.Throws<IndexOutOfRangeException>(() => oe.Extract(3));
+                Assert.Throws<IndexOutOfRangeException>(() => ObjectExtractor.Extract(pdf_document, 3));
             }
         }
 
@@ -127,9 +120,7 @@ public void TestTextElementsContainedInPage()
         {
             using (PdfDocument pdf_document = PdfDocument.Open("Resources/cs-en-us-pbms.pdf", new ParsingOptions() { ClipPaths = true }))
             {
-                ObjectExtractor oe = new ObjectExtractor(pdf_document);
-
-                PageArea page = oe.ExtractPage(1);
+                PageArea page = ObjectExtractor.ExtractPage(pdf_document, 1);
 
                 foreach (TextElement te in page.GetText())
                 {
@@ -143,9 +134,7 @@ public void TestDoNotNPEInPointComparator()
         {
             using (PdfDocument pdf_document = PdfDocument.Open("Resources/npe_issue_206.pdf", new ParsingOptions() { ClipPaths = true }))
             {
-                ObjectExtractor oe = new ObjectExtractor(pdf_document);
-
-                PageArea p = oe.ExtractPage(1);
+                PageArea p = ObjectExtractor.ExtractPage(pdf_document, 1);
                 Assert.NotNull(p);
             }
         }
 
@@ -212,7 +212,7 @@ public void TestSpanningCells()
             PageArea page = UtilsForTesting.GetPage("Resources/spanning_cells.pdf", 1);
             string expectedJson = UtilsForTesting.LoadJson("Resources/json/spanning_cells.json");
             SpreadsheetExtractionAlgorithm se = new SpreadsheetExtractionAlgorithm();
-            List<Table> tables = se.Extract(page);
+            IReadOnlyList<Table> tables = se.Extract(page);
             Assert.Equal(2, tables.Count);
 
             var expectedJObject = (JArray)JsonConvert.DeserializeObject(expectedJson);
@@ -268,7 +268,7 @@ public void TestSpanningCellsToCsv()
             PageArea page = UtilsForTesting.GetPage("Resources/spanning_cells.pdf", 1);
             string expectedCsv = UtilsForTesting.LoadCsv("Resources/csv/spanning_cells.csv");
             SpreadsheetExtractionAlgorithm se = new SpreadsheetExtractionAlgorithm();
-            List<Table> tables = se.Extract(page);
+            IReadOnlyList<Table> tables = se.Extract(page);
             Assert.Equal(2, tables.Count);
 
             StringBuilder sb = new StringBuilder();
@@ -281,7 +281,7 @@ public void TestIncompleteGrid()
         {
             PageArea page = UtilsForTesting.GetPage("Resources/china.pdf", 1);
             SpreadsheetExtractionAlgorithm se = new SpreadsheetExtractionAlgorithm();
-            List<Table> tables = se.Extract(page);
+            IReadOnlyList<Table> tables = se.Extract(page);
             Assert.Equal(2, tables.Count);
         }
 
@@ -290,7 +290,7 @@ public void TestNaturalOrderOfRectanglesDoesNotBreakContract()
         {
             PageArea page = UtilsForTesting.GetPage("Resources/us-017.pdf", 2);
             SpreadsheetExtractionAlgorithm se = new SpreadsheetExtractionAlgorithm();
-            List<Table> tables = se.Extract(page);
+            IReadOnlyList<Table> tables = se.Extract(page);
 
             string expected = "Project,Agency,Institution\r\nNanotechnology and its publics,NSF,Pennsylvania State University\r\n\"Public information and deliberation in nanoscience and\rnanotechnology policy (SGER)\",Interagency,\"North Carolina State\rUniversity\"\r\n\"Social and ethical research and education in agrifood\rnanotechnology (NIRT)\",NSF,Michigan State University\r\n\"From laboratory to society: developing an informed\rapproach to nanoscale science and engineering (NIRT)\",NSF,University of South Carolina\r\nDatabase and innovation timeline for nanotechnology,NSF,UCLA\r\nSocial and ethical dimensions of nanotechnology,NSF,University of Virginia\r\n\"Undergraduate exploration of nanoscience,\rapplications and societal implications (NUE)\",NSF,\"Michigan Technological\rUniversity\"\r\n\"Ethics and belief inside the development of\rnanotechnology (CAREER)\",NSF,University of Virginia\r\n\"All centers, NNIN and NCN have a societal\rimplications components\",\"NSF, DOE,\rDOD, and NIH\",\"All nanotechnology centers\rand networks\""; // \r\n
 
@@ -325,7 +325,7 @@ public void TestSpreadsheetWithNoBoundingFrameShouldBeSpreadsheet()
             SpreadsheetExtractionAlgorithm se = new SpreadsheetExtractionAlgorithm();
             bool isTabular = se.IsTabular(page);
             Assert.True(isTabular);
-            List<Table> tables = se.Extract(page);
+            IReadOnlyList<Table> tables = se.Extract(page);
 
             StringBuilder sb = new StringBuilder();
             (new CSVWriter()).Write(sb, tables[0]);
@@ -337,7 +337,7 @@ public void TestExtractSpreadsheetWithinAnArea()
         {
             PageArea page = UtilsForTesting.GetAreaFromPage("Resources/puertos1.pdf", 1, new PdfRectangle(30.32142857142857, 793 - 554.8821428571429, 546.7964285714286, 793 - 273.9035714285714)); // 273.9035714285714f, 30.32142857142857f, 554.8821428571429f, 546.7964285714286f);
             SpreadsheetExtractionAlgorithm se = new SpreadsheetExtractionAlgorithm();
-            List<Table> tables = se.Extract(page);
+            IReadOnlyList<Table> tables = se.Extract(page);
             Table table = tables[0];
             Assert.Equal(15, table.Rows.Count);
 
@@ -417,7 +417,7 @@ public void TestShouldDetectASingleSpreadsheet()
         {
             PageArea page = UtilsForTesting.GetAreaFromPage("Resources/offense.pdf", 1, new PdfRectangle(16.44, 792 - 680.85, 597.84, 792 - 16.44)); // 68.08f, 16.44f, 680.85f, 597.84f);
             SpreadsheetExtractionAlgorithm bea = new SpreadsheetExtractionAlgorithm();
-            List<Table> tables = bea.Extract(page);
+            IReadOnlyList<Table> tables = bea.Extract(page);
             Assert.Single(tables);
         }
 
@@ -426,7 +426,7 @@ public void TestExtractTableWithExternallyDefinedRulings()
         {
             PageArea page = UtilsForTesting.GetPage("Resources/us-007.pdf", 1);
             SpreadsheetExtractionAlgorithm bea = new SpreadsheetExtractionAlgorithm();
-            List<Table> tables = bea.Extract(page, EXTERNALLY_DEFINED_RULINGS.ToList());
+            IReadOnlyList<Table> tables = bea.Extract(page, EXTERNALLY_DEFINED_RULINGS.ToList());
             Assert.Single(tables);
             Table table = tables[0];
             Assert.Equal(18, table.Cells.Count);
@@ -458,7 +458,7 @@ public void TestAnotherExtractTableWithExternallyDefinedRulings()
         {
             PageArea page = UtilsForTesting.GetPage("Resources/us-024.pdf", 1);
             SpreadsheetExtractionAlgorithm bea = new SpreadsheetExtractionAlgorithm();
-            List<Table> tables = bea.Extract(page, EXTERNALLY_DEFINED_RULINGS2.ToList());
+            IReadOnlyList<Table> tables = bea.Extract(page, EXTERNALLY_DEFINED_RULINGS2.ToList());
             Assert.Single(tables);
             Table table = tables[0];
 
@@ -472,7 +472,7 @@ public void TestSpreadsheetsSortedByTopAndRight()
             PageArea page = UtilsForTesting.GetPage("Resources/sydney_disclosure_contract.pdf", 1);
 
             SpreadsheetExtractionAlgorithm sea = new SpreadsheetExtractionAlgorithm();
-            List<Table> tables = sea.Extract(page);
+            IReadOnlyList<Table> tables = sea.Extract(page);
             for (int i = 1; i < tables.Count; i++)
             {
                 Assert.True(tables[i - 1].Top >= tables[i].Top); // Assert.True(tables[i - 1].getTop() <= tables[i].getTop());
@@ -485,7 +485,7 @@ public void TestDontStackOverflowQuicksort()
             PageArea page = UtilsForTesting.GetPage("Resources/failing_sort.pdf", 1);
 
             SpreadsheetExtractionAlgorithm sea = new SpreadsheetExtractionAlgorithm();
-            List<Table> tables = sea.Extract(page);
+            IReadOnlyList<Table> tables = sea.Extract(page);
             for (int i = 1; i < tables.Count; i++)
             {
                 Assert.True(tables[i - 1].Top >= tables[i].Top); //Assert.True(tables[i - 1].getTop() <= tables[i].getTop());
@@ -497,7 +497,7 @@ public void TestRTL()
         {
             PageArea page = UtilsForTesting.GetPage("Resources/arabic.pdf", 1);
             SpreadsheetExtractionAlgorithm sea = new SpreadsheetExtractionAlgorithm();
-            List<Table> tables = sea.Extract(page);
+            IReadOnlyList<Table> tables = sea.Extract(page);
             // Assert.Equal(1, tables.size());
             Table table = tables[0];
 
@@ -528,7 +528,7 @@ public void TestRealLifeRTL()
         {
             PageArea page = UtilsForTesting.GetPage("Resources/mednine.pdf", 1);
             SpreadsheetExtractionAlgorithm sea = new SpreadsheetExtractionAlgorithm();
-            List<Table> tables = sea.Extract(page);
+            IReadOnlyList<Table> tables = sea.Extract(page);
             Assert.Single(tables);
             Table table = tables[0];
             var rows = table.Rows;
@@ -580,7 +580,7 @@ public void TestSpreadsheetExtractionIssue656()
             string expectedCsv = UtilsForTesting.LoadCsv("Resources/csv/Publication_of_award_of_Bids_for_Transport_Sector__August_2016.csv");
 
             SpreadsheetExtractionAlgorithm sea = new SpreadsheetExtractionAlgorithm();
-            List<Table> tables = sea.Extract(page);
+            IReadOnlyList<Table> tables = sea.Extract(page);
             Assert.Single(tables);
             Table table = tables[0];
 
 
@@ -16,7 +16,7 @@ public class TestTableDetection
 
         //private static Level defaultLogLevel;
 
-        private class TestStatus
+        private sealed class TestStatus
         {
             public int numExpectedTables;
             public int numCorrectlyDetectedTables;
 
@@ -20,7 +20,7 @@ private Table GetTable()
             return bea.Extract(page)[0];
         }
 
-        private List<Table> GetTables()
+        private IReadOnlyList<Table> GetTables()
         {
             PageArea page = UtilsForTesting.GetPage("Resources/twotables.pdf", 1);
             SpreadsheetExtractionAlgorithm sea = new SpreadsheetExtractionAlgorithm();
@@ -144,7 +144,7 @@ public void TestCSVSerializeInfinity()
         public void TestJSONSerializeTwoTables()
         {
             string expectedJson = UtilsForTesting.LoadJson("Resources/json/twotables.json");
-            List<Table> tables = this.GetTables();
+            IReadOnlyList<Table> tables = this.GetTables();
 
             StringBuilder sb = new StringBuilder();
             (new JSONWriter()).Write(sb, tables);
@@ -178,7 +178,7 @@ public void TestJSONSerializeTwoTables()
         public void TestCSVSerializeTwoTables()
         {
             string expectedCsv = UtilsForTesting.LoadCsv("Resources/csv/twotables.csv");
-            List<Table> tables = this.GetTables();
+            IReadOnlyList<Table> tables = this.GetTables();
 
             /*
             StringBuilder sb = new StringBuilder();
 
@@ -15,8 +15,7 @@ public void Eu004()
         {
             using (PdfDocument document = PdfDocument.Open("Resources/icdar2013-dataset/competition-dataset-eu/eu-004.pdf", new ParsingOptions() { ClipPaths = true }))
             {
-                ObjectExtractor oe = new ObjectExtractor(document);
-                PageArea page = oe.Extract(3);
+                PageArea page = ObjectExtractor.Extract(document, 3);
 
                 var detector = new SimpleNurminenDetectionAlgorithm();
                 var regions = detector.Detect(page);
Original file line number	Diff line number	Diff line change
`@@ -23,8 +23,7 @@ public void TestCanReadPDFWithOwnerEncryption()`
`23`	`23`	`{`
`24`	`24`	`using (PdfDocument pdf_document = PdfDocument.Open("Resources/S2MNCEbirdisland.pdf"))`
`25`	`25`	`{`
`26`		`- ObjectExtractor oe = new ObjectExtractor(pdf_document);`
`27`		`- PageIterator pi = oe.Extract();`
	`26`	`+ PageIterator pi = ObjectExtractor.Extract(pdf_document);`
`28`	`27`	`int i = 0;`
`29`	`28`	`while (pi.MoveNext())`
`30`	`29`	`{`
`@@ -39,9 +38,8 @@ public void TestGoodPassword()`
`39`	`38`	`{`
`40`	`39`	`using (PdfDocument pdf_document = PdfDocument.Open("Resources/encrypted.pdf", new ParsingOptions() { Password = "userpassword" }))`
`41`	`40`	`{`
`42`		`- ObjectExtractor oe = new ObjectExtractor(pdf_document);`
`43`	`41`	`List<PageArea> pages = new List<PageArea>();`
`44`		`- PageIterator pi = oe.Extract();`
	`42`	`+ PageIterator pi = ObjectExtractor.Extract(pdf_document);`
`45`	`43`	`while (pi.MoveNext())`
`46`	`44`	`{`
`47`	`45`	`pages.Add(pi.Current);`
`@@ -55,8 +53,7 @@ public void TestTextExtractionDoesNotRaise()`
`55`	`53`	`{`
`56`	`54`	`using (PdfDocument pdf_document = PdfDocument.Open("Resources/rotated_page.pdf", new ParsingOptions() { ClipPaths = true }))`
`57`	`55`	`{`
`58`		`- ObjectExtractor oe = new ObjectExtractor(pdf_document);`
`59`		`- PageIterator pi = oe.Extract();`
	`56`	`+ PageIterator pi = ObjectExtractor.Extract(pdf_document);`
`60`	`57`
`61`	`58`	`Assert.True(pi.MoveNext());`
`62`	`59`	`Assert.NotNull(pi.Current);`
`@@ -69,8 +66,7 @@ public void TestShouldDetectRulings()`
`69`	`66`	`{`
`70`	`67`	`using (PdfDocument pdf_document = PdfDocument.Open("Resources/should_detect_rulings.pdf", new ParsingOptions() { ClipPaths = true }))`
`71`	`68`	`{`
`72`		`- ObjectExtractor oe = new ObjectExtractor(pdf_document);`
`73`		`- PageIterator pi = oe.Extract();`
	`69`	`+ PageIterator pi = ObjectExtractor.Extract(pdf_document);`
`74`	`70`
`75`	`71`	`PageArea page = pi.Next();`
`76`	`72`	`IReadOnlyList<Ruling> rulings = page.GetRulings();`
`@@ -87,8 +83,7 @@ public void TestDontThrowNPEInShfill()`
`87`	`83`	`{`
`88`	`84`	`using (PdfDocument pdf_document = PdfDocument.Open("Resources/labor.pdf", new ParsingOptions() { ClipPaths = true }))`
`89`	`85`	`{`
`90`		`- ObjectExtractor oe = new ObjectExtractor(pdf_document);`
`91`		`- PageIterator pi = oe.Extract();`
	`86`	`+ PageIterator pi = ObjectExtractor.Extract(pdf_document);`
`92`	`87`	`Assert.True(pi.MoveNext());`
`93`	`88`
`94`	`89`	`PageArea p = pi.Current;`
`@@ -103,8 +98,7 @@ public void TestExtractOnePage()`
`103`	`98`	`{`
`104`	`99`	`Assert.Equal(2, pdf_document.NumberOfPages);`
`105`	`100`
`106`		`- ObjectExtractor oe = new ObjectExtractor(pdf_document);`
`107`		`- PageArea page = oe.Extract(2);`
	`101`	`+ PageArea page = ObjectExtractor.Extract(pdf_document, 2);`
`108`	`102`
`109`	`103`	`Assert.NotNull(page);`
`110`	`104`	`}`
`@@ -117,8 +111,7 @@ public void TestExtractWrongPageNumber()// throws IOException`
`117`	`111`	`{`
`118`	`112`	`Assert.Equal(2, pdf_document.NumberOfPages);`
`119`	`113`
`120`		`- ObjectExtractor oe = new ObjectExtractor(pdf_document);`
`121`		`- Assert.Throws<IndexOutOfRangeException>(() => oe.Extract(3));`
	`114`	`+ Assert.Throws<IndexOutOfRangeException>(() => ObjectExtractor.Extract(pdf_document, 3));`
`122`	`115`	`}`
`123`	`116`	`}`
`124`	`117`
`@@ -127,9 +120,7 @@ public void TestTextElementsContainedInPage()`
`127`	`120`	`{`
`128`	`121`	`using (PdfDocument pdf_document = PdfDocument.Open("Resources/cs-en-us-pbms.pdf", new ParsingOptions() { ClipPaths = true }))`
`129`	`122`	`{`
`130`		`- ObjectExtractor oe = new ObjectExtractor(pdf_document);`
`131`		`-`
`132`		`- PageArea page = oe.ExtractPage(1);`
	`123`	`+ PageArea page = ObjectExtractor.ExtractPage(pdf_document, 1);`
`133`	`124`
`134`	`125`	`foreach (TextElement te in page.GetText())`
`135`	`126`	`{`
`@@ -143,9 +134,7 @@ public void TestDoNotNPEInPointComparator()`
`143`	`134`	`{`
`144`	`135`	`using (PdfDocument pdf_document = PdfDocument.Open("Resources/npe_issue_206.pdf", new ParsingOptions() { ClipPaths = true }))`
`145`	`136`	`{`
`146`		`- ObjectExtractor oe = new ObjectExtractor(pdf_document);`
`147`		`-`
`148`		`- PageArea p = oe.ExtractPage(1);`
	`137`	`+ PageArea p = ObjectExtractor.ExtractPage(pdf_document, 1);`
`149`	`138`	`Assert.NotNull(p);`
`150`	`139`	`}`
`151`	`140`	`}`
Original file line number	Diff line number	Diff line change
`@@ -16,7 +16,7 @@ public class TestTableDetection`
`16`	`16`
`17`	`17`	`//private static Level defaultLogLevel;`
`18`	`18`
`19`		`- private class TestStatus`
	`19`	`+ private sealed class TestStatus`
`20`	`20`	`{`
`21`	`21`	`public int numExpectedTables;`
`22`	`22`	`public int numCorrectlyDetectedTables;`
Original file line number	Diff line number	Diff line change
`@@ -20,7 +20,7 @@ private Table GetTable()`
`20`	`20`	`return bea.Extract(page)[0];`
`21`	`21`	`}`
`22`	`22`
`23`		`- private List<Table> GetTables()`
	`23`	`+ private IReadOnlyList<Table> GetTables()`
`24`	`24`	`{`
`25`	`25`	`PageArea page = UtilsForTesting.GetPage("Resources/twotables.pdf", 1);`
`26`	`26`	`SpreadsheetExtractionAlgorithm sea = new SpreadsheetExtractionAlgorithm();`
`@@ -144,7 +144,7 @@ public void TestCSVSerializeInfinity()`
`144`	`144`	`public void TestJSONSerializeTwoTables()`
`145`	`145`	`{`
`146`	`146`	`string expectedJson = UtilsForTesting.LoadJson("Resources/json/twotables.json");`
`147`		`- List<Table> tables = this.GetTables();`
	`147`	`+ IReadOnlyList<Table> tables = this.GetTables();`
`148`	`148`
`149`	`149`	`StringBuilder sb = new StringBuilder();`
`150`	`150`	`(new JSONWriter()).Write(sb, tables);`
`@@ -178,7 +178,7 @@ public void TestJSONSerializeTwoTables()`
`178`	`178`	`public void TestCSVSerializeTwoTables()`
`179`	`179`	`{`
`180`	`180`	`string expectedCsv = UtilsForTesting.LoadCsv("Resources/csv/twotables.csv");`
`181`		`- List<Table> tables = this.GetTables();`
	`181`	`+ IReadOnlyList<Table> tables = this.GetTables();`
`182`	`182`
`183`	`183`	`/*`
`184`	`184`	`StringBuilder sb = new StringBuilder();`
Original file line number	Diff line number	Diff line change
`@@ -15,8 +15,7 @@ public void Eu004()`
`15`	`15`	`{`
`16`	`16`	`using (PdfDocument document = PdfDocument.Open("Resources/icdar2013-dataset/competition-dataset-eu/eu-004.pdf", new ParsingOptions() { ClipPaths = true }))`
`17`	`17`	`{`
`18`		`- ObjectExtractor oe = new ObjectExtractor(document);`
`19`		`- PageArea page = oe.Extract(3);`
	`18`	`+ PageArea page = ObjectExtractor.Extract(document, 3);`
`20`	`19`
`21`	`20`	`var detector = new SimpleNurminenDetectionAlgorithm();`
`22`	`21`	`var regions = detector.Detect(page);`