Skip to content

Commit a0374b7

Browse files
danilojsl authored and DevinTDHa committed
[SPARKNLP-1259] Adding slow mark for URLs readers tests
1 parent 09070ad commit a0374b7

File tree

2 files changed: +3 −6 lines changed

python/test/partition/partition_test.py

Lines changed: 3 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -101,7 +101,7 @@ def runTest(self):
101101
self.assertTrue(html_file_df.select("html").count() > 0)
102102

103103

104-
@pytest.mark.fast
104+
@pytest.mark.slow
105105
class PartitionUrlTesSpec(unittest.TestCase):
106106

107107
def runTest(self):
@@ -122,8 +122,8 @@ def runTest(self):
122122
pdf_df = Partition(content_type = "application/pdf").partition(self.html_directory)
123123
pdf_file_df = Partition().partition(f"{self.html_directory}/text_3_pages.pdf")
124124

125-
self.assertTrue(pdf_df.select("text").count() > 0)
126-
self.assertTrue(pdf_file_df.select("text").count() > 0)
125+
self.assertTrue(pdf_df.select("pdf").count() > 0)
126+
self.assertTrue(pdf_file_df.select("pdf").count() > 0)
127127

128128
@pytest.mark.fast
129129
class PartitionTextInMemoryTesSpec(unittest.TestCase):
@@ -139,6 +139,5 @@ def setUp(self):
139139

140140
def runTest(self):
141141
text_df = Partition(group_broken_paragraphs=True).partition_text(text = self.raw_text )
142-
text_df.show(truncate=False)
143142

144143
self.assertTrue(text_df.select("txt").count() > 0)

python/test/partition/partition_transformer_test.py

Lines changed: 0 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -79,7 +79,6 @@ def runTest(self):
7979
pipelineModel = pipeline.fit(emptyDataSet)
8080

8181
resultDf = pipelineModel.transform(self.testDataSet)
82-
resultDf.show(truncate=False)
8382

8483
self.assertTrue(resultDf.select("partition").count() > 0)
8584

@@ -108,6 +107,5 @@ def runTest(self):
108107
pipelineModel = pipeline.fit(self.emptyDataSet)
109108

110109
resultDf = pipelineModel.transform(self.emptyDataSet)
111-
resultDf.show(truncate=False)
112110

113111
self.assertTrue(resultDf.select("partition").count() >= 0)

0 commit comments

Comments
 (0)