Unit test fixes

pull/153/head
Frh 2020-04-22 15:36:37 -07:00
parent 6962c714f9
commit ec0ca1e009
2 changed files with 27 additions and 3 deletions

View File

@ -2388,7 +2388,15 @@ data_stream_flag_size = [
], ],
] ]
data_stream_strip_text = [ # Hybrid adds more content into the header.
data_hybrid_flag_size = [
['', '', '', '', '(As at end-March)', '', '', '', '', '', ''],
['', '', '', '', '', '', '', '', '', '', '(` Billion)']
]
data_hybrid_flag_size.extend(data_stream_flag_size)
data_hybrid_strip_text = [
["VinsauVerre", ""], ["VinsauVerre", ""],
["LesBlancs", "12.5CL"], ["LesBlancs", "12.5CL"],
["A.O.PCôtesduRhône", ""], ["A.O.PCôtesduRhône", ""],
@ -2413,8 +2421,24 @@ data_stream_strip_text = [
["A.O.PCôtesdeProvence", ""], ["A.O.PCôtesdeProvence", ""],
["ChâteauGrandBoise«SainteVictoire»2017", "9€"], ["ChâteauGrandBoise«SainteVictoire»2017", "9€"],
["ChâteauLéoube2016", "10€"], ["ChâteauLéoube2016", "10€"],
["LesRouges", "12CL"],
["A.O.PCôtesduRhône", ""],
["DomainedeDionysos«LaCigalette»", "8€"],
["ChâteauSaintEstèvedUchaux«GrandeRéserve»2014", "9€"],
["DomainedelaGuicharde«CuvéeMassillan»2016", "9€"],
["DomainedelaFlorane«TerrePourpre»2014", "10€"],
["LOratoireStMartin«RéservedesSeigneurs»2015", "11€"],
["A.O.PSaintJoseph", ""],
["DomaineMonierPerréol«Châtelet»2015", "13€"],
["A.O.PChâteauneufduPape", ""],
["DomainedeBeaurenard2011", "15€"],
["A.O.PCornas", ""],
["DomaineLionnet«TerreBrûlée»2012", "15€"],
] ]
# Stream only detects part of the table
data_stream_strip_text = data_hybrid_strip_text[0:-13]
data_stream_edge_tol = [ data_stream_edge_tol = [
["Key figures", ""], ["Key figures", ""],
["", "2016"], ["", "2016"],

View File

@ -227,7 +227,7 @@ def test_hybrid_split_text():
def test_hybrid_flag_size(): def test_hybrid_flag_size():
df = pd.DataFrame(data_stream_flag_size) df = pd.DataFrame(data_hybrid_flag_size)
filename = os.path.join(testdir, "superscript.pdf") filename = os.path.join(testdir, "superscript.pdf")
tables = camelot.read_pdf(filename, flavor="hybrid", flag_size=True) tables = camelot.read_pdf(filename, flavor="hybrid", flag_size=True)
@ -235,7 +235,7 @@ def test_hybrid_flag_size():
def test_hybrid_strip_text(): def test_hybrid_strip_text():
df = pd.DataFrame(data_stream_strip_text) df = pd.DataFrame(data_hybrid_strip_text)
filename = os.path.join(testdir, "detect_vertical_false.pdf") filename = os.path.join(testdir, "detect_vertical_false.pdf")
tables = camelot.read_pdf(filename, flavor="hybrid", strip_text=" ,\n") tables = camelot.read_pdf(filename, flavor="hybrid", strip_text=" ,\n")