@@ -19,16 +19,16 @@ def addCompany(self, companies, company, ticker):
19
19
companies .append (row )
20
20
return
21
21
22
- # Read PDF and return companies names and tickers
22
+ # Read the PDF pages and return the list of people
23
23
def readPeople (self ) -> list :
24
24
people = []
25
25
pageNumber = 0
26
26
# Keep reading pages until the end strings are found
27
27
while True :
28
28
page = self .pages [pageNumber ]
29
29
page_content = page .extract_text ()
30
- parsed = '' . join (page_content )
31
- print ( parsed )
30
+ print (page_content )
31
+ # parsed = ''.join(page_content )
32
32
# cels = parsed.split('\n')
33
33
# celNumber = 0
34
34
# cab = (cels[celNumber])
@@ -46,20 +46,20 @@ def readPeople(self) -> list:
46
46
47
47
# celNumber += 2
48
48
49
- else : # cab = "Company Ticker" - Method to discover other pattern of page
50
- # No break lines in page 10
51
- # cabs
52
- headers = cels [celNumber ].rsplit (maxsplit = 1 )
53
- celNumber += 1
54
- while cels [celNumber ][:13 ] != "June 24, 2022" :
55
- # split ticker at right
56
- subCel = cels [celNumber ].rsplit (maxsplit = 1 )
57
- company = subCel [0 ]
58
- ticker = subCel [1 ]
59
- if company != "Company" : # test if cab
60
- self .addCompany (people , company , ticker )
61
-
62
- celNumber += 1
49
+ # else: # cab = "Company Ticker" - Method to discover other pattern of page
50
+ # # No break lines in page 10
51
+ # # cabs
52
+ # headers = cels[celNumber].rsplit(maxsplit=1)
53
+ # celNumber += 1
54
+ # while cels[celNumber][:13] != "June 24, 2022":
55
+ # # split ticker at right
56
+ # subCel = cels[celNumber].rsplit(maxsplit=1)
57
+ # company = subCel[0]
58
+ # ticker = subCel[1]
59
+ # if company != "Company": # test if cab
60
+ # self.addCompany(people, company, ticker)
61
+
62
+ # celNumber += 1
63
63
64
64
if ended :
65
65
break
0 commit comments