Skip to content
Projects
Groups
Snippets
Help
Loading...
Help
Support
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
erp5
Project overview
Project overview
Details
Activity
Releases
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Issues
0
Issues
0
List
Boards
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Analytics
Analytics
CI / CD
Repository
Value Stream
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
Xavier Thompson
erp5
Commits
917a3065
Commit
917a3065
authored
Feb 24, 2021
by
Jérome Perrin
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
ERP5Form: remove PDFParser
This code is not used and rely on pdftk that we don't have installed in slapos
parent
2539cd44
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
0 additions
and
189 deletions
+0
-189
product/ERP5/Document/BusinessTemplate.py
product/ERP5/Document/BusinessTemplate.py
+0
-1
product/ERP5Form/PDFParser.py
product/ERP5Form/PDFParser.py
+0
-188
No files found.
product/ERP5/Document/BusinessTemplate.py
View file @
917a3065
...
...
@@ -6754,7 +6754,6 @@ Business Template is a set of definitions, such as skins, portal types and categ
'Products.ERP5Form.MultiRelationField'
,
'Products.ERP5Form.OOoChart'
,
'Products.ERP5Form.ParallelListField'
,
'Products.ERP5Form.PDFParser'
,
'Products.ERP5Form.PDFTemplate'
,
'Products.ERP5Form.Permissions'
,
'Products.ERP5Form.PlanningBox'
,
...
...
product/ERP5Form/PDFParser.py
deleted
100644 → 0
View file @
2539cd44
# -*- coding: utf-8 -*-
##############################################################################
#
# Copyright (c) 2008 Nexedi SA and Contributors. All Rights Reserved.
# Mayoro DIAGNE <mayoro@nexedi.com>
#
# WARNING: This program as such is intended to be used by professional
# programmers who take the whole responsability of assessing all potential
# consequences resulting from its eventual inadequacies and bugs
# End users who are looking for a ready-to-use solution with commercial
# garantees and support are strongly adviced to contract a Free Software
# Service Company
#
# This program is Free Software; you can redistribute it and/or
# modify it under the terms of the GNU General Public License
# as published by the Free Software Foundation; either version 2
# of the License, or (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
#
##############################################################################
import
commands
import
re
import
random
from
AccessControl
import
ClassSecurityInfo
from
tempfile
import
NamedTemporaryFile
PDFTK_EXECUTABLE
=
"pdftk"
class
PDFParser
:
"""
PDF parser API provide methods wich allow to manipulate a pdf file allowing
to convert pages as images
"""
security
=
ClassSecurityInfo
()
def
__init__
(
self
,
pdf_file_descriptor
):
"""
initialise self.data with pdf_file_descriptor if string's
The __init__ function can take either a filename, an open file object
or the content of the file
Initialise self.width self.height and self.pages (page count)
"""
self
.
width
=
None
self
.
height
=
None
self
.
pages
=
None
if
pdf_file_descriptor
is
None
:
raise
ValueError
,
"No PDF file provided, please choose a pdf form "
if
type
(
pdf_file_descriptor
)
==
'str'
:
self
.
data
=
pdf_file_descriptor
elif
hasattr
(
pdf_file_descriptor
,
"read"
):
pdf_file_descriptor
.
seek
(
0
)
self
.
data
=
pdf_file_descriptor
.
read
()
pdf_file_descriptor
.
close
()
else
:
source
=
open
(
pdf_file_descriptor
,
"rb"
)
source
.
seek
(
0
)
self
.
data
=
source
.
read
()
source
.
close
()
# opening new file on HDD to save PDF content
temp_pdf_file
=
NamedTemporaryFile
(
mode
=
"w+b"
)
temp_pdf_name
=
temp_pdf_file
.
name
# going to the begining of the input file
# saving content
temp_pdf
=
open
(
temp_pdf_name
,
'w'
)
# saving content
temp_pdf
.
write
(
self
.
data
)
temp_pdf
.
close
()
command_output
=
commands
.
getstatusoutput
(
'pdfinfo %s'
%
\
temp_pdf_name
)
if
command_output
[
0
]
!=
0
:
raise
ValueError
,
'Error: convert command failed with the following'
\
'error message :
\
n
%s'
%
command_output
[
1
]
# get the pdf page size
rawstr
=
r'''
Page\
ssize: #
begining of the instersting line
\
s* #some sp
aces
(\
S+)
\sx\
s(
\S+) #the matching pattern : width and height in pts'''
compile_obj
=
re
.
compile
(
rawstr
,
re
.
MULTILINE
|
re
.
VERBOSE
)
match_obj
=
re
.
search
(
compile_obj
,
command_output
[
1
])
width
,
height
=
match_obj
.
groups
()
# get the pdf page_count
rawstr
=
r'''
Pages: #begining of the instersting line
\
s* #some sp
aces
(\
S+) #
the matching pattern : width and height in pts'''
compile_obj
=
re
.
compile
(
rawstr
,
re
.
MULTILINE
|
re
.
VERBOSE
)
match_obj
=
re
.
search
(
compile_obj
,
command_output
[
1
])
page_count
=
match_obj
.
groups
()[
0
]
attributes
=
{}
self
.
width
=
int
(
round
(
float
(
width
)))
self
.
height
=
int
(
round
(
float
(
height
)))
self
.
pages
=
int
(
page_count
)
def
getData
(
self
):
"""
Return the content of the pdf file
"""
return
self
.
data
security
.
declarePublic
(
'getPageCount'
)
def
getPageCount
(
self
):
"""
Return the page count of the pdf file
"""
#self.getContentInformation()['Pages']
return
self
.
pages
security
.
declarePublic
(
'getPageWidth'
)
def
getPageWidth
(
self
):
"""
Return the width of the pdf file
"""
return
self
.
width
security
.
declarePublic
(
'getPageHeight'
)
def
getPageHeight
(
self
):
"""
Return the page count of the pdf file
"""
return
self
.
height
security
.
declarePublic
(
'getPageImage'
)
def
getPageImage
(
self
,
page
,
format
,
resolution
,
quality
):
"""
Return a temporary Image object containing the pape page of the pdf file
width, height: attributes in pixel (px)
format: jpg, png, etc...
resolution: resolution of produced image for exemple 600
quality: quality of produced image for exemple 200 raisonable quality
more hight is quality more time it takes to be gererated
"""
temp_pdf_document_name
=
"tmp%s.pdf"
%
str
(
random
.
random
()).
split
(
'.'
)[
-
1
]
temp_pdf_document
=
self
.
newContent
(
temp_object
=
True
,
portal_type
=
'PDF Document'
,
id
=
temp_pdf_document_name
)
temp_pdf_document
.
setData
(
self
.
getData
())
display
=
'xlarge'
mime
,
image_data
=
temp_pdf_document
.
convert
(
format
=
format
,
frame
=
page
,
resolution
=
resolution
,
quality
=
quality
,
display
=
display
)
page_image
=
None
if
image_data
is
not
None
:
page_image
=
self
.
newContent
(
temp_object
=
True
,
portal_type
=
'Image'
,
id
=
"page_%s"
%
page
)
page_image
.
setData
(
page_image
)
return
page_image
def
getFlattenedPDF
(
self
):
"""
Return a flattened PDF. It's use to merge an input PDF's interactive
form fields with the PDF's pages
"""
temp_input_file
=
NamedTemporaryFile
(
mode
=
"w+b"
)
temp_input_name
=
temp_input_file
.
name
temp_input
=
open
(
temp_input_name
,
'w'
)
temp_input
.
write
(
self
.
getData
())
temp_input
.
close
()
temp_output_file
=
NamedTemporaryFile
(
mode
=
"w+b"
)
temp_output_name
=
temp_output_file
.
name
command_output
=
commands
.
getstatusoutput
(
'pdftk %s output %s flatten'
\
%
(
temp_input_name
,
temp_output_name
))
if
command_output
[
0
]
!=
0
:
raise
IOError
,
"pdftk failed with the following error %s"
\
%
command_output
[
1
]
temp_output
=
open
(
temp_output_name
,
'rb'
)
temp_output
.
seek
(
0
)
datas
=
temp_output
.
read
()
temp_output
.
close
()
return
datas
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment