Fix issue 983 PDF UnicodeDecodeError
[mediagoblin.git] / mediagoblin / media_types / pdf / models.py
1 # GNU MediaGoblin -- federated, autonomous media hosting
2 # Copyright (C) 2011, 2012 MediaGoblin contributors. See AUTHORS.
3 #
4 # This program is free software: you can redistribute it and/or modify
5 # it under the terms of the GNU Affero General Public License as published by
6 # the Free Software Foundation, either version 3 of the License, or
7 # (at your option) any later version.
8 #
9 # This program is distributed in the hope that it will be useful,
10 # but WITHOUT ANY WARRANTY; without even the implied warranty of
11 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 # GNU Affero General Public License for more details.
13 #
14 # You should have received a copy of the GNU Affero General Public License
15 # along with this program. If not, see <http://www.gnu.org/licenses/>.
16
17
18 from mediagoblin.db.base import Base
19
20 from sqlalchemy import (
21 Column, Float, Integer, String, DateTime, ForeignKey)
22 from sqlalchemy.orm import relationship, backref
23
24
# Attribute name handed to backref() in PdfData.get_media_entry; it is the
# name under which the related MediaEntry exposes its PdfData row.
BACKREF_NAME = "pdf__media_data"
26
27
class PdfData(Base):
    """PDF-specific metadata for a media entry (table ``pdf__mediadata``).

    A row is keyed by the id of the media entry it belongs to. The
    ``pdf_*`` columns follow the fields that ``pdfinfo`` can report and
    are best thought of as cached values, since they can be deduced again
    at query time or on the client side.
    """

    __tablename__ = "pdf__mediadata"

    # Serves both as this table's primary key and as the foreign key
    # pointing at the owning row in core__media_entries.
    media_entry = Column(
        Integer,
        ForeignKey('core__media_entries.id'),
        primary_key=True,
    )

    # uselist=False makes the attribute added to MediaEntry (named by
    # BACKREF_NAME) a scalar rather than a list; the cascade setting is
    # applied on that backref side of the relationship.
    get_media_entry = relationship(
        "MediaEntry",
        backref=backref(
            BACKREF_NAME,
            uselist=False,
            cascade="all, delete-orphan",
        ),
    )

    # NOTE(review): both `pages` and `pdf_pages` (below) exist; which one
    # is actually populated is not visible from this module -- confirm
    # against the processing code.
    pages = Column(Integer)

    # Fields modelled on pdfinfo's output; other fields may be worth
    # adding as well.
    pdf_author = Column(String)
    pdf_title = Column(String)
    # Keywords are kept as the raw string parsed out of the PDF. Like the
    # other pdf_* values this is only a cache: it can be recomputed at
    # query time or client side.
    pdf_keywords = Column(String)
    pdf_creator = Column(String)
    pdf_producer = Column(String)
    pdf_creation_date = Column(DateTime)
    pdf_modified_date = Column(DateTime)
    pdf_version_major = Column(Integer)
    pdf_version_minor = Column(Integer)
    # Page dimensions; width is recorded in points (pts).
    pdf_page_size_width = Column(Float)
    pdf_page_size_height = Column(Float)
    pdf_pages = Column(Integer)
55
56
# Module-level handles on the model defined above: DATA_MODEL is the single
# media-data class, MODELS is the list of model classes in this module.
# Presumably both are looked up by name from outside this file -- confirm
# against the callers before renaming.
DATA_MODEL = PdfData
MODELS = [DATA_MODEL]