1 # GNU MediaGoblin -- federated, autonomous media hosting
2 # Copyright (C) 2011, 2012 MediaGoblin contributors. See AUTHORS.
4 # This program is free software: you can redistribute it and/or modify
5 # it under the terms of the GNU Affero General Public License as published by
6 # the Free Software Foundation, either version 3 of the License, or
7 # (at your option) any later version.
9 # This program is distributed in the hope that it will be useful,
10 # but WITHOUT ANY WARRANTY; without even the implied warranty of
11 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 # GNU Affero General Public License for more details.
14 # You should have received a copy of the GNU Affero General Public License
15 # along with this program. If not, see <http://www.gnu.org/licenses/>.
24 from mediagoblin
import mg_globals
as mgg
25 from mediagoblin
.processing
import create_pub_filepath
26 from mediagoblin
.media_types
.ascii
import asciitoimage
# Module-level logger, named after this module.
_log = logging.getLogger(__name__)

# File extensions (lower-case, without the leading dot) that
# sniff_handler() accepts as ASCII media.
SUPPORTED_EXTENSIONS = ['txt', 'asc', 'nfo']

# Dotted name of this media type; also used in the sniffing log message.
MEDIA_TYPE = 'mediagoblin.media_types.ascii'
def sniff_handler(media_file, **kw):
    """Decide from the upload's file extension whether it is ASCII media.

    :param media_file: not used by the visible code; kept so the
        signature stays unchanged for callers.
    :param kw: keyword arguments; only ``media`` is read. When present
        and not ``None`` it must expose a ``filename`` attribute.
    :returns: ``MEDIA_TYPE`` when the extension of ``media.filename``
        (compared case-insensitively, without the dot) is listed in
        ``SUPPORTED_EXTENSIONS``; ``None`` otherwise.

    NOTE(review): the text this block was restored from ends at the
    extension check -- the statements that followed it were lost.  The
    return values are a reconstruction (truthy on a match, falsy
    otherwise); confirm them against the code that calls the sniffers.
    """
    _log.info('Sniffing {0}'.format(MEDIA_TYPE))

    media = kw.get('media')
    if media is None:
        # Nothing to inspect, so this handler cannot claim the upload.
        return None

    # splitext() keeps the leading dot on the extension; strip it before
    # comparing against the dot-less entries of SUPPORTED_EXTENSIONS.
    ext = os.path.splitext(media.filename)[1]
    clean_ext = ext[1:].lower()

    if clean_ext in SUPPORTED_EXTENSIONS:
        return MEDIA_TYPE

    return None
def process_ascii(proc_state):
    """Code to process a txt file. Will be run by celery.

    A Workbench() represents a local temporary dir. It is automatically
    cleaned up when this function exits.

    Steps, in order:

    1. Copy the queued file into the workbench, read it, and let chardet
       guess its charset (UTF-8 is assumed unless chardet reports a
       confidence of at least 0.9).
    2. Render the text to an image, write it as ``thumbnail.png`` in the
       workbench and copy that file to public storage.
    3. Write the unmodified original bytes to public storage.
    4. Write ``ascii-portable.txt``: the decoded text re-encoded as ASCII
       with every non-ASCII character replaced by an XML character
       reference.
    5. Delete the queued file and its directory, clear
       ``entry.queued_media_file`` and record the three public paths
       under ``entry['media_files']``.

    :param proc_state: processing state; only its ``entry`` and
        ``workbench`` attributes are used here.
    :raises UnicodeDecodeError: if the file cannot be decoded with the
        selected charset (decoding is strict).

    NOTE(review): this block was restored from a lossy extraction in
    which several lines were missing.  Every reconstructed piece is
    marked with a NOTE(review) comment below; check each one against a
    pristine copy of the file.  Within the restored span the entry is
    not saved.
    """
    entry = proc_state.entry
    workbench = proc_state.workbench
    ascii_config = mgg.global_config[
        'media_type:mediagoblin.media_types.ascii']

    # Conversions subdirectory to avoid collisions
    conversions_subdir = os.path.join(workbench.dir, 'conversions')
    os.mkdir(conversions_subdir)

    queued_filepath = entry.queued_media_file
    # NOTE(review): the argument(s) after ``queued_filepath`` were lost;
    # 'source' is a reconstruction -- confirm.
    queued_filename = workbench.localized_file(
        mgg.queue_store, queued_filepath,
        'source')

    # Read the file once and close it straight away.  Every later step
    # works on this buffer, so no handle stays open and no seek(0)
    # rewinds are needed between the steps.
    with open(queued_filename, 'rb') as queued_file:
        raw_data = queued_file.read()

    queued_file_charset = chardet.detect(raw_data)

    # Only select a non-utf-8 charset if chardet is *really* sure.
    # Tested with "Feli\x0109an superjaron" (the rest of the original
    # remark is truncated in the source).
    if queued_file_charset['confidence'] < 0.9:
        interpreted_charset = 'utf-8'
    else:
        interpreted_charset = queued_file_charset['encoding']

    # NOTE(review): the format() arguments were lost; these two match
    # the {0}/{1} placeholders of the message.
    _log.info('Charset detected: {0}\nWill interpret as: {1}'.format(
        queued_file_charset,
        interpreted_charset))

    # --- thumbnail ------------------------------------------------------
    thumb_filepath = create_pub_filepath(entry, 'thumbnail.png')
    tmp_thumb_filename = os.path.join(
        conversions_subdir, thumb_filepath[-1])

    # Only pass a font to the converter when one is configured.
    ascii_converter_args = {}
    if ascii_config['thumbnail_font']:
        ascii_converter_args['font'] = ascii_config['thumbnail_font']

    converter = asciitoimage.AsciiToImage(**ascii_converter_args)

    # NOTE(review): the argument of _create_image() was lost; the raw
    # file contents are a reconstruction (the original rewound the file
    # immediately before this call).
    thumb = converter._create_image(raw_data)

    thumb_size = (mgg.global_config['media:thumb']['max_width'],
                  mgg.global_config['media:thumb']['max_height'])
    # NOTE(review): the call that consumed this size tuple was lost,
    # together with a trailing argument (presumably a resampling
    # filter).  ``thumbnail`` assumes ``thumb`` is a PIL-style image;
    # restore the dropped argument from the pristine file.
    thumb.thumbnail(thumb_size)

    # PNG data is binary: open the target in 'wb', not text mode.
    with open(tmp_thumb_filename, 'wb') as thumb_file:
        thumb.save(thumb_file)

    _log.debug('Copying local file to public storage')
    mgg.public_store.copy_local_to_storage(
        tmp_thumb_filename, thumb_filepath)

    # --- original -------------------------------------------------------
    original_filepath = create_pub_filepath(entry, queued_filepath[-1])

    with mgg.public_store.get_file(original_filepath, 'wb') \
            as original_file:
        original_file.write(raw_data)

    # --- portable ASCII copy --------------------------------------------
    unicode_filepath = create_pub_filepath(entry, 'ascii-portable.txt')

    with mgg.public_store.get_file(unicode_filepath, 'wb') \
            as unicode_file:
        # Decode the original file from its detected charset (or UTF-8),
        # then encode the text to ASCII, replacing any non-ASCII
        # character with an XML character reference (&#NNN;).
        # NOTE(review): the codec name was lost; 'ascii' follows from
        # the comment above and from 'xmlcharrefreplace' being an
        # error-handler name rather than a codec.
        unicode_file.write(
            raw_data.decode(interpreted_charset).encode(
                'ascii',
                'xmlcharrefreplace'))

    # Remove queued media file from storage and database.
    # queued_filepath is in the task_id directory which should
    # be removed too, but fail if the directory is not empty to be on
    # the super-safe side.
    mgg.queue_store.delete_file(queued_filepath)      # rm file
    mgg.queue_store.delete_dir(queued_filepath[:-1])  # rm dir
    entry.queued_media_file = []

    media_files_dict = entry.setdefault('media_files', {})
    media_files_dict['thumb'] = thumb_filepath
    media_files_dict['unicode'] = unicode_filepath
    media_files_dict['original'] = original_filepath