In [1]:
from odt_parse import OdtData
from odt_diff import find_style_by_name
In [2]:
import csv, glob, zipfile
In [3]:
# Course root on the mounted Google Drive volume (trailing slash included).
HOME_FOLDER = '/Volumes/GoogleDrive/La meva unitat/Docencia/Curs1819/PS1002/'
# Folder that is scanned for submissions; the report cell also uses this
# path, with '.txt' appended, as its output file name.
SUBMISSION_FOLDER = '{}PDF2ODT'.format(HOME_FOLDER)
# Every entry found directly under SUBMISSION_FOLDER.
user_folder = glob.glob('{}/*'.format(SUBMISSION_FOLDER))
In [4]:
# Build a plain-text report at SUBMISSION_FOLDER + '.txt' with one section
# per submitted .odt file: the user name, an underline, the document's
# meta['IC'] value and two paragraph styles looked up by name.
counter = 0  # number of .odt files that got a section in the report
with open(SUBMISSION_FOLDER + '.txt', 'w', encoding='utf-8') as f:
    # glob returns matches in arbitrary order; sorting both levels keeps the
    # report identical from one run to the next.
    for ufo in sorted(user_folder):
        for ufi in sorted(glob.glob(ufo + '/*')):
            tokens = ufi.split('/')
            filename = tokens[-1]
            user_data = tokens[-2]
            # The folder name is underscore-separated with the user name
            # first. Only that field is used by the report, so a folder with
            # an unexpected number of fields does not abort the whole run.
            user_name = user_data.split('_')[0]
            # Text after the last dot, or '' when the name contains no dot.
            _, dot, suffix = filename.rpartition('.')
            extension = suffix if dot else ''
            # Case-insensitive so that 'X.ODT' is processed as well.
            if extension.lower() != 'odt':
                continue

            f.write(user_name + '\n' + '-' * len(user_name) + '\n')
            doc = OdtData(ufi)
            if doc.err:
                f.write('Error de lectura de fichero\n')
            else:
                f.write(doc.meta['IC'] + '\n')
                # Styles are read from the submission itself (`doc`). The
                # previously used `ref` is not defined in any visible cell
                # and raised NameError on a fresh kernel.
                # NOTE(review): assumes the per-submission styles were the
                # intended output and that `doc.style` exists — confirm.
                paragraph_styles = doc.style['paragraph']
                for style_name in ('uberschrift1', 'verzeichnis1'):
                    f.write(str(find_style_by_name(paragraph_styles, style_name)) + '\n')
            f.write('\n' + '#' * 40 + '\n\n')
            counter += 1
print('%d ficheros procesados.' % counter)
In [5]:
# Display the list of paths matched directly under SUBMISSION_FOLDER.
user_folder
Out[5]:
In [ ]: