Package translate :: Package convert :: Module oo2po
[hide private]
[frames] | no frames]

Source Code for Module translate.convert.oo2po

  1  #!/usr/bin/env python 
  2  # -*- coding: utf-8 -*- 
  3  # 
  4  # Copyright 2003-2008 Zuza Software Foundation 
  5  #  
  6  # This file is part of translate. 
  7  # 
  8  # translate is free software; you can redistribute it and/or modify 
  9  # it under the terms of the GNU General Public License as published by 
 10  # the Free Software Foundation; either version 2 of the License, or 
 11  # (at your option) any later version. 
 12  #  
 13  # translate is distributed in the hope that it will be useful, 
 14  # but WITHOUT ANY WARRANTY; without even the implied warranty of 
 15  # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the 
 16  # GNU General Public License for more details. 
 17  # 
 18  # You should have received a copy of the GNU General Public License 
 19  # along with translate; if not, write to the Free Software 
 20  # Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
 21  # 
 22   
 23  """convert an OpenOffice.org (SDF) localization file to Gettext PO localization files 
 24   
 25  See: http://translate.sourceforge.net/wiki/toolkit/oo2po for examples and  
 26  usage instructions 
 27  """ 
 28   
 29  import sys 
 30  from translate.storage import po 
 31  from translate.storage import oo 
 32   
 33  # TODO: support using one GSI file as template, another as input (for when English is in one and translation in another) 
 34   
35 -class oo2po:
36 - def __init__(self, sourcelanguage, targetlanguage, blankmsgstr=False, long_keys=False):
37 """construct an oo2po converter for the specified languages""" 38 self.sourcelanguage = sourcelanguage 39 self.targetlanguage = targetlanguage 40 self.blankmsgstr = blankmsgstr 41 self.long_keys = long_keys
42
43 - def maketargetunit(self, part1, part2, translators_comment, key, subkey):
44 """makes a base unit (.po or XLIFF) out of a subkey of two parts""" 45 #TODO: Do better 46 text1 = getattr(part1, subkey) 47 if text1 == "": 48 return None 49 text2 = getattr(part2, subkey) 50 51 unit = po.pounit(text1.decode('utf-8'), encoding="UTF-8") 52 unit.target = text2.decode('utf-8') 53 unit.addlocation(key + "." + subkey) 54 if getattr(translators_comment, subkey).strip() != "": 55 unit.addnote(getattr(translators_comment, subkey), origin="developer") 56 return unit
57
58 - def convertelement(self, theoo):
59 """convert an oo element into a list of base units (.po or XLIFF)""" 60 if self.sourcelanguage in theoo.languages: 61 part1 = theoo.languages[self.sourcelanguage] 62 else: 63 print >> sys.stderr, "/".join(theoo.lines[0].getkey()), "language not found: %s" % (self.sourcelanguage) 64 return [] 65 if self.blankmsgstr: 66 # use a blank part2 67 part2 = oo.ooline() 68 else: 69 if self.targetlanguage in theoo.languages: 70 part2 = theoo.languages[self.targetlanguage] 71 else: 72 # if the language doesn't exist, the translation is missing ... so make it blank 73 part2 = oo.ooline() 74 if "x-comment" in theoo.languages: 75 translators_comment = theoo.languages["x-comment"] 76 else: 77 translators_comment = oo.ooline() 78 key = oo.makekey(part1.getkey(), self.long_keys) 79 unitlist = [] 80 for subkey in ("text", "quickhelptext", "title"): 81 unit = self.maketargetunit(part1, part2, translators_comment, key, subkey) 82 if unit is not None: 83 unitlist.append(unit) 84 return unitlist
85
86 - def convertstore(self, theoofile, duplicatestyle="msgctxt"):
87 """converts an entire oo file to a base class format (.po or XLIFF)""" 88 thetargetfile = po.pofile() 89 # create a header for the file 90 bug_url = 'http://qa.openoffice.org/issues/enter_bug.cgi' + ('''?subcomponent=ui&comment=&short_desc=Localization issue in file: %(filename)s&component=l10n&form_name=enter_issue''' % {"filename": theoofile.filename}).replace(" ", "%20").replace(":", "%3A") 91 targetheader = thetargetfile.init_headers(charset="UTF-8", encoding="8bit", x_accelerator_marker="~", report_msgid_bugs_to=bug_url) 92 targetheader.addnote("extracted from %s" % theoofile.filename, "developer") 93 thetargetfile.setsourcelanguage(self.sourcelanguage) 94 thetargetfile.settargetlanguage(self.targetlanguage) 95 # go through the oo and convert each element 96 for theoo in theoofile.units: 97 unitlist = self.convertelement(theoo) 98 for unit in unitlist: 99 thetargetfile.addunit(unit) 100 thetargetfile.removeduplicates(duplicatestyle) 101 return thetargetfile
102
103 -def verifyoptions(options):
104 """verifies the commandline options""" 105 if not options.pot and not options.targetlanguage: 106 raise ValueError("You must specify the target language unless generating POT files (-P)")
107
108 -def convertoo(inputfile, outputfile, templates, pot=False, sourcelanguage=None, targetlanguage=None, duplicatestyle="msgid_comment", multifilestyle="single"):
109 """reads in stdin using inputstore class, converts using convertorclass, writes to stdout""" 110 inputstore = oo.oofile() 111 if hasattr(inputfile, "filename"): 112 inputfilename = inputfile.filename 113 else: 114 inputfilename = "(input file name not known)" 115 inputstore.filename = inputfilename 116 inputstore.parse(inputfile.read()) 117 if not sourcelanguage: 118 testlangtype = targetlanguage or (inputstore and inputstore.languages[0]) or "" 119 if testlangtype.isdigit(): 120 sourcelanguage = "01" 121 else: 122 sourcelanguage = "en-US" 123 if not sourcelanguage in inputstore.languages: 124 print >> sys.stderr, "Warning: sourcelanguage '%s' not found in inputfile '%s' (contains %s)" % (sourcelanguage, inputfilename, ", ".join(inputstore.languages)) 125 if targetlanguage and targetlanguage not in inputstore.languages: 126 print >> sys.stderr, "Warning: targetlanguage '%s' not found in inputfile '%s' (contains %s)" % (targetlanguage, inputfilename, ", ".join(inputstore.languages)) 127 convertor = oo2po(sourcelanguage, targetlanguage, blankmsgstr=pot, long_keys=multifilestyle!="single") 128 outputstore = convertor.convertstore(inputstore, duplicatestyle) 129 if outputstore.isempty(): 130 return 0 131 outputfile.write(str(outputstore)) 132 return 1
133
134 -def main(argv=None):
135 from translate.convert import convert 136 formats = {"oo":("po", convertoo), "sdf":("po", convertoo)} 137 # always treat the input as an archive unless it is a directory 138 archiveformats = {(None, "input"): oo.oomultifile} 139 parser = convert.ArchiveConvertOptionParser(formats, usepots=True, description=__doc__, archiveformats=archiveformats) 140 parser.add_option("-l", "--language", dest="targetlanguage", default=None, 141 help="set target language to extract from oo file (e.g. af-ZA)", metavar="LANG") 142 parser.add_option("", "--source-language", dest="sourcelanguage", default=None, 143 help="set source language code (default en-US)", metavar="LANG") 144 parser.add_option("", "--nonrecursiveinput", dest="allowrecursiveinput", default=True, action="store_false", help="don't treat the input oo as a recursive store") 145 parser.add_duplicates_option() 146 parser.add_multifile_option() 147 parser.passthrough.append("pot") 148 parser.passthrough.append("sourcelanguage") 149 parser.passthrough.append("targetlanguage") 150 parser.verifyoptions = verifyoptions 151 parser.run(argv)
152 153 if __name__ == '__main__': 154 main() 155