summaryrefslogtreecommitdiff
path: root/tools/eos-html-extractor
diff options
context:
space:
mode:
authorPhilip Chimento <philip@endlessm.com>2015-06-04 11:40:35 -0700
committerPhilip Chimento <philip@endlessm.com>2015-06-04 14:28:16 -0700
commit9b628605064811bbfd2faf72e07899d8c37fe15c (patch)
tree30394717676b47fa8ea65f909fa6d188a44e2f38 /tools/eos-html-extractor
parente75acb0f04ac1d63ea7e50b5753eb023ca8b71e6 (diff)
eos-html-extractor PEP8 and consistency cleanup
[endlessm/eos-sdk#3245]
Diffstat (limited to 'tools/eos-html-extractor')
-rwxr-xr-xtools/eos-html-extractor58
1 files changed, 30 insertions, 28 deletions
diff --git a/tools/eos-html-extractor b/tools/eos-html-extractor
index 84a0062..64800c9 100755
--- a/tools/eos-html-extractor
+++ b/tools/eos-html-extractor
@@ -1,36 +1,37 @@
#!/usr/bin/env python
-'''
-Created on July 19, 2013
-@author: Sebastian
-'''
-# This scraper depends on the BeautifulSoup4 module, make sure
-# it's installed by running the following:
-# apt-get install python-bs4
+# Copyright 2013-2015 Endless Mobile, Inc.
+
import argparse
-import os, re, urllib
+import os
+import re
+import urllib
from bs4 import BeautifulSoup
from HTMLParser import HTMLParser
+
# Parser that adds line numbers to the HTML strings that need translating
class TranslatableHTMLParser(HTMLParser):
def handle_data(self, data):
- if data in translatable_strings:
- # Determine if comment should be included
- most_recent_comment = comments_with_line_numbers[(len(comments_with_line_numbers))-1]
- comment_string = most_recent_comment[0]
- comment_line = most_recent_comment[1]
- code_line = HTMLParser.getpos(self)[0]
- # Comment takes up at least one line by default (hence the +1)
- comment_length = len(re.findall(r"\n", comment_string)) + 1
- optional_comment = ""
- # If the comment immediately preceded this string, include it
- if comment_line + comment_length == code_line:
- optional_comment = " ".join(comment_string.split())
- all_translatable_data.append((data.strip(), code_line, optional_comment))
+ if data not in translatable_strings:
+ return
+
+ # Determine if comment should be included
+ most_recent_comment = comments_with_line_numbers[-1]
+ comment_string, comment_line = most_recent_comment
+ code_line = self.getpos()[0]
+
+ # Comment takes up at least one line by default (hence the +1)
+ comment_length = len(re.findall(r'\n', comment_string)) + 1
+ optional_comment = ''
+
+ # If the comment immediately preceded this string, include it
+ if comment_line + comment_length == code_line:
+ optional_comment = ' '.join(comment_string.split())
+ all_translatable_data.append((data.strip(), code_line, optional_comment))
def handle_comment(self, comment):
- comments_with_line_numbers.append((comment, HTMLParser.getpos(self)[0]))
+ comments_with_line_numbers.append((comment, self.getpos()[0]))
parser = argparse.ArgumentParser(description='Extract translatable strings ' +
'from HTML files. This is xgettext for HTML.')
@@ -50,8 +51,9 @@ page = urllib.urlopen(urllib.pathname2url(html_file)).read()
soup = BeautifulSoup(page)
# Extract all translatable strings from that HTML
-translatable_divs = soup.find_all(attrs={"name" : "translatable"})
-translatable_strings = map(lambda div: div.contents[0].encode('utf-8'), translatable_divs)
+translatable_divs = soup.find_all(attrs={'name': 'translatable'})
+translatable_strings = map(lambda div: div.contents[0].encode('utf-8'),
+ translatable_divs)
# Find the line numbers for those strings
all_translatable_data = []
@@ -61,7 +63,7 @@ parser.feed(page)
# Write out all info about the translatable strings found in this file
for string, line_num, optional_comment in all_translatable_data:
- print ("#line " + str(line_num) + " \"" + final_path + "\"")
- if optional_comment != "":
- print ("// " + optional_comment)
- print ("_(\"" + string + "\");")
+ print('#line {line} "{path}"'.format(line=line_num, path=final_path))
+ if optional_comment != '':
+ print('// ' + optional_comment)
+ print('_("{string}");'.format(string=string))