|
@@ -1,4 +1,7 @@
|
|
|
|
|
|
|
|
+from microblog import My_Html_Parser
|
|
|
|
+# from html.parser import HTMLParser
|
|
|
|
+from html import escape
|
|
import sys, traceback, dateutil.parser
|
|
import sys, traceback, dateutil.parser
|
|
try:
|
|
try:
|
|
import feedgenerator
|
|
import feedgenerator
|
|
@@ -17,7 +20,7 @@ def line2words(lines, limit):
|
|
words = line.split()
|
|
words = line.split()
|
|
for word in words:
|
|
for word in words:
|
|
l = len(word)
|
|
l = len(word)
|
|
- if l + char_count > limit:
|
|
|
|
|
|
+ if limit > 0 and (l + char_count > limit):
|
|
break_outer_loop = True
|
|
break_outer_loop = True
|
|
break;
|
|
break;
|
|
output.append(word)
|
|
output.append(word)
|
|
@@ -32,6 +35,33 @@ def line2words(lines, limit):
|
|
output.append("...")
|
|
output.append("...")
|
|
return output
|
|
return output
|
|
|
|
|
|
|
|
+# this is similar tot he markup function in microblog
|
|
|
|
+def enrich_msg(lines, is_atom=True):
|
|
|
|
+ if not is_atom:
|
|
|
|
+ return string
|
|
|
|
+ content = []
|
|
|
|
+ parser = My_Html_Parser([])
|
|
|
|
+ for line in lines:
|
|
|
|
+ parser.feed(line)
|
|
|
|
+ if parser.stack == [] \
|
|
|
|
+ and (parser.completed_by == "" or parser.completed_by not in line):
|
|
|
|
+ words = line.split()
|
|
|
|
+ for i in range(len(words)):
|
|
|
|
+ word = words[i]
|
|
|
|
+ if word.find("src=") == 0 \
|
|
|
|
+ or word.find("href=") == 0:
|
|
|
|
+ continue
|
|
|
|
+ elif word.find("https://") != -1:
|
|
|
|
+ w = escape(word)
|
|
|
|
+ new_word = ("<a href=\"%s\">%s</a>") % (w, w)
|
|
|
|
+ words[i] = new_word
|
|
|
|
+ words.insert(0,"<p>")
|
|
|
|
+ words.append("</p>")
|
|
|
|
+ content.append(" ".join(words))
|
|
|
|
+ else:
|
|
|
|
+ content.append(line)
|
|
|
|
+ return content
|
|
|
|
+
|
|
def write_feed(posts, filename, params):
|
|
def write_feed(posts, filename, params):
|
|
feed = None
|
|
feed = None
|
|
t = params["title"]
|
|
t = params["title"]
|
|
@@ -50,23 +80,35 @@ def write_feed(posts, filename, params):
|
|
description = d,
|
|
description = d,
|
|
)
|
|
)
|
|
base_url = l
|
|
base_url = l
|
|
|
|
+ TITLE_LEN_LIMIT = 60
|
|
|
|
+ DESC_LEN_LIMIT = -1 if params["use_atom"] else 300
|
|
for post in posts:
|
|
for post in posts:
|
|
# len of post.message is number of lines
|
|
# len of post.message is number of lines
|
|
- TITLE_LEN_LIMIT = 60
|
|
|
|
- DESC_LEN_LIMIT = 300
|
|
|
|
msg = post.message
|
|
msg = post.message
|
|
ti = " ".join(
|
|
ti = " ".join(
|
|
line2words(msg,TITLE_LEN_LIMIT))
|
|
line2words(msg,TITLE_LEN_LIMIT))
|
|
- de = " ".join(
|
|
|
|
- line2words(msg,DESC_LEN_LIMIT))
|
|
|
|
|
|
+ if params["use_atom"]:
|
|
|
|
+ de = " ".join(enrich_msg(msg))
|
|
|
|
+ else:
|
|
|
|
+ de = " ".join(
|
|
|
|
+ line2words(msg,DESC_LEN_LIMIT))
|
|
li = base_url + ("#%i" % post.num)
|
|
li = base_url + ("#%i" % post.num)
|
|
p = dateutil.parser.parse(post.timestamp)
|
|
p = dateutil.parser.parse(post.timestamp)
|
|
- feed.add_item(
|
|
|
|
- title = ti,
|
|
|
|
- link = li,
|
|
|
|
- description = de,
|
|
|
|
- pubdate = p
|
|
|
|
- )
|
|
|
|
|
|
+ if params["use_atom"]:
|
|
|
|
+ feed.add_item(
|
|
|
|
+ title = ti,
|
|
|
|
+ link = li,
|
|
|
|
+ description = str(),
|
|
|
|
+ content = de,
|
|
|
|
+ pubdate = p
|
|
|
|
+ )
|
|
|
|
+ else:
|
|
|
|
+ feed.add_item(
|
|
|
|
+ title = ti,
|
|
|
|
+ link = li,
|
|
|
|
+ description = de,
|
|
|
|
+ pubdate = p
|
|
|
|
+ )
|
|
with open(filename, 'w') as f:
|
|
with open(filename, 'w') as f:
|
|
f.write(feed.writeString('utf-8'))
|
|
f.write(feed.writeString('utf-8'))
|
|
del feed
|
|
del feed
|