X-Git-Url: https://wagner.pp.ru/gitweb/?a=blobdiff_plain;ds=sidebyside;f=convertdump.py;h=c99fff9b7d8d33bf311056c5ee7419ba660eb313;hb=761ab13d84c0ea48d701ae7c030092c49bdf0ff4;hp=f098a58f2a2e0b29fd0fbaca86ceb3a5a7e75509;hpb=e359daff1784de16d7bddaa8b8a1c91b85a90312;p=oss%2Fljdump.git diff --git a/convertdump.py b/convertdump.py index f098a58..c99fff9 100755 --- a/convertdump.py +++ b/convertdump.py @@ -30,6 +30,7 @@ import os import codecs import sys import getopt +import re from time import strptime, strftime @@ -85,7 +86,9 @@ def addEntryForId(outDoc, element, username, id, includeSecure): # Create an event node (special case because for some reason there are two # 'event' elements in the pydump output, which is probably LJ's fault) event = inDoc.getElementsByTagName("event")[0] - appendTextNode(outDoc, entry, "event", getNodeText(event, "event")) + eventText = getNodeText(event, "event") + + appendTextNode(outDoc, entry, "event", replaceLJTags(eventText)) security = getNodeText(inDoc, "security") @@ -152,8 +155,8 @@ def addCommentsForId(outDoc, entry, username, id): getNodeText(comment, "subject")) # Create an event element - appendTextNode(outDoc, outComment, "event", - getNodeText(comment, "body")) + bodyText = getNodeText(comment, "body") + appendTextNode(outDoc, outComment, "event", replaceLJTags(bodyText)) # Create the author element author = outDoc.createElement("author") @@ -172,6 +175,31 @@ def addCommentsForId(outDoc, entry, username, id): if(parentId != ""): appendTextNode(outDoc, outComment, "parent_itemid", parentId) +def replaceLJTags(entry): + rv = entry + + # replace lj user tags + userRE = re.compile('', re.IGNORECASE) + rv = re.sub(userRE, '\\1', rv) + + # replace lj comm tags + commRE = re.compile('', re.IGNORECASE) + rv = re.sub(commRE, '\\1', rv) + + # replace lj-cut tags + namedCutRE = re.compile('', + re.IGNORECASE|re.DOTALL) + rv = re.sub(namedCutRE, '', rv) + + cutRE = re.compile('', re.IGNORECASE) + rv = re.sub(cutRE, '', rv) + + cutRE = re.compile('', re.IGNORECASE) + rv = re.sub(cutRE, '', rv) + + return rv + + def usage(): print( "Usage: convertdump.py [arguments]" ) print( """