fogo archive: (.*?) by .*?

#!/usr/bin/env python
"""
This allows me to easily enter data into various logs from the command
line. For example:

    b http://wwws.sun.com/software/xml/developers/diffmk/refentry.html w misc Noted ^

results in a log entry of the form

    030121: misc] Noted diffmk.

in which the '^' of the entry has been replaced by a link to the URL,
labelled with the title that getTitle() returns for it.

This script can be easily extended for new "schemes" that parse the
input and output it into a specified format.
"""

import re
import sys
import time

# Matches one line containing a '^'; the greedy first group means the LAST
# caret on that line is the one that gets replaced.
_CARET_LINE = re.compile(r'(.*)\^(.*)')

# Flags used for every scheme grammar and for the insertion markers.
_RE_FLAGS = re.DOTALL | re.IGNORECASE

# (scheme key, grammar) pairs tried in order by _matchScheme().
# NOTE(review): the group names were lost when this file was extracted.
# 'url', 'activity' and 'entry' are the keys the output functions read;
# 'scheme' and 'query' are assumed names -- confirm 'query' against queryW3C.
_SCHEME_GRAMMARS = (
    ('g', r'(?P<url>(\.|http)\S*)? ?(?P<scheme>g) (?P<entry>.*)'),
    ('w', r'(?P<url>(\.|http)\S*)? ?(?P<scheme>w) (?P<activity>\w*) (?P<entry>.*)'),
    ('qw', r'(?P<scheme>qw) (?P<query>.*)'),
)

# NOTE(review): the insertion marker was lost in extraction; what is left of
# the pattern is a group containing two newlines. Restore the real marker.
_GOATEE_INSERTION_MARKER = '(\n\n)'


def times(now=None):
    """
    Return a date token formatted as YYMMDD (e.g. '030121').

    now -- optional time tuple / struct_time; defaults to the current
           local time.
    """
    if now is None:
        now = time.localtime()
    return time.strftime("%y%m%d", now)


def hyperize(entry, title, url):
    """
    Replace the '^' character in the entry with a hypertext link.

    On every line that contains a caret, the last caret is replaced by
    an anchor pointing at url and labelled with title. Lines without a
    caret are returned unchanged.
    """
    link = '<a href="%s">%s</a>' % (url, title)

    # A callable replacement keeps backslashes in url/title literal;
    # a replacement *string* would have them parsed as regex escapes.
    def linkify(match):
        return match.group(1) + link + match.group(2)

    return _CARET_LINE.sub(linkify, entry)


def encode(s):
    '''
    Encode characters for XML.

    Escapes '&', '<' and '>' and turns tabs into spaces. A missing value
    (None, as produced by an optional regexp group that did not match)
    is returned as the empty string.
    '''
    if s is None:
        return ''
    # '&' must go first so the entities produced below are not re-escaped.
    s = s.replace("&", "&amp;")
    s = s.replace("<", "&lt;")
    s = s.replace(">", "&gt;")
    s = s.replace("\t", " ")
    return s


def printUsage(message):
    """ Print message followed by the command's usage line. """
    print(message)
    print("Usage: b [url]? scheme [scheme parameters]? entry")


def _matchScheme(options):
    """ Return (scheme key, params dict) for the first grammar matching
    options, or (None, None) when no grammar matches. """
    for scheme, grammar in _SCHEME_GRAMMARS:
        smatch = re.match(grammar, options, _RE_FLAGS)
        if smatch:
            return scheme, smatch.groupdict()
    return None, None


def _insertEntry(content, formatted_entry, marker):
    """ Insert formatted_entry after the first match of marker in content;
    return (new content, number of insertions made). """
    pattern = re.compile(marker, _RE_FLAGS)

    # Callable replacement: the entry text is inserted verbatim.
    def insert(match):
        return match.group(1) + ' \n ' + formatted_entry

    return pattern.subn(insert, content, count=1)


def getScheme(options={}):
    """
    Matches the option string to grammar and output function.

    options -- the command line as a single string.

    Returns whatever the selected output function returns. If nothing
    matches, prints the usage message and exits.
    """
    # An empty/missing option string cannot match any grammar.
    if options:
        scheme, params = _matchScheme(options)
        if scheme is not None:
            if params:
                # Resolved here, at call time, because the handlers are
                # defined further down the file.
                handlers = {'g': outGoatee, 'w': outW3C, 'qw': queryW3C}
                return handlers[scheme](params)
            printUsage("Sorry, you scheme parameters were not correct.")
    printUsage("Sorry, I don't understand the scheme or URI")
    sys.exit()


def outGoatee(params={}):
    """
    Insert an entry into the Goatee "nifty stuff" page.

    params -- dict with the keys 'entry' and 'url' ('url' may be None).
    """
    print("Outputting to Goatee Nifty")
    entry = params['entry']
    url = encode(params['url'])
    title = ''
    if url:
        title = getTitle(url)
    date_token = times()
    # NOTE(review): the markup of this template was lost in extraction,
    # leaving two placeholders for four values. The link/date/entry layout
    # below is a reconstruction -- confirm against the live page.
    formatted_entry = '\n\n<a href="%s">%s</a> (%s) %s\n\n' % (
        url, title, date_token, entry)
    path = '/home/reagle/data/2web/goatee/nifty-stuff.html'
    with open(path) as fd:
        content = fd.read()
    newcontent, inserted = _insertEntry(
        content, formatted_entry, _GOATEE_INSERTION_MARKER)
    if inserted:
        with open(path, 'w') as fd:
            fd.write(newcontent)
    else:
        # Marker not found: leave the file untouched.
        printUsage("Sorry, output regexp subsitution failed.")


def outW3C(params={}):
    """
    Format an entry for the W3C log.

    params -- dict with the keys 'activity', 'entry' and 'url'
              ('url' may be None).
    """
    print("Outputting to W3C log")
    activity = params['activity']
    entry = params['entry']
    url = encode(params['url'])
    title = ''
    if url:
        title = getTitle(url)
    date_token = times()
    # NOTE(review): any markup around this template was lost in extraction;
    # only the blank lines remain.
    formatted_entry = "\n\n%s: %s] %s\n\n" % (
        date_token, activity, hyperize(entry, title, url))
    print("ENTRY IS %s" % formatted_entry)
    path = '/home/reagle/data/2web/WWW/Team/Reagle/Overview.html'
    with open(path) as fd:
        content = fd.read()
    # NOTE(review): the source available for review is cut off at this
    # point, inside "insertion_pattern = re.compile('(". The statements
    # that insert formatted_entry into content and write the file back are
    # not shown and must be restored from the original file.