more retries in pull, join to move into folders

This commit is contained in:
Michael Murtaugh 2015-12-03 14:08:25 +01:00
parent 1cec879add
commit 568a8f0790
3 changed files with 43 additions and 7 deletions

View File

@ -54,3 +54,6 @@ etherdump pull <padid/path>
etherdump sync etherdump sync
push / pull file contents to pad push / pull file contents to pad
why
-------
Etherdump is useful as a means of dumping the contents of etherpad to files, as a way of opening up the contents of the service to other services / methods / uses / tools / situations. (Files also of course allow for archival tools / methods)

View File

@ -25,7 +25,21 @@ def main(args):
inputs = args.input inputs = args.input
inputs.sort() inputs.sort()
inputs = [x for x in inputs if not os.path.isdir(x)]
def base (x): def base (x):
return re.sub(r"(\.html)|(\.diff\.html)|(\.meta\.json)|(\.txt)$", "", x) return re.sub(r"(\.html)|(\.diff\.html)|(\.meta\.json)|(\.txt)$", "", x)
from pprint import pprint #from pprint import pprint
pprint(group(inputs, base)) #pprint()
gg = group(inputs, base)
for items in gg:
itembase = base(items[0])
try:
os.mkdir(itembase)
except OSError:
pass
for i in items:
newloc = os.path.join(itembase, i)
print "'{0}' => '{1}'".format(i, newloc)
os.rename(i, newloc)

View File

@ -6,6 +6,8 @@ from datetime import datetime
from urllib import urlencode from urllib import urlencode
from urllib2 import HTTPError from urllib2 import HTTPError
from common import * from common import *
from time import sleep
""" """
pull(meta): pull(meta):
@ -118,10 +120,27 @@ def main (args):
f.write(html.encode("utf-8")) f.write(html.encode("utf-8"))
if args.all or args.dhtml: if args.all or args.dhtml:
data['startRev'] = "0" tries = 0
html = getjson(info['apiurl']+'createDiffHTML?'+urlencode(data)) skip = False
html = html['data']['html'] while not skip:
with open(p+".diff.html", "w") as f: try:
f.write(html.encode("utf-8")) data['startRev'] = "0"
html = getjson(info['apiurl']+'createDiffHTML?'+urlencode(data))
html = html['data']['html']
with open(p+".diff.html", "w") as f:
f.write(html.encode("utf-8"))
break
except HTTPError as e:
print ("HTTPERROR {0}".format(e), file=sys.stderr)
tries += 1
if tries >= 5:
print (" Too many errors, deleting .diff.html and skipping", file=sys.stderr)
try:
os.remove(p+".diff.html")
except OSError:
pass
skip=True
else:
sleep(0.1)
print("\n{0} pad(s) changed".format(count), file=sys.stderr) print("\n{0} pad(s) changed".format(count), file=sys.stderr)