Mais um script para dividir os dumps do PostgreSQL em arquivos de objeto

https://gist.github.com/2572360

#! /usr/bin/python
import os, re, sys

# Split pg_dump files to schema/type file hierarchy
# Use with files produced by pg_dump -s

#TODO: Identify dropped objects and delete from tree

# Detect object header lines
re_obj
= re.compile(r'-- Name: ([-ws.]+)(?:([-ws[],]*))?; Type: ([-ws]+); Schema: ([-w]+); Owner: ([-w]*)(?:; Tablespace: )?([-w]*)n', flags=re.IGNORECASE)

if len(sys.argv) < 2:
print 'Usage: pg_schema_split infile [outdir]'
sys
.exit()

infile
= sys.argv[1]
outdir
= os.path.split(sys.argv[0][0])
if len(sys.argv) > 2 : outdir = sys.argv[2]

name
, type, schema, owner, tablespace = ['']*5
sql
= ''

for line in open(infile,'r').readlines():
obj
= re_obj.match(line)
if obj:
ot
= re_obj.search(line).group(2)
if ot not in ('COMMENT', 'SEQUENCE OWNED BY'): # Keep these in parent script
if schema != 'pg_catalog' and name > '':
if schema == '-': schema = 'public'
type
= type.replace(' ','_').lower()

#print 'Name: %s; Type: %s; Schema: %s; Owner: %s; Tablespace: %s' % (name, type, schema, owner, tablespace or '(default)')
print 'Schema: %s; Type: %s; Name: %s' % (schema, type, name)

sqlpath
= os.path.join(outdir, schema, type)
if not os.path.exists(sqlpath):
print '*** mkdir %s' % sqlpath
os
.makedirs(sqlpath)
sqlf
= os.path.join(sqlpath, '%s.sql' % name)

sql
= sql.replace('nn','n') # Cleanup line spacing
open
(sqlf,'w').write(sql.strip())

name
, type, schema, owner, tablespace = re_obj.search(line).groups()
sql
= ''
elif line.strip() != '--': # Skip empty comment lines
sql
+= line