Exemplo n.º 1
0
import json
from datatools import helpers

'''
Combine the matched and single pilot .jl files,
remove the Environment Canada records, then add the new EC records (210).
'''
def depts():
    ''' Generator: yields every entry of the module-level ``records``
        whose 'owner_org' value is not 'ec', in the original order. '''
    for record in records:
        if record['owner_org'] == 'ec':
            # Skip the 'ec' entries.
            continue
        yield record

def jlrecords(file):
    '''
    Load a JSON Lines file and return its records as a list.

    file -- file name; it is appended to the path returned by
            helpers.load_dir(0)

    Returns a list holding one decoded JSON value per non-blank line,
    in file order.
    '''
    # The context manager closes the handle as soon as the list is built;
    # previously the file object was left for the garbage collector.
    with open(helpers.load_dir(0) + file) as source:
        # Whitespace-only lines (e.g. a trailing blank line) are skipped
        # instead of making json.loads raise.
        return [json.loads(line) for line in source if line.strip()]

if __name__ == "__main__":
    # Combine the pilot records but exclude the original ones from
    # Environment Canada ('ec').
    pilot = jlrecords("pilot-bilingual.jl")
    pilot.extend(jlrecords("pilot-matched.jl"))

    records = [r for r in pilot if r['owner_org'] != "ec"]
    #records.extend(jlrecords("ec.jl"))
    # TODO: Need to combine more record types and document before I can tag this
    # TODO: Also, figure if there are more files like :
    #       file:///temp/d13c729f-1ff0-41b5-9546-17b62593c2b8.xml

    # Write one JSON document per line. The `with` block makes sure the
    # output is flushed and closed even if serialisation fails part-way.
    with open(helpers.load_dir(0) + "pilot.jl", "w") as load_file:
        for r in records:
            load_file.write(json.dumps(r) + "\n")
Exemplo n.º 2
0
def jlrecords(file):
    '''
    Load a JSON Lines file and return its records as a list.

    file -- file name; it is appended to the path returned by
            helpers.load_dir(0)

    Returns a list holding one decoded JSON value per non-blank line,
    in file order.
    '''
    # The context manager closes the handle as soon as the list is built;
    # previously the file object was left for the garbage collector.
    with open(helpers.load_dir(0) + file) as source:
        # Whitespace-only lines (e.g. a trailing blank line) are skipped
        # instead of making json.loads raise.
        return [json.loads(line) for line in source if line.strip()]
Exemplo n.º 3
0
        for e in r.getchildren():
            resource[e.tag]=e.text
            #if e.tag=='language':resource[e.tag]=extract_language_from_name(e.text)
        res.append(resource)
    pack['resources']=res
    pack['keywords'] = clean_keywords(pack['keywords'])
    pack['keywords_fra'] =   clean_keywords(pack['keywords_fra'])
    pack['ready_to_publish']=False
    print pack['date_published']
    #print json.dumps(pack,sort_keys=True,indent=4, separators=(',', ': '))
    return json.dumps(pack)

    
def process(dir, outfile, transform='iso19139.xsl'):
    '''
    Walk `dir` recursively and write one line to `outfile` for every file
    named 'metadata.iso19139.xml' found below it.

    dir       -- root directory to search (normalised with os.path.normpath)
    outfile   -- path of the output file; it is created or truncated
    transform -- passed through as the second argument to nap_reduce;
                 defaults to 'iso19139.xsl', the value that was previously
                 hard-coded

    Each output line is the string returned by nap_reduce for one matching
    file, followed by a newline. Returns None.
    '''
    # `with` guarantees the output file is closed even when nap_reduce or
    # the directory walk raises part-way through.
    with open(os.path.normpath(outfile), "w") as jlfile:
        for path, _dirs, filenames in os.walk(os.path.normpath(dir)):
            for filename in filenames:
                if filename == 'metadata.iso19139.xml':
                    source = os.path.join(path, filename)
                    jlfile.write(nap_reduce(source, transform) + "\n")
if __name__ == '__main__':
    # Source tree to scan and the file the results are written to.
    dir = "/Users/peder/dev/OpenData/data_sources/ec/"
    outfile = helpers.load_dir() + "ec.jl"
    file = "iso19139.xml"

    process(dir, outfile)
    #transform='json.xsl'