Ejemplo n.º 1
0
    def test(self):
        """
        Run a fixed self-join on dr004_files and return the result.

        The sub-select picks the rows with filetype='red_cat'; each of those is
        matched to the row whose id equals its catalog_parentid.  The query
        text is printed before it is executed.

        returns
        -------
        Whatever oracle_util.Connection().Execute returns for the query.
        """
        query="""
        select 
            cat.filename as catname, 
            cat.filetype as cattype,
            cat.id as catid,
            im.filename as imname,
            im.filetype as imtype,
            im.id as imid
        from
            dr004_files im,
            (select 
                id,filename,filetype,catalog_parentid 
             from 
                dr004_files 
             where 
                filetype='red_cat') cat
        where
            cat.catalog_parentid = im.id
        """

        # single-argument form prints the same text under python 2 and 3
        print('query: %s' % query)

        oc=oracle_util.Connection()
        try:
            res = oc.Execute(query)
        finally:
            # release the connection even when the query fails
            oc.Close()

        return res
Ejemplo n.º 2
0
def get_coadd_cat_info(band=None, dictlist=False):
    """
    get all the DES coadd catalog info for one band

    we demand the band since band is not set in the database for most
    tables and we want to set it explicitly

    parameters
    ----------
    band: string
        Required.  Used to match catalogname against '%_<band>_cat%' and
        written into the 'band' field of every returned row.
    dictlist: bool
        Passed through to Execute.  When True the result is treated as a
        sequence of dicts; otherwise 'band' is assigned on the result as a
        whole.

    returns
    -------
    The result of Execute with 'band' filled in, or None if Execute
    returned None.

    raises
    ------
    ValueError if band is None.
    """

    if band is None:
        # without this the query would silently look for '%_None_cat%'
        raise ValueError("band must be specified")

    q="""
    select
        *
    from
        catalog
    where
        catalogtype = 'coadd_cat' 
        and project = 'DES'
        and catalogname like '%%_%s_cat%%'
    order by
        catalog.run
    """ % band

    stdout.write(q)

    conn = oracle_util.Connection()
    try:
        res = conn.Execute(q, dictlist=dictlist, lower=True)
    finally:
        # release the connection even when the query fails
        conn.Close()

    if res is not None:
        if dictlist:
            for row in res:
                row['band'] = band
        else:
            res['band'] = band
    return res
Ejemplo n.º 3
0
    def get_filetype_info(self,band,filetype,columns=None):
        """
        Get some info for all files of a given filetype.  filetype could be,
        e.g., 'red','red_cat','coadd','coadd_cat', etc

        parameters
        ----------
        band: string
            Only rows with this band are selected.
        filetype: string
            Only rows with this filetype are selected.
        columns: string, tuple or list, optional
            Columns to select.  A tuple or list is joined with commas.  The
            default is id,run,band,filetype,filename,filedate, plus tilename
            when 'coadd' occurs in filetype.

        returns
        -------
        Whatever Execute returns for the query against the
        '<release>_files' table.
        """
        if columns is None:
            columns="id,run,band,filetype,filename,filedate"
            if 'coadd' in filetype:
                columns+=",tilename"
        if isinstance(columns,(tuple,list)):
            columns=','.join(columns)

        table = '%s_files' % self._release
        query="""
            select 
                {columns}
            from 
                {table} 
            where 
                band = '{band}'
                and filetype='{filetype}'""".format(columns=columns,
                                                    table=table,
                                                    band=band,
                                                    filetype=filetype)
        stdout.write("query: \n%s\n" % query)
        oc=oracle_util.Connection()
        try:
            res = oc.Execute(query)
        finally:
            # release the connection even when the query fails
            oc.Close()
        return res
Ejemplo n.º 4
0
    def collate_coadd(self,band):
        """
        Match coadd images in the requested band to the rows that name them
        as catalog parent.

        The '<release>_files' table is joined to itself: 'im' rows have
        filetype 'coadd' and the requested band, and 'cat' rows are those
        whose catalog_parentid equals the image id.

        parameters
        ----------
        band: string
            Band of the coadd images to select.

        returns
        -------
        Whatever Execute returns for the query.
        """
        table = '%s_files' % self._release
        # the band used to be hard-wired to 'i', ignoring the argument
        query="""
        select 
            im.band as band,
            im.id as im_id,
            im.run as im_run,
            im.filename as im_filename,
            im.filetype as im_filetype,
            im.tilename as im_tilename,
            cat.id as cat_id,
            cat.run as cat_run,
            cat.filename as cat_filename, 
            cat.filetype as cat_filetype,
            cat.tilename as cat_tilename,
            cat.catalog_parentid as cat_parentid
        from
            {table} cat,
            {table} im
        where
            im.filetype = 'coadd'
            and im.band = '{band}'
            and cat.catalog_parentid = im.id
        """.format(table=table,band=band)

        stdout.write("query: \n%s\n" % query)
        oc=oracle_util.Connection()
        try:
            res = oc.Execute(query)
        finally:
            # release the connection even when the query fails
            oc.Close()
        return res
Ejemplo n.º 5
0
    def collate_red_old(self,band):
        """
        Match 'red' images in the requested band to the rows that name them
        as catalog parent, using a sub-select for the images.

        The sub-select 'im' picks rows of the '<release>_files' table with
        filetype 'red' and the requested band; 'cat' rows are those whose
        catalog_parentid equals the image id.

        parameters
        ----------
        band: string
            Band of the red images to select.

        returns
        -------
        Whatever Execute returns for the query.
        """
        table = '%s_files' % self._release
        query="""
        select 
            im.band as band,
            im.file_exposure_name as exposurename,
            im.ccd as ccd,
            im.id as im_id,
            im.run as im_run,
            im.filename as im_filename,
            im.filetype as im_filetype,
            cat.id as cat_id,
            cat.run as cat_run,
            cat.filename as cat_filename, 
            cat.filetype as cat_filetype,
            cat.catalog_parentid as cat_parentid
        from
            {table} cat,
            (select 
                id,run,band,ccd,filename,filetype,filedate,
                file_exposure_name
             from 
                {table}
             where 
                band = '{band}'
                and filetype='red') im
        where
            cat.catalog_parentid = im.id
        """.format(table=table,band=band)

        stdout.write("query: \n%s\n" % query)
        oc=oracle_util.Connection()
        try:
            res = oc.Execute(query)
        finally:
            # release the connection even when the query fails
            oc.Close()
        return res
Ejemplo n.º 6
0
def dump_query(q, fname):
    """
    Execute a query and write the result to a file with sfile.write

    parameters
    ----------
    q: string
        The query text; echoed to stdout before it is executed.
    fname: string
        Output file name, passed to sfile.write.
    """
    import sfile
    conn = oracle_util.Connection()
    try:
        stdout.write(q+'\n')
        res = conn.Execute(q)
    finally:
        # release the connection even when the query fails
        conn.Close()
    stdout.write("Writing to file: %s\n" % fname)
    sfile.write(res, fname)
Ejemplo n.º 7
0
def get_tile_run(tilename, verbose=False, multi=False):
    """
    Try to get the appropriate run identifier for the input tilename.
    Currently chooses the one that sorts last (ORDER BY run DESC).

    parameters
    ----------
    tilename: string
        Matched against location.tilename with LIKE.
    verbose: bool
        If True, echo the query to stdout.
    multi: bool
        If True return all distinct runs (in descending order) instead of
        only the first.

    returns
    -------
    The first run, or all runs when multi=True.  None if Execute returned
    None.
    """

    # an earlier version of this query also required run like 'DES%'
    query="""
        SELECT 
            distinct(run) 
        FROM 
            location
        WHERE
            tilename like '%s'
        ORDER BY
            run DESC
    """ % (tilename,)

    if verbose:
        sys.stdout.write('%s\n' % query)

    o=oracle_util.Connection()
    try:
        res = o.Execute(query)
    finally:
        # release the connection even when the query fails
        o.Close()

    if res is None:
        return None

    runs = res['run']
    if multi:
        return runs
    return runs[0]
Ejemplo n.º 8
0
    def collate_red(self,band):
        """
        Match 'red' images in the requested band to the rows that name them
        as catalog parent.

        The '<release>_files' table is joined to itself: 'im' rows have
        filetype 'red' and the requested band, and 'cat' rows are those whose
        catalog_parentid equals the image id.

        Note the kludge on filename to remove dups associated with standard
        star fields: images whose filename is like 'decam%-0-%.fits%' are
        excluded.

        parameters
        ----------
        band: string
            Band of the red images to select.

        returns
        -------
        Whatever Execute returns for the query.
        """

        table = '%s_files' % self._release
        query="""
        select 
            im.band as band,
            im.file_exposure_name as exposurename,
            im.ccd as ccd,
            im.id as im_id,
            im.run as im_run,
            im.filename as im_filename,
            im.filetype as im_filetype,
            cat.id as cat_id,
            cat.run as cat_run,
            cat.filename as cat_filename, 
            cat.filetype as cat_filetype,
            cat.catalog_parentid as cat_parentid
        from
            {table} cat,
            {table} im
        where
            im.filetype = 'red'
            and im.band = '{band}'
            and im.filename not like 'decam%-0-%.fits%'
            and cat.catalog_parentid = im.id
        """.format(table=table,band=band)

        stdout.write("query: \n%s\n" % query)
        oc=oracle_util.Connection()
        try:
            res = oc.Execute(query)
        finally:
            # release the connection even when the query fails
            oc.Close()
        return res
Ejemplo n.º 9
0
def query_byvalue(table, colname, values):
    """
    Select all columns from the rows of a table where colname is one of the
    given values, querying in chunks of 1000 values.

    Assumes these are unique: the rows returned for chunk i are stored
    starting at index i*1000 of an output array of length len(values), so
    each value is expected to match exactly one row.

    parameters
    ----------
    table: string
        Table name.
    colname: string
        Column the values are matched against.
    values: sequence
        Values to look up; each is converted with str() and placed in an
        IN (...) list.

    returns
    -------
    A numpy array with len(values) rows and the dtype of the query result,
    or None when values is empty.

    raises
    ------
    ValueError if the query for a chunk returns None.
    """

    n = len(values)
    if n == 0:
        # nothing to look up; don't bother opening a connection
        return None

    # presumably 1000 because Oracle caps the length of an IN list -- verify
    chunksize = 1000
    # ceiling division; '//' keeps this an integer under python 3 as well
    nget = (n + chunksize - 1) // chunksize

    res = None
    conn = oracle_util.Connection()
    try:
        for i in range(nget):
            start = i*chunksize
            vals = [str(val) for val in values[start:start+chunksize]]
            valstring = ','.join(vals)
            q = """
        select 
            *
        from
            %s
        where %s in (%s)
        """ % (table, colname, valstring)

            tres = conn.Execute(q)
            if tres is None:
                # the dtype and the rows of this chunk are both unknown
                raise ValueError("no rows returned from %s for chunk %d"
                                 % (table, i))

            if res is None:
                res = numpy.zeros(n, dtype=tres.dtype)

            res[start:start + len(tres)] = tres
    finally:
        # release the connection even when a query fails
        conn.Close()

    return res
Ejemplo n.º 10
0
def get_coadd_id(tilename, band, run=None, verbose=False):
    """
    Get the id column from the coadd table for a tilename, run and band.

    parameters
    ----------
    tilename: string
        Matched against coadd.tilename with LIKE.
    band: string
        Matched against coadd.band with LIKE.
    run: string, optional
        Matched against coadd.run with LIKE.  When not given it is looked
        up with get_tile_run(tilename).
    verbose: bool
        If True, echo the query to stdout.

    returns
    -------
    The 'id' field of the query result, or None if the run could not be
    determined or Execute returned None.
    """
    if run is None:
        run = get_tile_run(tilename, verbose=verbose)
        if run is None:
            return None

    query="""
        SELECT
            id
        FROM
            coadd
        WHERE
            tilename like '%s'
            AND run like '%s'
            AND band like '%s'
    """ % (tilename, run, band)

    if verbose:
        sys.stdout.write('%s\n' % query)
    o=oracle_util.Connection()
    try:
        res = o.Execute(query)
    finally:
        # release the connection even when the query fails
        o.Close()

    if res is None:
        return None
    return res['id']
Ejemplo n.º 11
0
def get_latest_dc4locations(limit=None, band=None):
    """
    At this stage we just need the files with nite like '2008%'.

    Then we just get the latest version of the file (not sure
    at this point why there are multiple). That is the step we
    do for removing dups but keeping the latest.

    The catalog table (project 'DES', catalogtype 'red_cat') is joined to
    the location table on catalog.parentid = location.id, the rows are
    reduced with GetLatestRuns, and the location rows for the surviving
    cat_id values are then fetched with query_byvalue.

    parameters
    ----------
    limit: optional
        Currently unused; kept so existing callers keep working.  It was
        only referenced by code that could never be reached.
    band: string, optional
        If given, restrict to location.band equal to this value.

    returns
    -------
    imloc, catloc
        The joined catalog/location rows and the location rows for their
        cat_id values.  (None, None) if the join query returned None.
    """

    nite = '2008%'

    stdout.write('Getting images corresponding to catalogs\n')

    cat_loc_join = """
    SELECT
        catalog.id as cat_id, 
        catalog.parentid,
        location.id as image_id,
        location.project,
        location.fileclass,
        location.filetype,
        location.exposurename,
        location.filename,
        location.tilename,
        location.band,
        location.ccd,
        location.run
    FROM
        catalog, location
    WHERE
        catalog.project = 'DES'
        AND catalog.catalogtype = 'red_cat'
        AND catalog.nite LIKE '%s'
        AND catalog.parentid = location.id
    """ % (nite,)

    if band is not None:
        cat_loc_join += "    AND location.band = '%s'" % band

    stdout.write(cat_loc_join+'\n')

    conn = oracle_util.Connection()
    try:
        imloc = conn.Execute(cat_loc_join)
    finally:
        # release the connection even when the query fails
        conn.Close()

    if imloc is None:
        # nothing matched; there is nothing to reduce or look up
        return None, None

    stdout.write("Returned %d rows\n" % imloc.size)

    stdout.write('Getting latest runs\n') 
    ind = GetLatestRuns(imloc)
    imloc = imloc[ind]

    catloc = query_byvalue('location','id',imloc['cat_id'])

    return imloc, catloc
Ejemplo n.º 12
0
def dump_table_inchunks(tables_in, columns_in, fname, chunksize=1000000,
                        constraints='',
                        dryrun=False):
    """
    Select columns from one or more tables in row-number chunks and write
    each chunk to a file with sfile.write.

    parameters
    ----------
    tables_in: string or sequence of strings
        Table name(s).  The total row count is taken from the first table
        only.
    columns_in: string or sequence of strings
        Column(s) to select.
    fname: string
        Output file.  The first chunk written creates it, later chunks are
        appended.
    chunksize: int
        Number of rows requested per query.
    constraints: string
        Text placed verbatim after the rownum conditions in the where
        clause, so presumably it must begin with 'AND' when non-empty.
    dryrun: bool
        If True run the queries but do not write anything.

    NOTE(review): per the Oracle documentation a condition testing for
    rownum greater than a positive integer is always false, so every chunk
    after the first looks like it will come back empty.  Left unchanged
    because fixing it means restructuring the query -- confirm and fix.
    """
    import sfile
    conn = oracle_util.Connection()

    try:
        if isinstance(tables_in, str):
            tables = [tables_in]
        else:
            tables = tables_in
        if isinstance(columns_in, str):
            columns = [columns_in]
        else:
            columns = columns_in

        q="select count(*) from %s" % tables[0]
        stdout.write(q+'\n')
        res = conn.Execute(q)
        nrows = res['count(*)'][0]

        # '//' keeps these integers under python 3 as well
        nchunk = nrows//chunksize
        nleft = nrows % chunksize

        stdout.write('Total number of rows: %s\n' % nrows)
        stdout.write('Chunksize: %s\n' % chunksize)
        stdout.write('    Main chunks: %s\n' % nchunk)
        stdout.write('    leftover:    %s\n' % nleft)
        stdout.write("Output file: '%s'\n" % fname)

        nget = nchunk
        if nleft > 0:
            nget += 1

        colstr = ','.join(columns)
        tabstr = ','.join(tables)

        # becomes True after the first write so that an empty first chunk
        # does not turn the first real write into an append
        started = False
        for i in range(nget):

            # half-open row range [rowmin, rowmax), rows counted from 1
            rowmin = i*chunksize + 1
            rowmax = (i+1)*chunksize + 1
            q = """
        select 
            %s
        from
            %s
        where
            rownum >= %s
            AND rownum < %s
            %s
        """ % (colstr, tabstr, rowmin, rowmax, constraints)

            stdout.write(q+'\n')
            res = conn.Execute(q)

            if res is None:
                stderr.write("Found no rows\n")
                continue

            stdout.write("Found: %s\n" % len(res))

            if dryrun:
                continue

            if started:
                sfile.write(res, fname, append=True)
            else:
                sfile.write(res, fname)
                started = True
    finally:
        # release the connection even when a query or write fails
        conn.Close()
Ejemplo n.º 13
0
def collate_coadd_catim(band, outfile, getsrc=False):
    """

    join the catalog table (catalogtype='coadd_cat' and project='DES') to the
    location table, using parentid as the connection, and write the result
    to outfile with json_util.write

    Note this join is useful even if we didn't need the info since there are
    entries in the database for which the id info is nonsense and we have to
    skip them.

    we demand the band since band is not set in the database for many entries
    so we must set it explicitly

    if getsrc=True add a list of the source 'red' images that made up the
    coadd, stored under 'srclist' in each entry.  This depends on
        get_coadd_src_locations
            (get_coadd_id)
                (get_tile_run)

    parameters
    ----------
    band: string
        Used to match catalogname against '%_<band>_cat%' and written into
        the 'band' field of every entry and every source image.
    outfile: string
        Output file name.
    getsrc: bool
        Whether to add the source image lists.

    raises
    ------
    ValueError if the source list of a coadd cannot be found, or if it
    holds an image whose filetype is not 'red'.
    """

    q="""
    select
        catalog.id as catalogid,
        catalog.run as catalogrun,
        catalog.band,
        catalog.tilename,
        catalog.catalogname,
        catalog.parentid,
        location.run as coaddrun,
        location.filename as coaddname
    from
        catalog, location
    where
        catalog.catalogtype = 'coadd_cat' 
        and catalog.project = 'DES'
        and location.id = catalog.parentid
        and catalogname like '%%_%s_cat%%'
    order by
        catalog.run
    """ % band

    stdout.write(q+'\n')

    conn = oracle_util.Connection()
    try:
        # always a list of dicts, which is what gets written as json
        res = conn.Execute(q, dictlist=True, lower=True)
    finally:
        # release the connection even when the query fails
        conn.Close()

    if res is not None:
        for entry in res:
            entry['band'] = band

    if getsrc and res is not None:
        # add the single epoch coadd source images
        stdout.write('Getting src lists\n')
        for entry in res:
            coadd_id = entry['parentid']
            srclist = get_coadd_src_locations(coadd_id,dictlist=True)
            if srclist is None:
                raise ValueError('Could not get source list for id=%s\n' % coadd_id)
            ftype_bad = \
                [sl['filetype'] for sl in srclist if sl['filetype'] != 'red']
            if len(ftype_bad) > 0:
                raise ValueError("Expected 'red' type got '%s'\n" % ftype_bad[0])

            # fix up the bands
            for sl in srclist:
                if sl['band'] != band:
                    stdout.write('Fixing band\n')
                    sl['band'] = band
            entry['srclist'] = srclist

    stdout.write('Writing to file: %s\n' % outfile)
    json_util.write(res, outfile)
Ejemplo n.º 14
0
def get_coadd_src_locations(coadd_id=None, tilename=None, band=None, run=None, 
                            dictlist=False, verbose=False):
    """
    Get info about original SE 'red' images associated with a given coadd
    from the locations table.  This can be a complicated process.

    depends:
        (get_tile_run)
        (get_coadd_id)

    parameters
    ----------
    coadd_id: int, optional
        Id of the coadd.  When not given, the first id returned by
        get_coadd_id(tilename, band, run=run) is used.
    tilename, band, run: optional
        Only used to look up coadd_id when it is not given.
    dictlist: bool
        Passed through to Execute for the final location query.
    verbose: bool
        If True, echo the queries and the number of iterations to stdout.

    returns
    -------
    The result of the location query for the 'red' images, or None if the
    coadd id could not be found or any intermediate query returned None.

    raises
    ------
    ValueError if 'red' images are not reached within 5 parent lookups.
    """

    if coadd_id is None:
        coadd_ids = get_coadd_id(tilename, band, run=run, verbose=verbose)
        if coadd_ids is None:
            # no such coadd; indexing None would raise a TypeError
            return None
        coadd_id = coadd_ids[0]

    # Get a list of coadd_src images for the coadd_id
    query="""
        SELECT
            image.parentid
        FROM
            image,coadd_src
        WHERE
            coadd_src.coadd_imageid = %d
            AND coadd_src.src_imageid = image.id
    """ % coadd_id

    if verbose:
        sys.stdout.write('%s\n' % query)

    o = oracle_util.Connection()
    try:
        res = o.Execute(query,lower=True)

        if res is None:
            return None

        # now we need to find the single epoch red images we are looking for
        # typically we now have the ids of the remap images, which means the
        # very next query for parents will get 'red' but we might have to
        # iterate

        idstrings = [str(pid) for pid in res['parentid']]
        ftype = 'none'
        i=0
        itmax=5

        while (ftype != 'red') and (i < itmax):
            idlist = ', '.join(idstrings)
            query="""
            SELECT
                image.id,
                image.imagetype,
                image.parentid
            FROM
                image
            WHERE
                image.id in (%s)
        """ % idlist

            if verbose:
                sys.stdout.write('%s\n' % query)
            res = o.Execute(query, lower=True)
            if res is None:
                return None

            # ids for the next level up, in case this level is not 'red' yet
            idstrings = [str(pid) for pid in res['parentid']]
            # only the first row's type is inspected
            ftype = res['imagetype'][0]
            i += 1

        if ftype != 'red':
            raise ValueError("Reach itmax=%s before finding 'red' images. last is %s" % (itmax, ftype))

        # now the idlist comes from id instead of parentid
        idstrings = [str(imid) for imid in res['id']]
        idlist = ', '.join(idstrings)
        query="""
        select
            location.id,
            location.run,
            location.exposurename,
            location.filename,
            location.band,
            location.filetype,
            location.ccd
        from
            location
        where
            location.id in (%s)
    """ % idlist

        if verbose:
            sys.stdout.write('%s\n' % query)
        res = o.Execute(query, dictlist=dictlist, lower=True)
    finally:
        # one connection serves all the queries above; release it on every
        # exit path, including the early returns and the ValueError
        o.Close()

    if verbose:
        sys.stdout.write("# iterations: %s\n" % i)
    return res