Introduction to the Table Access Protocol (TAP) Service¶
Contact authors: Leanne Guy, Melissa Graham
Last verified to run: 2024-07-29
LSST Science Pipelines version: Weekly 2024_16
Container Size: medium
Targeted learning level: beginner
Description: Explore the DP0.2 catalogs with the TAP service.
Skills: Use the TAP service. Make simple ADQL queries. Visualize retrieved datasets.
LSST Data Products: Catalog schema. Object table.
Packages: lsst.rsp
Credit: Originally developed by Leanne Guy in the context of the Rubin DP0.1.
Get Support: Find DP0-related documentation and resources at dp0.lsst.io. Questions are welcome as new topics in the Support - Data Preview 0 Category of the Rubin Community Forum. Rubin staff will respond to all questions posted there.
1. Introduction¶
This notebook provides a beginner-level demonstration of how to use Astronomy Data Query Language (ADQL) to access DP0.2 catalog data via Rubin's Table Access Protocol (TAP) service.
The documentation for Data Preview 0.2 includes definitions of the data products, descriptions of catalog contents, and ADQL recipes. The RSP's Portal Aspect, with its graphical user interface, is also recommended for exploring the available catalogs and for testing queries.
1.1. TAP basics¶
TAP provides standardized access to catalog data for discovery, search, and retrieval. Full documentation for TAP is provided by the International Virtual Observatory Alliance (IVOA).
TAP Glossary
- schema - Database terminology for the abstract design that represents the storage of data in a database.
- tap_schema - The set of tables that describe the data tables and their columns.
- table collection - A collection of tables. E.g., dp02_dc2_catalogs.
- table - A collection of related data held in a table format in a database. E.g., dp02_dc2_catalogs.Object.
- query - A string formatted in ADQL that selects data from a table, with constraints if desired.
- results - The output of the TAP service's search method when a query is passed.
1.2. ADQL basics¶
The documentation for ADQL includes more information about syntax, keywords, operators, functions, and so on. ADQL is similar to SQL (Structured Query Language).
A typical ADQL statement has at least three components:
SELECT <columns> FROM <catalog> WHERE <constraints>
where <columns> is a comma-separated list of the columns to return, <catalog> is the name of the catalog to retrieve data from, and <constraints> imposes a restriction that only rows with column values that meet the constraints are returned.
For example, say there is a catalog called "mysurveydata" with 5 columns, "col1", "col2", and so on. The ADQL statement:
SELECT col3, col4, col5 FROM mysurveydata WHERE col1 > 0.5 AND col5 < 10
would return a table that has three columns, and as many rows as meet both of the restrictions in the WHERE statement.
As the DP0.2 catalogs are very large, an ADQL statement that returns an entire table (SELECT * FROM mysurveydata) should not be used.
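To preview a table's contents safely, a TOP clause can cap the number of rows returned. A minimal sketch, building the query as a Python string ("mysurveydata" is the hypothetical example table from above, not a real catalog):

```python
# Preview only a few rows rather than retrieving the entire table.
# "mysurveydata" is the hypothetical example table from the text above.
n_preview = 10
query = "SELECT TOP " + str(n_preview) + " col3, col4, col5 FROM mysurveydata"
print(query)
```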
1.3. What is not covered in this tutorial?¶
The following intermediate-level TAP functionalities for retrieving catalog data are not demonstrated in this tutorial, but are covered in other tutorials.
See DP0.2 tutorial notebook 02b for:
- table joins
- renaming columns
- applying mathematical functions
- converting fluxes to magnitudes
- querying and visualizing large data sets
See DP0.2 tutorial notebook 02c for ObsTAP queries for images (metadata and pixel data).
1.4. Recommendations for TAP queries¶
The following recommendations are all demonstrated in Section 3.
1.4.1. Use asynchronous queries¶
In Section 2, synchronous queries are used with results = service.search(query).
This is OK for querying schema or small amounts of data, but when more data is being retrieved it is recommended to use asynchronous jobs with job = service.submit_job(query), as demonstrated in Section 3.
1.4.2. Include coordinate constraints¶
When possible include coordinate constraints (e.g., use a cone search). The TAP-accessible tables are sharded by coordinate (RA, Dec). ADQL query statements that include constraints by coordinate do not require a whole-catalog search, and are typically faster (and can be much faster) than ADQL query statements which only include constraints for other columns.
1.4.3. Constrain detect_isPrimary = True¶
As a default, it is recommended to include a constraint of detect_isPrimary = True in queries for the Object, Source, and ForcedSource catalogs.
This parameter is True if a source has no children, is in the inner region of a coadd patch, is in the inner region of a coadd tract, and is not detected in a pseudo-filter.
Including this constraint will remove any duplicates (i.e., will not include both a parent and its deblended children).
Only remove this constraint in situations where duplicates are desired.
1.4.4. If limiting rows, use TOP¶
Use of TOP is preferred to maxrec because most TAP services map maxrec to SELECT TOP on the back end anyway.
Using TOP ensures that queries are copy-pasteable between interfaces (e.g., into the Portal Aspect).
1.4.5. If sorting, take care with ORDER BY¶
Combined use of TOP and ORDER BY in ADQL queries can be dangerous: it may take an unexpectedly long time because the database is trying to first sort, and then extract the top N elements. It is best to only combine TOP and ORDER BY if the query's WHERE statements significantly cut down the number of objects that would need to be sorted.
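Putting these recommendations together, a safe TOP + ORDER BY query keeps a restrictive WHERE clause so that only a small set of rows is sorted. A sketch, using the DP0.2 Object table and the cone-search syntax demonstrated later in Section 3:

```python
# The cone-search WHERE clause cuts the result down to a small region
# first, so sorting before TOP is cheap.
query = ("SELECT TOP 20 coord_ra, coord_dec "
         "FROM dp02_dc2_catalogs.Object "
         "WHERE CONTAINS(POINT('ICRS', coord_ra, coord_dec), "
         "CIRCLE('ICRS', 62.0, -37.0, 0.01)) = 1 "
         "AND detect_isPrimary = 1 "
         "ORDER BY coord_ra ASC")
print(query)
```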
1.5. Import packages¶
Import general python packages (pandas, numpy, and matplotlib), two classes from astropy, and the Rubin Science Platform (RSP) TAP service.
import pandas
import numpy as np
import matplotlib.pyplot as plt
import astropy.units as u
from astropy.visualization.wcsaxes import SphericalCircle
from lsst.rsp import get_tap_service, retrieve_query
1.6. Define functions and parameters¶
Get an instance of the TAP service, and assert that it exists.
service = get_tap_service("tap")
assert service is not None
Set the maximum number of rows to display from pandas.
pandas.set_option('display.max_rows', 20)
2. Explore the TAP schema¶
This section will use ADQL queries of increasing complexity to both explore the available catalog data and to demonstrate how to use the TAP service and ADQL.
2.1. Synchronous queries¶
This section uses "synchronous" TAP queries. This means that the query is run and the results are retrieved at the same time. No other cells can be run while this is happening.
Since the queries in this section are very simple, and are only retrieving schemas (not data), they are very quick and synchronous queries work fine. However, when data is retrieved from catalogs, asynchronous queries should be used (Section 3).
2.2. List all catalogs (schema)¶
Create an ADQL query that selects all columns (*) from tap_schema.schemas.
The results of the query will be a list of available schemas (in other words, the available catalogs).
Store it in a string named query.
query = 'SELECT * FROM tap_schema.schemas'
Execute the query by passing query to the TAP service's search method, and store the output in results.
results = service.search(query)
Print the type of results.
print(type(results))
<class 'pyvo.dal.tap.TAPResults'>
TAPResults is a python class from the PyVO Data Access package.
The documentation for TAPResults has more information about the class and its methods.
Typically, for convenience it is recommended to convert the results into an Astropy table.
Rerun the query, but store the results as an astropy table with the to_table() method.
results_table = service.search(query).to_table()
Print the type of results_table and see that it is an astropy table.
print(type(results_table))
<class 'astropy.table.table.Table'>
Display the table.
results_table
description | schema_index | schema_name | utype |
---|---|---|---|
str512 | int32 | str64 | str512 |
Data Preview 0.1 includes five tables based on the DESC's Data Challenge 2 simulation of 300 square degrees of the wide-fast-deep LSST survey region after 5 years. All tables contain objects detected in coadded images. | 1 | dp01_dc2_catalogs | |
Data Preview 0.2 contains the image and catalog products of the Rubin Science Pipelines v23 processing of the DESC Data Challenge 2 simulation, which covered 300 square degrees of the wide-fast-deep LSST survey region over 5 years. | 0 | dp02_dc2_catalogs | |
ObsCore v1.1 attributes in ObsTAP realization | 2 | ivoa | |
A TAP-standard-mandated schema to describe tablesets in a TAP 1.1 service | 100000 | tap_schema | |
UWS Metadata | 120000 | uws |
The table above shows that the DP0.2 data schema_name is dp02_dc2_catalogs.
"DC2" stands for "Data Challenge 2", the name of the effort by the Dark Energy Science Collaboration to create the simulated data (The DESC DC2 Simulated Sky Survey).
Although the description says "Data Preview 0.2 contains the image and catalog products...", dp02_dc2_catalogs contains only catalog data; image data for DP0.2 is stored in the ObsCore table, with schema_name = ivoa.
Accessing image data via the TAP service is covered in another tutorial.
The above table is quite short, and it is obvious from looking at it that the table collection for DP0.2 is dp02_dc2_catalogs.
However, there may be times in the future when there are many more schemas available.
The following demonstrates a way to search for catalogs by name.
Use a for loop to look for the presence of dp02 in the schema_name column for every row of the results table, and print the name when there is a match.
for name in results_table['schema_name']:
    if name.find('dp02') > -1:
        print(name)
dp02_dc2_catalogs
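An equivalent and more compact alternative to the for loop is a list comprehension. A small sketch, using a stand-in list in place of the real results_table['schema_name'] column:

```python
# A list comprehension collects all matching names in one line.
# schema_names stands in for results_table['schema_name'].
schema_names = ['dp01_dc2_catalogs', 'dp02_dc2_catalogs', 'ivoa',
                'tap_schema', 'uws']
matches = [name for name in schema_names if name.find('dp02') > -1]
print(matches)
```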
Clean up by deleting the query and its results.
del query, results, results_table
2.3. List all tables in the DP0.2 catalog¶
Create a query that selects all columns from tap_schema.tables for the dp02_dc2_catalogs schema.
Add an ORDER BY statement to return the results sorted by table_index.
This query will return the names of all tables that are available in the dp02_dc2_catalogs.
query = "SELECT * FROM tap_schema.tables " \
        "WHERE tap_schema.tables.schema_name = 'dp02_dc2_catalogs' " \
        "ORDER BY table_index ASC"
Use a synchronous query and return the results as an astropy table.
results = service.search(query).to_table()
Display the results to see the tables in the DP0.2 schema.
results
description | schema_name | table_index | table_name | table_type | utype |
---|---|---|---|---|---|
str512 | str512 | int32 | str64 | str8 | str512 |
Properties of the astronomical objects detected and measured on the deep coadded images. | dp02_dc2_catalogs | 1 | dp02_dc2_catalogs.Object | table | |
Properties of detections on the single-epoch visit images, performed independently of the Object detections on coadded images. | dp02_dc2_catalogs | 2 | dp02_dc2_catalogs.Source | table | |
Forced-photometry measurements on individual single-epoch visit images and difference images, based on and linked to the entries in the Object table. Point-source PSF photometry is performed, based on coordinates from a reference band chosen for each Object and reported in the Object.refBand column. | dp02_dc2_catalogs | 3 | dp02_dc2_catalogs.ForcedSource | table | |
Properties of time-varying astronomical objects based on association of data from one or more spatially-related DiaSource detections on individual single-epoch difference images. | dp02_dc2_catalogs | 4 | dp02_dc2_catalogs.DiaObject | table | |
Properties of transient-object detections on the single-epoch difference images. | dp02_dc2_catalogs | 5 | dp02_dc2_catalogs.DiaSource | table | |
Point-source forced-photometry measurements on individual single-epoch visit images and difference images, based on and linked to the entries in the DiaObject table. | dp02_dc2_catalogs | 6 | dp02_dc2_catalogs.ForcedSourceOnDiaObject | table | |
Metadata about the pointings of the DC2 simulated survey, largely associated with the boresight of the entire focal plane. | dp02_dc2_catalogs | 7 | dp02_dc2_catalogs.Visit | table | |
Metadata about the 189 individual CCD images for each Visit in the DC2 simulated survey. | dp02_dc2_catalogs | 8 | dp02_dc2_catalogs.CcdVisit | table | |
Static information about the subset of tracts and patches from the standard LSST skymap that apply to coadds in these catalogs | dp02_dc2_catalogs | 9 | dp02_dc2_catalogs.CoaddPatches | table | |
Summary properties of objects from the DESC DC2 truth catalog, as described in arXiv:2101.04855. Includes the noiseless astrometric and photometric parameters. | dp02_dc2_catalogs | 10 | dp02_dc2_catalogs.TruthSummary | table | |
Match information for TruthSummary objects. | dp02_dc2_catalogs | 11 | dp02_dc2_catalogs.MatchesTruth | table |
Clean up.
del query, results
2.4. List all columns in the Object table¶
For the example, use the first table: the Object table (see Section 3).
The following query selects four columns (column name, data type, description, and unit) from the tap_schema.columns table, only for the Object table.
query = "SELECT column_name, datatype, description, unit " \
"FROM tap_schema.columns " \
"WHERE table_name = 'dp02_dc2_catalogs.Object'"
Run the synchronous query and store results in an astropy table.
results = service.search(query).to_table()
Display the results.
results
column_name | datatype | description | unit |
---|---|---|---|
str64 | str64 | str512 | str64 |
coord_dec | double | Fiducial ICRS Declination of centroid used for database indexing | deg |
coord_ra | double | Fiducial ICRS Right Ascension of centroid used for database indexing | deg |
deblend_nChild | int | Number of children this object has (defaults to 0) | |
deblend_skipped | boolean | Deblender skipped this source | |
detect_fromBlend | boolean | This source is deblended from a parent with more than one child. | |
detect_isDeblendedModelSource | boolean | True if source has no children and is in the inner region of a coadd patch and is in the inner region of a coadd tract and is not a sky source and is a deblended child | |
detect_isDeblendedSource | boolean | True if source has no children and is in the inner region of a coadd patch and is in the inner region of a coadd tract and is not a sky source and is either an unblended isolated source or a deblended child from a parent with | |
detect_isIsolated | boolean | This source is not a part of a blend. | |
detect_isPatchInner | boolean | True if source is in the inner region of a coadd patch | |
detect_isPrimary | boolean | True if source has no children and is in the inner region of a coadd patch and is in the inner region of a coadd tract and is not a sky source | |
... | ... | ... | ... |
z_pixelFlags_suspect | boolean | Source's footprint includes suspect pixels. Measured on z-band. | |
z_pixelFlags_suspectCenter | boolean | Source's center is close to suspect pixels. Measured on z-band. | |
z_psfFlux | double | Flux derived from linear least-squares fit of PSF model. Forced on z-band. | nJy |
z_psfFlux_area | float | Effective area of PSF. Forced on z-band. | pixel |
z_psfFlux_flag | boolean | General Failure Flag. Forced on z-band. | |
z_psfFlux_flag_apCorr | boolean | Set if unable to aperture correct base_PsfFlux. Forced on z-band. | |
z_psfFlux_flag_edge | boolean | Object was too close to the edge of the image to use the full PSF model. Forced on z-band. | |
z_psfFlux_flag_noGoodPixels | boolean | Not enough non-rejected pixels in data to attempt the fit. Forced on z-band. | |
z_psfFluxErr | double | Flux uncertainty derived from linear least-squares fit of PSF model. Forced on z-band. | nJy |
z_ra | double | Position in Right Ascension. Measured on z-band. | deg |
Above, notice that the table is very long (991 rows) and the display has been truncated (the '...' represents skipped rows). There are too many columns to read through.
Use a for loop to look for the presence of coord in the column_name column for every row of the results table, and print the name when there is a match.
search_string = 'coord'
for cname in results['column_name']:
    if cname.find(search_string) > -1:
        print(cname)
coord_dec
coord_ra
Repeat the above exercise, but for all columns that are related to the g-band PSF (point spread function) flux measurements. This flux measurement is appropriate to use for point-like objects, like stars.
Notice that there is a flux, and error, and several flag values. Flags indicate various warnings, e.g., if the source was close to the edge of the detector and thus might be missing some flux.
search_string = 'g_psfFlux'
for cname in results['column_name']:
    if cname.find(search_string) > -1:
        print(cname)
g_psfFlux
g_psfFlux_area
g_psfFlux_flag
g_psfFlux_flag_apCorr
g_psfFlux_flag_edge
g_psfFlux_flag_noGoodPixels
g_psfFluxErr
The datatype column has a limited set of values.
Print the unique data types.
print(np.unique(results['datatype']))
datatype
--------
boolean
char
double
float
int
long
The unit column also has a limited set of values.
Print the unique set of units used in the Object table.
print(np.unique(results['unit']))
unit
--------
deg
nJy
pixel
pixel**2
Clean up.
del query, results
3. Query the DP0.2 Object table¶
The Object table (dp02_dc2_catalogs.Object) contains measurements for all objects detected in the deep coadd images (also called stacked or combined images).
It includes objects detected with a signal-to-noise ratio of at least five in at least one filter.
Detections are deblended: e.g., overlapping galaxies (blended sources in the image) are split into individual objects (referred to as 'parent' and 'child' objects).
The measurements of these objects, such as shapes, sizes, and fluxes, are made in all filters.
3.1. Asynchronous queries¶
This section uses "asynchronous" TAP queries. This means that the query is submitted as a job to the TAP service, and it can run in the background until it completes. The results can then be retrieved right away, or at a later time. Other cells can be run while this is happening.
Since the queries in this section are more complex, and retrieving rows of data (not just schema), asynchronous queries are used.
3.2. Cone search¶
A cone search means a catalog query that returns all objects within a given radius of a sky coordinate. Since a given angular diameter corresponds to a larger physical diameter at larger distances, the volume queried is a cone, not a cylinder.
In ADQL, a cone search is executed with WHERE CONTAINS(POINT(), CIRCLE()) = 1.
- POINT() passes the catalog's columns for sky coordinates.
- CIRCLE() defines the center and radius of the search circle.
- CONTAINS() = 1 constrains the query to only return rows for which the statement "this circle contains this point" is "True" (=1).
In Section 2.4, the columns for sky coordinates in the Object catalog were shown to be coord_ra and coord_dec, with units of degrees.
The approximate center of the DP0.2 area is RA, Dec = 62.0, -37.0 (decimal degrees).
A conservative radius that ensures a quick query with a limited number of rows returned is 0.01 degrees (36 arcsec).
The following query would return the coord_ra and coord_dec columns for all rows of the Object table which are within 0.01 degrees of RA, Dec = 62.0, -37.0, and for which the detect_isPrimary column is "True" (as recommended above).
The 'ICRS' stands for "International Celestial Reference System", the reference frame for the coordinates.
SELECT coord_ra, coord_dec FROM dp02_dc2_catalogs.Object
WHERE CONTAINS(POINT('ICRS', coord_ra, coord_dec), CIRCLE('ICRS', 62, -37, 0.01)) = 1
AND detect_isPrimary = 1
Define the center coordinates and the radius.
TAP queries are created as strings, so define str_center_coords and str_radius as strings which can be inserted into the query string.
center_ra = 62
center_dec = -37
radius = 0.01
str_center_coords = str(center_ra) + ", " + str(center_dec)
str_radius = str(radius)
Create the query string, and print it.
query = "SELECT coord_ra, coord_dec "\
"FROM dp02_dc2_catalogs.Object "\
"WHERE CONTAINS(POINT('ICRS', coord_ra, coord_dec), "\
"CIRCLE('ICRS', " + str_center_coords + ", " + str_radius + ")) = 1 "\
"AND detect_isPrimary = 1"
print(query)
SELECT coord_ra, coord_dec FROM dp02_dc2_catalogs.Object WHERE CONTAINS(POINT('ICRS', coord_ra, coord_dec), CIRCLE('ICRS', 62, -37, 0.01)) = 1 AND detect_isPrimary = 1
Submit the query as an asynchronous job to the TAP service.
job = service.submit_job(query)
print('Job URL is', job.url)
print('Job phase is', job.phase)
Job URL is https://data.lsst.cloud/api/tap/async/jwzhncdb7gm0mw39
Job phase is PENDING
Run the job.
job.run()
<pyvo.dal.tap.AsyncTAPJob at 0x7b477dcc4590>
Wait for the job status to be either "COMPLETED" or "ERROR".
This is not mandatory, but is recommended; if it is not run, there will be no other automatic notification that the job is no longer running. However, note that if this cell is executed then no other cells can be executed while the job runs in the background.
job.wait(phases=['COMPLETED', 'ERROR'])
print('Job phase is', job.phase)
Job phase is COMPLETED
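If blocking the notebook is undesirable, an alternative is to check the job's phase attribute periodically and only fetch results once it reports "COMPLETED". A minimal sketch of that polling pattern, using a hypothetical stand-in object in place of a real pyvo AsyncTAPJob (a real job's phase is set by the TAP service):

```python
import time


class StubJob:
    """Hypothetical stand-in for pyvo's AsyncTAPJob, for illustration only."""

    def __init__(self):
        self._checks = 0

    @property
    def phase(self):
        # Pretend the job finishes after being checked a few times.
        self._checks += 1
        return 'EXECUTING' if self._checks < 3 else 'COMPLETED'


stub_job = StubJob()
while stub_job.phase not in ('COMPLETED', 'ERROR', 'ABORTED'):
    time.sleep(0.1)  # with a real job, poll far less often
print('Job phase is', stub_job.phase)
```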
Optional: If the status returned was "ERROR", uncomment and execute this cell to print the error messages.
# job.raise_if_error()
If the status returned was "COMPLETED", execute this cell to retrieve the query results as an astropy table and print the length of the table.
results = job.fetch_result().to_table()
print(len(results))
173
Optional: Uncomment and execute to display the table contents.
# results
Plot the coordinates, right ascension (RA) vs. declination (Dec).
Use the astropy class SphericalCircle to shade the query region.
This class takes into account the "cos-dec" factor (for points off the celestial equator, i.e., at non-zero declination, the real distance in the right ascension axis is smaller by a factor of the cosine of the declination).
fig = plt.figure(figsize=(4, 4))
region = SphericalCircle((center_ra * u.deg, center_dec * u.deg),
                         radius * u.deg, alpha=0.2, color='blue')
plt.gca().add_patch(region)
plt.plot(results['coord_ra'], results['coord_dec'],
         'o', alpha=0.5, color='black', mew=0)
plt.xlabel('RA')
plt.ylabel('Dec')
plt.show()
Figure 1: The Right Ascension (RA) versus Declination (Dec) coordinates for Objects retrieved by the query (black dots) within the query region (blue circle).
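The size of the cos-dec factor mentioned above can be checked numerically: at the declination of this query region, a circle of true angular radius 0.01 degrees spans a somewhat wider range in the raw RA coordinate.

```python
import numpy as np

# True east-west angular distance = (delta RA) * cos(Dec), so the raw RA
# half-width of a circle of true radius 0.01 deg at Dec = -37 deg is wider.
dec = -37.0
radius = 0.01
delta_ra = radius / np.cos(np.radians(dec))
print(delta_ra)
```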
Clean up (and save memory) by deleting the job and its results.
job.delete()
del query, results
3.3. Limit rows returned with TOP¶
For debugging and testing queries, it can be useful to only retrieve a subset of the rows which meet the query constraints, because this is faster.
Alter the query used above to use TOP to return only N rows.
N = 20
query = "SELECT TOP " + str(N) + " coord_ra, coord_dec "\
"FROM dp02_dc2_catalogs.Object "\
"WHERE CONTAINS(POINT('ICRS', coord_ra, coord_dec), "\
"CIRCLE('ICRS', " + str_center_coords + ", " + str_radius + ")) = 1 "\
"AND detect_isPrimary = 1"
print(query)
SELECT TOP 20 coord_ra, coord_dec FROM dp02_dc2_catalogs.Object WHERE CONTAINS(POINT('ICRS', coord_ra, coord_dec), CIRCLE('ICRS', 62, -37, 0.01)) = 1 AND detect_isPrimary = 1
Run the job asynchronously and wait until it is finished.
job = service.submit_job(query)
job.run()
job.wait(phases=['COMPLETED', 'ERROR'])
print('Job phase is', job.phase)
Job phase is COMPLETED
results = job.fetch_result().to_table()
print(len(results))
20
fig = plt.figure(figsize=(4, 4))
region = SphericalCircle((center_ra * u.deg, center_dec * u.deg),
                         radius * u.deg, alpha=0.2, color='blue')
plt.gca().add_patch(region)
plt.plot(results['coord_ra'], results['coord_dec'],
         'o', alpha=0.5, color='black', mew=0)
plt.xlabel('RA')
plt.ylabel('Dec')
plt.show()
Figure 2: The Right Ascension (RA) versus Declination (Dec) coordinates for only the top 20 Objects retrieved by the query (black dots) within the query region (blue circle). All of the black dots are in the lower half of the blue circle.
Clean up.
job.delete()
del query, results
3.4. Use of maxrec instead of TOP¶
TAP queries run in the Notebook Aspect of the RSP can also use the maxrec keyword for the TAP service.
Use of TOP is preferred, as described in Section 1.4.4, but they work the same way from a Jupyter Notebook.
Use the same query as above, but without TOP.
query = "SELECT coord_ra, coord_dec "\
"FROM dp02_dc2_catalogs.Object "\
"WHERE CONTAINS(POINT('ICRS', coord_ra, coord_dec), "\
"CIRCLE('ICRS', " + str_center_coords + ", " + str_radius + ")) = 1 "\
"AND detect_isPrimary = 1"
print(query)
SELECT coord_ra, coord_dec FROM dp02_dc2_catalogs.Object WHERE CONTAINS(POINT('ICRS', coord_ra, coord_dec), CIRCLE('ICRS', 62, -37, 0.01)) = 1 AND detect_isPrimary = 1
Include maxrec as a keyword when submitting the query to the TAP service. Run the job.
job = service.submit_job(query, maxrec=N)
job.run()
job.wait(phases=['COMPLETED', 'ERROR'])
print('Job phase is', job.phase)
Job phase is COMPLETED
Retrieve the job results.
Warning: Use of maxrec might return a DALOverflowWarning when the results are retrieved. This warns the user that partial results have been returned. In this case, it is OK to ignore this warning, because the query's intent was to return partial results by using maxrec.
results = job.fetch_result().to_table()
print(len(results))
20
/opt/lsst/software/stack/conda/miniconda3-py38_4.9.2/envs/lsst-scipipe-8.0.0/lib/python3.11/site-packages/pyvo/dal/query.py:325: DALOverflowWarning: Partial result set. Potential causes MAXREC, async storage space, etc. warn("Partial result set. Potential causes MAXREC, async storage space, etc.",
Plot the results.
fig = plt.figure(figsize=(4, 4))
region = SphericalCircle((center_ra * u.deg, center_dec * u.deg),
                         radius * u.deg, alpha=0.2, color='blue')
plt.gca().add_patch(region)
plt.plot(results['coord_ra'], results['coord_dec'],
         'o', alpha=0.5, color='black', mew=0)
plt.xlabel('RA')
plt.ylabel('Dec')
plt.show()
Figure 3: Identical to Figure 2.
Clean up.
job.delete()
del query, results
3.5. Sort results with ORDER BY¶
As described in Section 1.4.5, use ORDER BY and TOP together with caution.
The TAP service first applies WHERE constraints, then ORDER BY, and then TOP.
If the query is not well constrained, i.e., if thousands or more objects meet the WHERE constraints, then they all must first be sorted before the top number are returned.
This is a waste of time and compute resources.
Create the query. Add an ORDER BY statement to the TAP query to return the TOP N objects sorted by coord_ra, in ascending (ASC) order.
query = "SELECT TOP " + str(N) + " coord_ra, coord_dec "\
"FROM dp02_dc2_catalogs.Object "\
"WHERE CONTAINS(POINT('ICRS', coord_ra, coord_dec), "\
"CIRCLE('ICRS', " + str_center_coords + ", " + str_radius + ")) = 1 "\
"AND detect_isPrimary = 1 "\
"ORDER BY coord_ra ASC"
print(query)
SELECT TOP 20 coord_ra, coord_dec FROM dp02_dc2_catalogs.Object WHERE CONTAINS(POINT('ICRS', coord_ra, coord_dec), CIRCLE('ICRS', 62, -37, 0.01)) = 1 AND detect_isPrimary = 1 ORDER BY coord_ra ASC
Run the job.
job = service.submit_job(query)
job.run()
job.wait(phases=['COMPLETED', 'ERROR'])
print('Job phase is', job.phase)
Job phase is COMPLETED
Retrieve the results.
results = job.fetch_result().to_table()
print(len(results))
20
Plot the results.
fig = plt.figure(figsize=(4, 4))
region = SphericalCircle((center_ra * u.deg, center_dec * u.deg),
                         radius * u.deg, alpha=0.2, color='blue')
plt.gca().add_patch(region)
plt.plot(results['coord_ra'], results['coord_dec'],
         'o', alpha=0.5, color='black', mew=0)
plt.xlabel('RA')
plt.ylabel('Dec')
plt.show()
Figure 4: Similar to Figure 2, except the top 20 Objects returned (black dots) are all on the left-most edge of the blue circle, because they have the lowest RA values, and the query results were sorted by RA in ascending order before the top 20 were selected.
Clean up.
job.delete()
del query, results
3.6. Sort results with pandas¶
The pandas package provides high-performance, easy-to-use data structures and data analysis tools for the Python programming language.
TAP query results can be converted to pandas dataframes, and then pandas functionality (such as sorting) can be applied to the dataframe.
Use the same query as above for a small, unsorted set of Objects.
query = "SELECT coord_ra, coord_dec "\
"FROM dp02_dc2_catalogs.Object "\
"WHERE CONTAINS(POINT('ICRS', coord_ra, coord_dec), "\
"CIRCLE('ICRS', " + str_center_coords + ", " + str_radius + ")) = 1 "\
"AND detect_isPrimary = 1"
print(query)
SELECT coord_ra, coord_dec FROM dp02_dc2_catalogs.Object WHERE CONTAINS(POINT('ICRS', coord_ra, coord_dec), CIRCLE('ICRS', 62, -37, 0.01)) = 1 AND detect_isPrimary = 1
Run the job.
job = service.submit_job(query)
job.run()
job.wait(phases=['COMPLETED', 'ERROR'])
print('Job phase is', job.phase)
Job phase is COMPLETED
Retrieve the results, and use the to_pandas() method to convert results to a pandas dataframe.
results = job.fetch_result().to_table().to_pandas()
print(len(results))
173
Print the type of results and see that it is a pandas dataframe.
print(type(results))
<class 'pandas.core.frame.DataFrame'>
Display the results.
results
coord_ra | coord_dec | |
---|---|---|
0 | 61.989258 | -37.005119 |
1 | 61.997438 | -37.005796 |
2 | 62.003285 | -37.006248 |
3 | 61.998238 | -37.007123 |
4 | 62.003341 | -37.002536 |
... | ... | ... |
168 | 61.990251 | -36.996347 |
169 | 61.989260 | -36.995563 |
170 | 61.990184 | -36.995566 |
171 | 61.992685 | -36.998426 |
172 | 61.992210 | -36.998456 |
173 rows × 2 columns
In general, the order of results from TAP queries cannot be assumed to be the same every time, and they will not necessarily be sorted unless ORDER BY has been used in the query statement.
A pandas dataframe has a built-in method, sort_values, for sorting on any given column.
Use sort_values to sort the dataframe by coord_ra, save it as a new dataframe named sorted_results, and display the new sorted dataframe.
sorted_results = results.sort_values('coord_ra')
sorted_results
coord_ra | coord_dec | |
---|---|---|
161 | 61.988079 | -36.999024 |
164 | 61.988408 | -36.998968 |
154 | 61.988546 | -36.997821 |
165 | 61.988612 | -37.001517 |
0 | 61.989258 | -37.005119 |
... | ... | ... |
82 | 62.010771 | -36.998845 |
79 | 62.010843 | -36.999844 |
98 | 62.010987 | -36.996173 |
97 | 62.011207 | -36.997063 |
128 | 62.012241 | -36.999059 |
173 rows × 2 columns
Notice that the index values did not update, and are not in the order of the sorted dataframe.
Use the pandas method set_index to reset the index of the sorted_results dataframe.
sorted_results.set_index(np.array(range(len(sorted_results))), inplace=True)
sorted_results
coord_ra | coord_dec | |
---|---|---|
0 | 61.988079 | -36.999024 |
1 | 61.988408 | -36.998968 |
2 | 61.988546 | -36.997821 |
3 | 61.988612 | -37.001517 |
4 | 61.989258 | -37.005119 |
... | ... | ... |
168 | 62.010771 | -36.998845 |
169 | 62.010843 | -36.999844 |
170 | 62.010987 | -36.996173 |
171 | 62.011207 | -36.997063 |
172 | 62.012241 | -36.999059 |
173 rows × 2 columns
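An equivalent, and arguably more idiomatic, way to renumber rows after sorting is pandas' reset_index method with drop=True. A small sketch with a stand-in dataframe:

```python
import pandas

# reset_index(drop=True) renumbers rows 0..N-1 and discards the old,
# out-of-order index, matching the set_index call above.
df = pandas.DataFrame({'coord_ra': [62.01, 61.99, 62.00]})
sorted_df = df.sort_values('coord_ra').reset_index(drop=True)
print(sorted_df)
```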
Clean up.
job.delete()
del query, results, sorted_results
4. Retrieve query results with job URL¶
Job results are generally available from previously run queries, and can be retrieved if the URL of the job is known and if the job has not been deleted.
Do not use job.delete() if the results will be retrieved later!
First, execute the same query as used above.
query = "SELECT coord_ra, coord_dec "\
"FROM dp02_dc2_catalogs.Object "\
"WHERE CONTAINS(POINT('ICRS', coord_ra, coord_dec), "\
"CIRCLE('ICRS', " + str_center_coords + ", " + str_radius + ")) = 1 "\
"AND detect_isPrimary = 1"
print(query)
job = service.submit_job(query)
job.run()
job.wait(phases=['COMPLETED', 'ERROR'])
print('Job phase is', job.phase)
SELECT coord_ra, coord_dec FROM dp02_dc2_catalogs.Object WHERE CONTAINS(POINT('ICRS', coord_ra, coord_dec), CIRCLE('ICRS', 62, -37, 0.01)) = 1 AND detect_isPrimary = 1
Job phase is COMPLETED
Instead of using job.fetch_result(), store the job.url as my_job_url and print it.
my_job_url = str(job.url)
print(my_job_url)
https://data.lsst.cloud/api/tap/async/x81dgbscrcy1ddys
This URL can be used to retrieve the query results.
The URL could be shared with another user of the Rubin TAP service, and they could retrieve the same results.
Retrieve the job by passing my_job_url to retrieve_query, then retrieve the results with fetch_result().
retrieved_job = retrieve_query(my_job_url)
retrieved_results = retrieved_job.fetch_result().to_table().to_pandas()
retrieved_results
coord_ra | coord_dec | |
---|---|---|
0 | 61.989258 | -37.005119 |
1 | 61.997438 | -37.005796 |
2 | 62.003285 | -37.006248 |
3 | 61.998238 | -37.007123 |
4 | 62.003341 | -37.002536 |
... | ... | ... |
168 | 61.990251 | -36.996347 |
169 | 61.989260 | -36.995563 |
170 | 61.990184 | -36.995566 |
171 | 61.992685 | -36.998426 |
172 | 61.992210 | -36.998456 |
173 rows × 2 columns
Clean up.
job.delete()
del query, retrieved_results
4.1. Retrieve results from a Portal query¶
It is also possible to retrieve the results of queries executed in the Portal Aspect of the Rubin Science Platform.
4.1.1. Run an ADQL query in the Portal¶
In a new browser tab, go to data.lsst.cloud and enter the Portal Aspect.
Click on the tab "DP0.2 Catalogs" at the top of the screen.
Click "Edit ADQL" at upper right.
Copy-paste the following query into the ADQL box as shown in the screenshot below.
SELECT coord_ra, coord_dec FROM dp02_dc2_catalogs.Object
WHERE CONTAINS(POINT('ICRS', coord_ra, coord_dec), CIRCLE('ICRS', 62, -37, 0.01)) = 1
AND detect_isPrimary = 1
Figure 5: A screenshot of the Portal's ADQL interface, with the query statement copied in.
Click "Search" in the lower left corner of the Portal.
4.1.2. Get the job URL from the Portal¶
The default results view will appear as in the screenshot below.
Figure 6: A screenshot of the Portal's results view for the ADQL query in Figure 5.
The search results have been automatically saved and assigned a URL.
Click on the "Info" button (the letter i in a circle), which is in the upper right-hand corner of the table (bottom of the screen).
The pop-up window contains the URL (the Job Link).
Figure 7: A screenshot of the table information, including the Job URL.
4.1.3. Retrieve the results¶
Follow the instructions above to create a new URL.
Warning: Using the job URL in the screenshot above will not work; it has expired.
Copy the newly created URL into the empty quotes below to define my_portal_url.
Uncomment and execute the following cells to obtain the results of the Portal query here in the Notebook.
# my_portal_url = ''
# retrieved_job = retrieve_query(my_portal_url)
# retrieved_results = retrieved_job.fetch_result().to_table().to_pandas()
# retrieved_results
Delete the retrieved job and clean up.
# retrieved_job.delete()
# del retrieved_results