IsmailM · June 11, 2020 22:21
diff --git a/PGP_fastq_files.sh b/PGP_fastq_files.sh
 # Export the FASTQ details of every whole-genome (WGS) record to wgs_fastqs.csv.
 # Uses jq (https://stedolan.github.io/jq/) and
 # the PGP API v1.2 - https://www.personalgenomes.org.uk/api/v1.2/
 #
 # Each CSV row holds: hex_id, then the fastq_ftp value of every .data entry,
 # then the fastq_md5 value of every .data entry, then one size per
 # ";"-separated item of fastq_bytes, divided by 1024^3 (i.e. GiB, presuming the
 # field really is a byte count - confirm against the API).
 #
 # Note: the rows are ragged. fastq_bytes is split per file while fastq_ftp and
 # fastq_md5 are not, and some records have three fastq files, so the CSV
 # columns do not fully line up between records.
 #
 # --fail makes curl exit non-zero on an HTTP error instead of piping the error
 # body into jq; --silent/--show-error hide the progress meter but keep error
 # messages. GET is curl's default method, so no -X is needed.
 curl --fail --silent --show-error \
   -H "accept: application/json" \
   "https://www.personalgenomes.org.uk/api/v1.2/all_wgs" \
   | jq -r '
 .[] | [
        .hex_id,
        (.data[]?.fastq_ftp),
        (.data[]?.fastq_md5),
        (.data[]?.fastq_bytes | split(";") | .[] | tonumber | . /1024/1024/1024)
 ] | flatten | @csv' > wgs_fastqs.csv


 # Export the FASTQ details of the 3 exome sequencing (WXS) datasets to
 # wxs_fastqs.csv.
 # Note this endpoint is not documented, but it exists (sorry)
 #
 # Each CSV row holds: hex_id, then the fastq_ftp value of every .data entry,
 # then the fastq_md5 value of every .data entry, then one size per
 # ";"-separated item of fastq_bytes, divided by 1024^3 (i.e. GiB, presuming the
 # field really is a byte count - confirm against the API).
 #
 # --fail makes curl exit non-zero on an HTTP error instead of piping the error
 # body into jq; --silent/--show-error hide the progress meter but keep error
 # messages. GET is curl's default method, so no -X is needed.
 curl --fail --silent --show-error \
   -H "accept: application/json" \
   "https://www.personalgenomes.org.uk/api/v1.2/all_wxs" \
   | jq -r '
 .[] | [
        .hex_id,
        (.data[]?.fastq_ftp),
        (.data[]?.fastq_md5),
        (.data[]?.fastq_bytes | split(";") | .[] | tonumber | . /1024/1024/1024)
 ] | flatten | @csv' > wxs_fastqs.csv

 # Note: in the jq filters above you can also split the fastq_ftp and fastq_md5
 # fields on ";" (the filters' trailing `flatten` then spreads the pieces over
 # separate columns) by swapping in the two lines below. They are jq, not
 # shell, so they are kept as comments here:
 #        (.data[]?.fastq_ftp | split(";")),
 #        (.data[]?.fastq_md5 | split(";")),
	# Export the FASTQ details of every whole-genome (WGS) record to wgs_fastqs.csv.
	# Uses jq (https://stedolan.github.io/jq/) and
	# the PGP API v1.2 - https://www.personalgenomes.org.uk/api/v1.2/
	#
	# Each CSV row holds: hex_id, then the fastq_ftp value of every .data entry,
	# then the fastq_md5 value of every .data entry, then one size per
	# ";"-separated item of fastq_bytes, divided by 1024^3 (i.e. GiB, presuming the
	# field really is a byte count - confirm against the API).
	#
	# Note: the rows are ragged. fastq_bytes is split per file while fastq_ftp and
	# fastq_md5 are not, and some records have three fastq files, so the CSV
	# columns do not fully line up between records.
	#
	# --fail makes curl exit non-zero on an HTTP error instead of piping the error
	# body into jq; --silent/--show-error hide the progress meter but keep error
	# messages. GET is curl's default method, so no -X is needed.
	curl --fail --silent --show-error \
	  -H "accept: application/json" \
	  "https://www.personalgenomes.org.uk/api/v1.2/all_wgs" \
	  | jq -r '
	.[] | [
	.hex_id,
	(.data[]?.fastq_ftp),
	(.data[]?.fastq_md5),
	(.data[]?.fastq_bytes | split(";") | .[] | tonumber | . /1024/1024/1024)
	] | flatten | @csv' > wgs_fastqs.csv


	# Export the FASTQ details of the 3 exome sequencing (WXS) datasets to
	# wxs_fastqs.csv.
	# Note this endpoint is not documented, but it exists (sorry)
	#
	# Each CSV row holds: hex_id, then the fastq_ftp value of every .data entry,
	# then the fastq_md5 value of every .data entry, then one size per
	# ";"-separated item of fastq_bytes, divided by 1024^3 (i.e. GiB, presuming the
	# field really is a byte count - confirm against the API).
	#
	# --fail makes curl exit non-zero on an HTTP error instead of piping the error
	# body into jq; --silent/--show-error hide the progress meter but keep error
	# messages. GET is curl's default method, so no -X is needed.
	curl --fail --silent --show-error \
	  -H "accept: application/json" \
	  "https://www.personalgenomes.org.uk/api/v1.2/all_wxs" \
	  | jq -r '
	.[] | [
	.hex_id,
	(.data[]?.fastq_ftp),
	(.data[]?.fastq_md5),
	(.data[]?.fastq_bytes | split(";") | .[] | tonumber | . /1024/1024/1024)
	] | flatten | @csv' > wxs_fastqs.csv

	# Note: in the jq filters above you can also split the fastq_ftp and fastq_md5
	# fields on ";" (the filters' trailing `flatten` then spreads the pieces over
	# separate columns) by swapping in the two lines below. They are jq, not
	# shell, so they are kept as comments here:
	#        (.data[]?.fastq_ftp | split(";")),
	#        (.data[]?.fastq_md5 | split(";")),