<?xml version="1.0" encoding="UTF-8"?>
<feed xmlns="http://www.w3.org/2005/Atom" xml:lang="en">
	<id>https://pwiki.pic.es/index.php?action=history&amp;feed=atom&amp;title=QSOs</id>
	<title>QSOs - Revision history</title>
	<link rel="self" type="application/atom+xml" href="https://pwiki.pic.es/index.php?action=history&amp;feed=atom&amp;title=QSOs"/>
	<link rel="alternate" type="text/html" href="https://pwiki.pic.es/index.php?title=QSOs&amp;action=history"/>
	<updated>2026-04-20T15:05:28Z</updated>
	<subtitle>Revision history for this page on the wiki</subtitle>
	<generator>MediaWiki 1.35.14</generator>
	<entry>
		<id>https://pwiki.pic.es/index.php?title=QSOs&amp;diff=835&amp;oldid=prev</id>
		<title>Jcarrete: Created page with &quot;The Primeval Universe working group, led by Jean-Gabriel Cubi, sent us an email with information (email's subject: SC8 PUWG simulations: quasars) They wrote an entry in the Eu...&quot;</title>
		<link rel="alternate" type="text/html" href="https://pwiki.pic.es/index.php?title=QSOs&amp;diff=835&amp;oldid=prev"/>
		<updated>2020-07-27T09:43:47Z</updated>

		<summary type="html">&lt;p&gt;Created page with &amp;quot;The Primeval Universe working group, led by Jean-Gabriel Cubi, sent us an email with information (email&amp;#039;s subject: SC8 PUWG simulations: quasars) They wrote an entry in the Eu...&amp;quot;&lt;/p&gt;
&lt;p&gt;&lt;b&gt;New page&lt;/b&gt;&lt;/p&gt;&lt;div&gt;The Primeval Universe working group, led by Jean-Gabriel Cubi, sent us an email with information (email's subject: SC8 PUWG simulations: quasars)&lt;br /&gt;
They wrote an entry in the Euclid Redmine: https://euclid.roe.ac.uk/projects/puswg/wiki/Quasars/&lt;br /&gt;
&lt;br /&gt;
There is a txt file that we &amp;quot;convert&amp;quot; and ingest into CosmoHub.&lt;br /&gt;
&lt;br /&gt;
(I think) we convert it into parquet:&lt;br /&gt;
&lt;br /&gt;
    CREATE EXTERNAL TABLE `full_h25cut_hcol`(&lt;br /&gt;
  `type` string, &lt;br /&gt;
  `z` float, &lt;br /&gt;
  `m1450` float, &lt;br /&gt;
  `template` string, &lt;br /&gt;
  `h` float, &lt;br /&gt;
  `id` bigint)&lt;br /&gt;
    ROW FORMAT SERDE &lt;br /&gt;
  'org.apache.hadoop.hive.ql.io.parquet.serde.ParquetHiveSerDe' &lt;br /&gt;
    STORED AS INPUTFORMAT &lt;br /&gt;
  'org.apache.hadoop.hive.ql.io.parquet.MapredParquetInputFormat' &lt;br /&gt;
    OUTPUTFORMAT &lt;br /&gt;
  'org.apache.hadoop.hive.ql.io.parquet.MapredParquetOutputFormat'&lt;br /&gt;
    LOCATION&lt;br /&gt;
  'hdfs://AntNest/user/tallada/data/euclid/full_H25cut_Hcol'&lt;br /&gt;
    ;&lt;br /&gt;
&lt;br /&gt;
Then the clustered table in cosmohub:&lt;br /&gt;
&lt;br /&gt;
    CREATE TABLE full_H25cut_Hcol_v1_0_c(&lt;br /&gt;
    `id` bigint COMMENT 'ID',&lt;br /&gt;
    `type` string COMMENT 'type (QSO for all objects)',&lt;br /&gt;
    `z` float COMMENT 'redshift (z). Redshifts are in the range [6-15]',&lt;br /&gt;
    `m1450` float COMMENT 'absolute magnitude at 1450 angstroms (M1450)',&lt;br /&gt;
    `template` string COMMENT 'spectral template name (among 21)',&lt;br /&gt;
    `h` float COMMENT 'approximate H-band magnitude for information only. This was computed for applying the magnitude cut'&lt;br /&gt;
    )&lt;br /&gt;
    CLUSTERED BY (&lt;br /&gt;
    id&lt;br /&gt;
    )&lt;br /&gt;
    SORTED BY ( &lt;br /&gt;
    id ASC&lt;br /&gt;
    ) &lt;br /&gt;
    INTO 4 BUCKETS&lt;br /&gt;
    ROW FORMAT SERDE&lt;br /&gt;
    'org.apache.hadoop.hive.ql.io.orc.OrcSerde'&lt;br /&gt;
    STORED AS INPUTFORMAT&lt;br /&gt;
    'org.apache.hadoop.hive.ql.io.orc.OrcInputFormat'&lt;br /&gt;
    OUTPUTFORMAT&lt;br /&gt;
    'org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat'&lt;br /&gt;
    ;&lt;br /&gt;
&lt;br /&gt;
    INSERT OVERWRITE TABLE cosmohub.full_H25cut_Hcol_v1_0_c&lt;br /&gt;
    SELECT `id`, `type`, `z`,`m1450`, `template`, `h`&lt;br /&gt;
    FROM tallada.full_H25cut_Hcol;  &lt;br /&gt;
&lt;br /&gt;
    ANALYZE TABLE cosmohub.full_H25cut_Hcol_v1_0_c COMPUTE STATISTICS FOR COLUMNS;&lt;br /&gt;
&lt;br /&gt;
I decided to add an integer field for the spectral template alongside the string field, in order to use it in CosmoHub and maybe for the mock algorithm:&lt;br /&gt;
&lt;br /&gt;
    CREATE TABLE full_H25cut_Hcol_v1_1_c(&lt;br /&gt;
    `id` bigint COMMENT 'ID',&lt;br /&gt;
    `type` string COMMENT 'type (QSO for all objects)',&lt;br /&gt;
    `z` float COMMENT 'redshift (z). Redshifts are in the range [6-15]',&lt;br /&gt;
    `m1450` float COMMENT 'absolute magnitude at 1450 angstroms (M1450)',&lt;br /&gt;
    `template` string COMMENT 'spectral template name (among 21)',&lt;br /&gt;
    `template_int` int COMMENT 'spectral template as integer (from 0 to 20)',&lt;br /&gt;
    `h` float COMMENT 'approximate H-band magnitude for information only. This was computed for applying the magnitude cut'&lt;br /&gt;
    )&lt;br /&gt;
    CLUSTERED BY (&lt;br /&gt;
    id&lt;br /&gt;
    )&lt;br /&gt;
    SORTED BY ( &lt;br /&gt;
    id ASC&lt;br /&gt;
    ) &lt;br /&gt;
    INTO 4 BUCKETS&lt;br /&gt;
    ROW FORMAT SERDE&lt;br /&gt;
    'org.apache.hadoop.hive.ql.io.orc.OrcSerde'&lt;br /&gt;
    STORED AS INPUTFORMAT&lt;br /&gt;
    'org.apache.hadoop.hive.ql.io.orc.OrcInputFormat'&lt;br /&gt;
    OUTPUTFORMAT&lt;br /&gt;
    'org.apache.hadoop.hive.ql.io.orc.OrcOutputFormat'&lt;br /&gt;
    ;&lt;br /&gt;
&lt;br /&gt;
&lt;br /&gt;
    INSERT OVERWRITE TABLE cosmohub.full_H25cut_Hcol_v1_1_c&lt;br /&gt;
    SELECT `id`, `type`, `z`,`m1450`, `template`,&lt;br /&gt;
    CASE WHEN template = 'Banados_avg_Harris' THEN 0 &lt;br /&gt;
     WHEN template = 'Banados_avg_Selsing' THEN 1&lt;br /&gt;
     WHEN template = 'Banados_avg_Vandenberk' THEN 2&lt;br /&gt;
     WHEN template = 'Banados_hlya_Harris' THEN 3&lt;br /&gt;
     WHEN template = 'Banados_hlya_Selsing' THEN 4&lt;br /&gt;
     WHEN template = 'Banados_hlya_Vandenberk' THEN 5&lt;br /&gt;
     WHEN template = 'Banados_llya_Harris' THEN 6&lt;br /&gt;
     WHEN template = 'Banados_llya_Selsing' THEN 7&lt;br /&gt;
     WHEN template = 'Banados_llya_Vandenberk' THEN 8&lt;br /&gt;
     WHEN template = 'Hewett_l0_cb' THEN 9&lt;br /&gt;
     WHEN template = 'Hewett_l0_cr' THEN 10&lt;br /&gt;
     WHEN template = 'Hewett_l0_cs' THEN 11&lt;br /&gt;
     WHEN template = 'Hewett_ld_cb' THEN 12&lt;br /&gt;
     WHEN template = 'Hewett_ld_cr' THEN 13&lt;br /&gt;
     WHEN template = 'Hewett_ld_cs' THEN 14&lt;br /&gt;
     WHEN template = 'Hewett_lh_cb' THEN 15&lt;br /&gt;
     WHEN template = 'Hewett_lh_cr' THEN 16&lt;br /&gt;
     WHEN template = 'Hewett_lh_cs' THEN 17&lt;br /&gt;
     WHEN template = 'Hewett_ls_cb' THEN 18&lt;br /&gt;
     WHEN template = 'Hewett_ls_cr' THEN 19&lt;br /&gt;
     WHEN template = 'Hewett_ls_cs' THEN 20&lt;br /&gt;
    END as template_int,&lt;br /&gt;
    `h`&lt;br /&gt;
    FROM tallada.full_H25cut_Hcol;  &lt;br /&gt;
&lt;br /&gt;
    ANALYZE TABLE cosmohub.full_H25cut_Hcol_v1_1_c COMPUTE STATISTICS FOR COLUMNS;&lt;/div&gt;</summary>
		<author><name>Jcarrete</name></author>
	</entry>
</feed>