<!-- 
RSS generated by JIRA (8.3.4#803005-sha1:1f96e09b3c60279a408a2ae47be3c745f571388b) at Sat Feb 10 15:33:36 JST 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>PFS-JIRA</title>
    <link>https://pfspipe.ipmu.jp/jira</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>8.3.4</version>
        <build-number>803005</build-number>
        <build-date>13-09-2019</build-date>
    </build-info>


<item>
            <title>[DAMD-40] Define relative locations of the 1d + 2d pipeline outputs</title>
                <link>https://pfspipe.ipmu.jp/jira/browse/DAMD-40</link>
                <project id="10400" key="DAMD">Data Model</project>
                    <description>&lt;p&gt;The outputs from the 2d pipeline have to be passed to the 1d pipelines.&#160; For this, the relative locations of the pipeline outputs have to be defined.&#160; A few constraints:&lt;/p&gt;
&lt;ul&gt;
	&lt;li&gt;outputs should be in a rerun directory&lt;/li&gt;
	&lt;li&gt;there will be multiple 1d reruns based on a single 2d rerun (e.g., run lam1d multiple times tweaking params on a single set of data processed by 2d)&lt;/li&gt;
&lt;/ul&gt;


&lt;p&gt;There may be other constraints we need to consider.&lt;/p&gt;</description>
                <environment></environment>
        <key id="13231">DAMD-40</key>
            <summary>Define relative locations of the 1d + 2d pipeline outputs</summary>
                <type id="10001" iconUrl="https://pfspipe.ipmu.jp/jira/secure/viewavatar?size=xsmall&amp;avatarId=10515&amp;avatarType=issuetype">Story</type>
                                            <priority id="10000" iconUrl="https://pfspipe.ipmu.jp/jira/images/icons/priorities/medium.svg">Normal</priority>
                        <status id="10002" iconUrl="https://pfspipe.ipmu.jp/jira/images/icons/statuses/generic.png" description="The issue is resolved, reviewed, and merged">Done</status>
                    <statusCategory id="3" key="done" colorName="green"/>
                                    <resolution id="10000">Done</resolution>
                                        <assignee username="-1">Unassigned</assignee>
                                    <reporter username="msyktnk">Masayuki Tanaka</reporter>
                        <labels>
                    </labels>
                <created>Fri, 11 Jan 2019 03:58:55 +0000</created>
                <updated>Tue, 15 Sep 2020 06:52:28 +0000</updated>
                            <resolved>Tue, 15 Sep 2020 06:52:28 +0000</resolved>
                                                                        <due></due>
                            <votes>0</votes>
                                    <watches>8</watches>
                                                                <comments>
                            <comment id="14761" author="msyktnk" created="Fri, 11 Jan 2019 04:07:45 +0000"  >&lt;p&gt;I first thought that all the 1d outputs can be under a 2d rerun directory, something like this:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;2d/
&#9500;&#9472;&#9472; BIAS
&#9500;&#9472;&#9472; CALIB
&#9500;&#9472;&#9472; DARK
&#9500;&#9472;&#9472; FLAT
&#9500;&#9472;&#9472; OTHER_STUFF
&#9492;&#9472;&#9472; rerun
&#160;&#160;&#160;&#160;&#160;&#160; &#9500;&#9472;&#9472; dr1
&#160;&#160;&#160;&#160;&#160;&#160; &#9500;&#9472;&#9472; dr2
&#160;&#160;&#160;&#160;&#160;&#160; &#9492;&#9472;&#9472; dr3
&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160; &#9500;&#9472;&#9472; ga1d
&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160; &#9474;&#160;&#160;&#160;&#160; &#9500;&#9472;&#9472; STUFF
&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160; &#9474;&#160;&#160;&#160;&#160; &#9492;&#9472;&#9472; rerun
&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160; &#9474;&#160; &#160; &#160; &#160; &#160; &#160;&#160; &#9500;&#9472;&#9472; test1
&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160; &#9474; &#160; &#160; &#160; &#160; &#160; &#160; &#9492;&#9472;&#9472; test2
&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160; &#9492;&#9472;&#9472; lam1d
&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160; &#9500;&#9472;&#9472; STUFF
&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160; &#9492;&#9472;&#9472; rerun
&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160; &#9500;&#9472;&#9472; test1
&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160; &#9492;&#9472;&#9472; test2&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;But, this may require having 1d repos for each 2d rerun.&#160; Perhaps not a good idea.&#160; Another naive thinking is:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;./
&#9500;&#9472;&#9472; 2d
&#9474;&#160; &#160;&#160; &#9500;&#9472;&#9472; BIAS
&#9474;&#160; &#160;&#160; &#9500;&#9472;&#9472; CALIB
&#9474;&#160; &#160;&#160; &#9500;&#9472;&#9472; DARK
&#9474;&#160; &#160;&#160; &#9500;&#9472;&#9472; FLAT
&#9474;&#160; &#160;&#160; &#9500;&#9472;&#9472; OTHER_STUFF
&#9474; &#160; &#160; &#9492;&#9472;&#9472; rerun
&#9474;&#160;&#160;&#160;      &#160; &#9500;&#9472;&#9472; dr1
&#9474;&#160;&#160;&#160;&#160;       &#9500;&#9472;&#9472; dr2
&#9474;&#160;&#160;&#160;&#160;       &#9492;&#9472;&#9472; dr3
&#9500;&#9472;&#9472; ga1d
&#9474;&#160;&#160;&#160;&#160; &#9500;&#9472;&#9472; STUFF
&#9474;&#160; &#160;&#160; &#9492;&#9472;&#9472; rerun
&#9474;&#160; &#160; &#160; &#160; &#160; &#160;&#160; &#9500;&#9472;&#9472; dr3_test1
&#9474;&#160; &#160; &#160; &#160; &#160; &#160;&#160; &#9492;&#9472;&#9472; dr3_test2
&#9492;&#9472;&#9472; lam1d
&#160;&#160;&#160;&#160;&#160;&#160;&#160; &#9500;&#9472;&#9472; STUFF
&#160;&#160;&#160;&#160;&#160;&#160;&#160; &#9492;&#9472;&#9472; rerun
&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160; &#9500;&#9472;&#9472; dr3_test1
&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160; &#9492;&#9472;&#9472; dr3_test2&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;For this, we need a mapping between the 2d and 1d reruns.&#160; One way to do it is to have 1d rerun name as &quot;2d_rerun_name&quot;_&quot;your_string&quot;.&#160;&#160; In the above example, &quot;dr3_test1&quot; is based on the &quot;dr3&quot; rerun from 2d.&lt;/p&gt;

&lt;p&gt;There are probably other (and better) options.&lt;/p&gt;

&lt;p&gt;&#160;&lt;/p&gt;</comment>
                            <comment id="14975" author="rhl" created="Fri, 15 Feb 2019 21:16:29 +0000"  >&lt;p&gt;Sorry, this got lost.  I have no problem with defining the layout of the outputs here, but they should merely be documenting the implementation in the butler templates (for 2-D).&lt;/p&gt;

&lt;p&gt;In particular, this means that the reruns and calibrations should probably be laid out a bit differently. Is this urgent?&lt;/p&gt;</comment>
                            <comment id="14980" author="msyktnk" created="Mon, 18 Feb 2019 06:49:13 +0000"  >&lt;p&gt;No, this is not urgent.&#160; We will probably implement one of the above in the prototype database v2, but we do not have real 2d outputs there (only simulated psfObject files) and the directory structure will be different anyway.&lt;/p&gt;</comment>
                            <comment id="17017" author="msyktnk" created="Mon, 13 Apr 2020 05:39:10 +0000"  >&lt;p&gt;&lt;tt&gt;&lt;a href=&quot;https://pfspipe.ipmu.jp/jira/secure/ViewProfile.jspa?name=sogo.mineo&quot; class=&quot;user-hover&quot; rel=&quot;sogo.mineo&quot;&gt;sogo.mineo&lt;/a&gt; suggested that this is also a possible option:&lt;/tt&gt;&lt;/p&gt;
&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;
ROOT
 +-- BIAS
 +-- CALIB
 : :
 + 1DSTUFF
 +-- rerun
     +-- 2d/dr1
     +-- 2d/dr2
     +-- 2d/dr3
     +-- gal1d/dr3_test1
     +-- gal1d/dr3_test2
     +-- lam1d/dr3_test1
     +-- lam1d/dr3_test2&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;Do we prefer to have different root for 2d and 1d pipelines?&lt;/p&gt;</comment>
                            <comment id="17027" author="hassan" created="Mon, 13 Apr 2020 23:48:14 +0000"  >&lt;p&gt;Need a definitive agreement in the next 3 weeks.&lt;/p&gt;</comment>
                            <comment id="17029" author="hassan" created="Tue, 14 Apr 2020 00:44:38 +0000"  >&lt;p&gt;Once an agreement has been made, a document capturing that agreement will be prepared and uploaded to PbWorks. Hassan will take that action.&lt;/p&gt;</comment>
                            <comment id="17131" author="rhl" created="Mon, 11 May 2020 23:42:47 +0000"  >&lt;p&gt;I really don&apos;t care much, but I don&apos;t understand the examples &amp;#8211; what is &lt;tt&gt;BIAS&lt;/tt&gt;, for example?  &lt;/p&gt;

&lt;p&gt;The reruns need to be under ROOT, at least via a symbolic link, so that you can point the butler at e.g. &lt;tt&gt;ROOT/rerun/drp2&lt;/tt&gt; or &lt;tt&gt;ROOT/rerun/rhl/foo&lt;/tt&gt;.  I don&apos;t know how 1-D will handle reruns, but I&apos;d expect them to be able to process any 2-D rerun, including all the book-keeping so we know what we did.  Ideally this would be transparent (as is true on the 2-D side), but this is independent of the logical layout.&lt;/p&gt;

&lt;p&gt;Until we understand how 1-D will handle reprocessing it&apos;s hard to take a decision.&lt;/p&gt;</comment>
                            <comment id="17134" author="msyktnk" created="Tue, 12 May 2020 08:58:11 +0000"  >&lt;p&gt;If you ingest new data, you&apos;ll have directories $(OBJECT) under your root directory.&#160; That is what BIAS etc meant.&#160; Anyway, that is not very important.&#160; Here is how you run the 1d pipeline:&lt;br/&gt;
&lt;a href=&quot;https://github.com/Subaru-PFS/drp_1dpipe/blob/master/MANUAL.md&quot; class=&quot;external-link&quot; rel=&quot;nofollow&quot;&gt;https://github.com/Subaru-PFS/drp_1dpipe/blob/master/MANUAL.md&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;It looks like you will have to tell the pipeline where your spectra are with respect to the root directory.&#160; I am not sure if you have any control on the output directory (it does not look like it).&#160; We could ask the LAM team to handle reruns.&#160; Another option might be to ask Mineo-kun to somehow handle 1d and 2d reruns internally in his code.&#160; I&apos;d prefer the former because we want to have a good level of transparency at the rerun level.&lt;/p&gt;</comment>
                            <comment id="17420" author="pychabau" created="Thu, 2 Jul 2020 14:09:53 +0000"  >&lt;p&gt;The relative locations of the input (where the 2D outputs are stored) and output (where the DRP-1D data products are stored) directories are command-line parameters of the pipeline (--spectra_dir and --output_dir), and default values can be adapted as a function of implementation (e.g. the output directory can be named from the input one with a time_stamp). Thus you can produce as many reruns of a given input catalog as wanted.&lt;br/&gt;
&#160;&lt;br/&gt;
A question came to us from this ticket : does that mean that there will be 2 implementations of the DRP-1D : one for the on-the-fly reduction that will run automatically with a fixed configuration, and a second one related to the science database that will be used for rerun in different configurations ?&lt;/p&gt;</comment>
                            <comment id="17422" author="msyktnk" created="Fri, 3 Jul 2020 08:24:30 +0000"  >&lt;p&gt;Thank you!&#160; The ability to specify input/output directories is exactly what we want for our purpose.&#160; I am going to educate myself on how to run the 1d pipeline a little further.&lt;/p&gt;

&lt;p&gt;I am not sure if we are going to run the 1d pipeline at the summit (with different config).&#160; But, we may change the config and rerun the pipeline for testing purposes or whatever reason and that is what &apos;rerun&apos; is for.&lt;/p&gt;</comment>
                            <comment id="17586" author="msyktnk" created="Tue, 25 Aug 2020 01:47:08 +0000"  >&lt;p&gt;I&apos;ve run the LAM 1d pipeline on ~60k simulated PFS spectra.&#160; I think any of the options discussed on this ticket will work.&#160; HSC has about 80 reruns for SSP production so far (there should be more for testing purposes), and if I think about &amp;gt;10 years of PFS operations, I would suggest that we have separate root directories for 2ddrp, lam1d, (and probably ga1d as well, although I do not know yet what the ga1d output looks like).&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;./
&#9500;&#9472;&#9472; 2d
&#9474;    &#9500;&#9472;&#9472; BIAS
&#9474;    &#9500;&#9472;&#9472; CALIB
&#9474;    &#9500;&#9472;&#9472; DARK
&#9474;    &#9500;&#9472;&#9472; FLAT
&#9474;    &#9500;&#9472;&#9472; OTHER_STUFF
&#9474;    &#9492;&#9472;&#9472; rerun
&#9474;          &#9500;&#9472;&#9472; dr1
&#9474;          &#9500;&#9472;&#9472; dr2
&#9474;          &#9492;&#9472;&#9472; dr3
&#9500;&#9472;&#9472; ga1d
&#9474;    &#9500;&#9472;&#9472; STUFF
&#9474;    &#9492;&#9472;&#9472; rerun
&#9474;          &#9500;&#9472;&#9472; dr3_test1
&#9474;          &#9492;&#9472;&#9472; dr3_test2
&#9492;&#9472;&#9472; lam1d
      &#9500;&#9472;&#9472; STUFF
      &#9492;&#9472;&#9472; rerun
            &#9500;&#9472;&#9472; dr3_test1
            &#9492;&#9472;&#9472; dr3_test2&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;The 1d rerun names should inherit the 2d rerun name to make the relationship clear.&lt;/p&gt;</comment>
                            <comment id="17666" author="rhl" created="Fri, 11 Sep 2020 14:06:44 +0000"  >&lt;p&gt;This is fine, except that I&apos;m not sure what you mean by CALIB. The 2d pipeline has one CALIB directory which contains the biases, flats, fiberTraces, etc. The &lt;b&gt;raw&lt;/b&gt; biases etc. are in the same place as all the other raw data, so it&apos;s more like:&lt;/p&gt;


&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;./
+-- 2d 
|    +-- raw
|    |   +-- data
|    +-- CALIB
|    |   +-- BIAS 
|    |   +-- DARK
|    |   +-- FLAT
|    |   +-- FIBER_TRACE
|    |   +-- OTHER_STUFF
|    +-- rerun
|         +-- rhl
|         |   +-- test1
|         +-- dr1
|         +-- dr2
|         +-- dr3
+-- ga1d
|    +-- STUFF
|    +-- rerun
|         +-- dr3_test1
|         +-- dr3_test2
+-- lam1d
     +-- STUFF
     +-- rerun
          +-- dr3_test1
          +-- dr3_test2&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;Except that I&apos;d expect that we&apos;d need some new CALIBs for every rerun (because the algorithms to build e.g. fibre traces and arc solutions will change, and I have no idea how much smarter we&apos;ll get with the H4RGs), so I&apos;d put a CALIB in each rerun (and probably symbolic link it to the top level, but that&apos;s a real detail).&lt;/p&gt;

&lt;p&gt;On the 2-D side the reruns logically include the raw data, but the butler handles that so it&apos;s not visible to the file system.&lt;/p&gt;</comment>
                            <comment id="17705" author="msyktnk" created="Tue, 15 Sep 2020 06:52:28 +0000"  >&lt;p&gt;Thank you for the useful comment!&#160; This ticket is about relative locations of the 2d and 1d outputs, and I think we can safely close it now.&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10003">
                    <name>Relates</name>
                                            <outwardlinks description="relates to">
                                        <issuelink>
            <issuekey id="14642">SCIDB-98</issuekey>
        </issuelink>
                            </outwardlinks>
                                                        </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                            <customfield id="customfield_10500" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                            <customfield id="customfield_10010" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>0|s0020g:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>