On Mon, 2019-01-07 at 12:02 -0800, Francisco Jerez wrote:
> Iago Toral <ito...@igalia.com> writes:
> 
> > On Sat, 2018-12-29 at 12:39 -0800, Francisco Jerez wrote:
> > > It's redundant with the functionality provided by lower_regioning
> > > now.
> > > ---
> > >  src/intel/Makefile.sources                    |   1 -
> > >  src/intel/compiler/brw_fs.cpp                 |   1 -
> > >  src/intel/compiler/brw_fs.h                   |   1 -
> > > >  .../compiler/brw_fs_lower_conversions.cpp     | 132 ------------------
> > >  src/intel/compiler/meson.build                |   1 -
> > >  5 files changed, 136 deletions(-)
> > > >  delete mode 100644 src/intel/compiler/brw_fs_lower_conversions.cpp
> > > 
> > > diff --git a/src/intel/Makefile.sources
> > > b/src/intel/Makefile.sources
> > > index 6b9874d2b80..fe06a57b42e 100644
> > > --- a/src/intel/Makefile.sources
> > > +++ b/src/intel/Makefile.sources
> > > @@ -62,7 +62,6 @@ COMPILER_FILES = \
> > >   compiler/brw_fs.h \
> > >   compiler/brw_fs_live_variables.cpp \
> > >   compiler/brw_fs_live_variables.h \
> > > - compiler/brw_fs_lower_conversions.cpp \
> > >   compiler/brw_fs_lower_pack.cpp \
> > >   compiler/brw_fs_lower_regioning.cpp \
> > >   compiler/brw_fs_nir.cpp \
> > > diff --git a/src/intel/compiler/brw_fs.cpp
> > > b/src/intel/compiler/brw_fs.cpp
> > > index caa7a798332..d6280d558ec 100644
> > > --- a/src/intel/compiler/brw_fs.cpp
> > > +++ b/src/intel/compiler/brw_fs.cpp
> > > @@ -6472,7 +6472,6 @@ fs_visitor::optimize()
> > >     }
> > >  
> > >     progress = false;
> > > -   OPT(lower_conversions);
> > >     OPT(lower_regioning);
> > >     if (progress) {
> > >        OPT(opt_copy_propagation);
> > 
> > If you didn't do this in the previous patch, then maybe do it here:
> > 
> > if (OPT(lower_regioning)) {
> >    ...
> > }
> > 
> > and avoid resetting progress.
> > 
> 
> I left this lying around because there is another legalization pass
> coming up that should cause the same post-lowering optimization passes
> to be executed if progress is made.  I can clean things up though if
> you like, and re-introduce the reset of the progress flag in the
> future commit.

If we are still going to need it soon, I think it is fine to leave it
like this.

> > > diff --git a/src/intel/compiler/brw_fs.h
> > > b/src/intel/compiler/brw_fs.h
> > > index 36825754931..7edaa3af43c 100644
> > > --- a/src/intel/compiler/brw_fs.h
> > > +++ b/src/intel/compiler/brw_fs.h
> > > @@ -165,7 +165,6 @@ public:
> > >     bool lower_load_payload();
> > >     bool lower_pack();
> > >     bool lower_regioning();
> > > -   bool lower_conversions();
> > >     bool lower_logical_sends();
> > >     bool lower_integer_multiplication();
> > >     bool lower_minmax();
> > > diff --git a/src/intel/compiler/brw_fs_lower_conversions.cpp
> > > b/src/intel/compiler/brw_fs_lower_conversions.cpp
> > > deleted file mode 100644
> > > index 145fb55f995..00000000000
> > > --- a/src/intel/compiler/brw_fs_lower_conversions.cpp
> > > +++ /dev/null
> > > @@ -1,132 +0,0 @@
> > > -/*
> > > - * Copyright © 2015 Connor Abbott
> > > - *
> > > - * Permission is hereby granted, free of charge, to any person
> > > obtaining a
> > > - * copy of this software and associated documentation files (the
> > > "Software"),
> > > - * to deal in the Software without restriction, including
> > > without
> > > limitation
> > > - * the rights to use, copy, modify, merge, publish, distribute,
> > > sublicense,
> > > - * and/or sell copies of the Software, and to permit persons to
> > > whom
> > > the
> > > - * Software is furnished to do so, subject to the following
> > > conditions:
> > > - *
> > > - * The above copyright notice and this permission notice
> > > (including
> > > the next
> > > - * paragraph) shall be included in all copies or substantial
> > > portions of the
> > > - * Software.
> > > - *
> > > - * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY
> > > KIND,
> > > EXPRESS OR
> > > - * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
> > > MERCHANTABILITY,
> > > - * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO
> > > EVENT SHALL
> > > - * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM,
> > > DAMAGES
> > > OR OTHER
> > > - * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
> > > OTHERWISE,
> > > ARISING
> > > - * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
> > > OTHER DEALINGS
> > > - * IN THE SOFTWARE.
> > > - */
> > > -
> > > -#include "brw_fs.h"
> > > -#include "brw_cfg.h"
> > > -#include "brw_fs_builder.h"
> > > -
> > > -using namespace brw;
> > > -
> > > -static bool
> > > -supports_type_conversion(const fs_inst *inst) {
> > > -   switch (inst->opcode) {
> > > -   case BRW_OPCODE_MOV:
> > > -   case SHADER_OPCODE_MOV_INDIRECT:
> > > -      return true;
> > > -   case BRW_OPCODE_SEL:
> > > -      return inst->dst.type == get_exec_type(inst);
> > > -   default:
> > > -      /* FIXME: We assume the opcodes don't explicitly mentioned
> > > -       * before just work fine with arbitrary conversions.
> > > -       */
> > > -      return true;
> > > -   }
> > > -}
> > > -
> > > -/* From the SKL PRM Vol 2a, "Move":
> > > - *
> > > - *    "A mov with the same source and destination type, no
> > > source
> > > modifier,
> > > - *     and no saturation is a raw move. A packed byte
> > > destination
> > > region (B
> > > - *     or UB type with HorzStride == 1 and ExecSize > 1) can
> > > only be
> > > written
> > > - *     using raw move."
> > > - */
> > > -static bool
> > > -is_byte_raw_mov (const fs_inst *inst)
> > > -{
> > > -   return type_sz(inst->dst.type) == 1 &&
> > > -          inst->opcode == BRW_OPCODE_MOV &&
> > > -          inst->src[0].type == inst->dst.type &&
> > > -          !inst->saturate &&
> > > -          !inst->src[0].negate &&
> > > -          !inst->src[0].abs;
> > > -}
> > > -
> > > -bool
> > > -fs_visitor::lower_conversions()
> > > -{
> > > -   bool progress = false;
> > > -
> > > -   foreach_block_and_inst(block, fs_inst, inst, cfg) {
> > > -      const fs_builder ibld(this, block, inst);
> > > -      fs_reg dst = inst->dst;
> > > -      bool saturate = inst->saturate;
> > > -
> > > -      if (supports_type_conversion(inst)) {
> > > -         if (type_sz(inst->dst.type) < get_exec_type_size(inst)
> > > &&
> > > -             !is_byte_raw_mov(inst)) {
> > > -            /* From the Broadwell PRM, 3D Media GPGPU, "Double
> > > Precision Float to
> > > -             * Single Precision Float":
> > > -             *
> > > -             *    The upper Dword of every Qword will be written
> > > with undefined
> > > -             *    value when converting DF to F.
> > > -             *
> > > -             * So we need to allocate a temporary that's two
> > > registers, and then do
> > > -             * a strided MOV to get the lower DWord of every
> > > Qword
> > > that has the
> > > -             * result.
> > > -             *
> > > -             * This restriction applies, in general, whenever we
> > > convert to
> > > -             * a type with a smaller bit-size.
> > > -             */
> > > -            fs_reg temp = ibld.vgrf(get_exec_type(inst));
> > > -            fs_reg strided_temp = subscript(temp, dst.type, 0);
> > > -
> > > > -            assert(inst->size_written == inst->dst.component_size(inst->exec_size));
> > > -            inst->dst = strided_temp;
> > > -            inst->saturate = false;
> > > -            /* As it is an strided destination, we write n-times
> > > more being n the
> > > -             * size ratio between source and destination types.
> > > Update
> > > -             * size_written accordingly.
> > > -             */
> > > > -            inst->size_written = inst->dst.component_size(inst->exec_size);
> > > -
> > > -            fs_inst *mov = ibld.at(block, inst->next).MOV(dst,
> > > strided_temp);
> > > -            mov->saturate = saturate;
> > > -            mov->predicate = inst->predicate;
> > > -
> > > -            progress = true;
> > > -         }
> > > -      } else {
> > > -         fs_reg temp0 = ibld.vgrf(get_exec_type(inst));
> > > -
> > > > -         assert(inst->size_written == inst->dst.component_size(inst->exec_size));
> > > -         inst->dst = temp0;
> > > -         /* As it is an strided destination, we write n-times
> > > more
> > > being n the
> > > -          * size ratio between source and destination types.
> > > Update
> > > -          * size_written accordingly.
> > > -          */
> > > > -         inst->size_written = inst->dst.component_size(inst->exec_size);
> > > -         inst->saturate = false;
> > > -         /* Now, do the conversion to original destination's
> > > type.
> > > In next iteration,
> > > -          * we will lower it if it is a d2f conversion.
> > > -          */
> > > -         ibld.at(block, inst->next).MOV(dst, temp0)->saturate =
> > > saturate;
> > > -
> > > -         progress = true;
> > > -      }
> > > -   }
> > > -
> > > -   if (progress)
> > > -      invalidate_live_intervals();
> > > -
> > > -   return progress;
> > > -}
> > > diff --git a/src/intel/compiler/meson.build
> > > b/src/intel/compiler/meson.build
> > > index 4af134b418e..f8e5e2518fe 100644
> > > --- a/src/intel/compiler/meson.build
> > > +++ b/src/intel/compiler/meson.build
> > > @@ -55,7 +55,6 @@ libintel_compiler_files = files(
> > >    'brw_fs.h',
> > >    'brw_fs_live_variables.cpp',
> > >    'brw_fs_live_variables.h',
> > > -  'brw_fs_lower_conversions.cpp',
> > >    'brw_fs_lower_pack.cpp',
> > >    'brw_fs_lower_regioning.cpp',
> > >    'brw_fs_nir.cpp',

_______________________________________________
mesa-dev mailing list
mesa-dev@lists.freedesktop.org
https://lists.freedesktop.org/mailman/listinfo/mesa-dev

Reply via email to