pytti-tools
diff --git a/‎src/pytti/ImageGuide.py‎
Lines changed: 31 additions & 282 deletions b/‎src/pytti/ImageGuide.py‎
Lines changed: 31 additions & 282 deletions
@@ -77,13 +77,13 @@ def __init__(
         embedder: nn.Module,
         optimizer: optim.Optimizer = None,
         lr: float = None,
-        null_update=True,
+        # null_update=True,
         params=None,
         writer=None,
-        OUTPATH=None,
-        base_name=None,
         fig=None,
         axs=None,
+        base_name=None,
+        OUTPATH=None,  # <<<<<<<<<<<<<<
         #####################
         video_frames=None,  # # only need this to pass to animate_video_source
         optical_flows=None,
@@ -108,7 +108,7 @@ def __init__(
             self.optimizer = optimizer
         self.dataframe = []
 
-        self.null_update = null_update
+        # self.null_update = null_update
         self.params = params
         self.writer = writer
         self.OUTPATH = OUTPATH
@@ -117,13 +117,13 @@ def __init__(
         self.axs = axs
         self.video_frames = video_frames
         self.optical_flows = optical_flows
-        if stabilization_augs is None:
-            stabilization_augs = []
+        # if stabilization_augs is None:
+        #    stabilization_augs = []
         self.stabilization_augs = stabilization_augs
         self.last_frame_semantic = last_frame_semantic
         self.semantic_init_prompt = semantic_init_prompt
-        if init_augs is None:
-            init_augs = []
+        # if init_augs is None:
+        #    init_augs = []
         self.init_augs = init_augs
 
     def run_steps(
@@ -152,8 +152,26 @@ def run_steps(
             #        and here we can check if the DirectImageGuide was
             #        initialized with a renderer or not, and call self.renderer.update()
             #        if appropriate
-            if not self.null_update:
-                self.update(i + i_offset, i + skipped_steps)
+            # if not self.null_update:
+            #    self.update(i + i_offset, i + skipped_steps)
+            self.update(
+                model=self,
+                img=self.image_rep,
+                i=i + i_offset,
+                stage_i=i + skipped_steps,
+                params=self.params,
+                writer=self.writer,
+                fig=self.fig,
+                axs=self.axs,
+                base_name=self.base_name,
+                optical_flows=self.optical_flows,
+                video_frames=self.video_frames,
+                stabilization_augs=self.stabilization_augs,
+                last_frame_semantic=self.last_frame_semantic,
+                embedder=self.embedder,
+                init_augs=self.init_augs,
+                semantic_init_prompt=self.semantic_init_prompt,
+            )
             losses = self.train(
                 i + skipped_steps,
                 prompts,
@@ -343,277 +361,8 @@ def train(
 
         return {"TOTAL": float(total_loss)}
 
-    def report_out(
-        self,
-        i,
-        stage_i,
-        # model,
-        writer,
-        fig,  # default to None...
-        axs,  # default to None...
-        clear_every,
-        display_every,
-        approximate_vram_usage,
-        display_scale,
-        show_graphs,
-        show_palette,
-    ):
-        model = self
-        img = self.image_rep  # pretty sure this is right
-        # DM: I bet this could be abstracted out into a report_out() function or whatever
-        if clear_every > 0 and i > 0 and i % clear_every == 0:
-            display.clear_output()
-
-        if display_every > 0 and i % display_every == 0:
-            logger.debug(f"Step {i} losses:")
-            if model.dataframe:
-                rec = model.dataframe[0].iloc[-1]
-                logger.debug(rec)
-                if writer is not None:
-                    for k, v in rec.iteritems():
-                        writer.add_scalar(
-                            tag=f"losses/{k}", scalar_value=v, global_step=i
-                        )
-
-            # does this VRAM stuff even do anything?
-            if approximate_vram_usage:
-                logger.debug("VRAM Usage:")
-                print_vram_usage()  # update this function to use logger
-            # update this stuff to use/rely on tensorboard
-            display_width = int(img.image_shape[0] * display_scale)
-            display_height = int(img.image_shape[1] * display_scale)
-            if stage_i > 0 and show_graphs:
-                model.plot_losses(axs)
-                im = img.decode_image()
-                sidebyside = make_hbox(
-                    im.resize((display_width, display_height), Image.LANCZOS),
-                    fig,
-                )
-                display.display(sidebyside)
-            else:
-                im = img.decode_image()
-                display.display(
-                    im.resize((display_width, display_height), Image.LANCZOS)
-                )
-            logger.debug(PixelImage)
-            logger.debug(type(PixelImage))
-            if show_palette and isinstance(img, PixelImage):
-                logger.debug("Palette:")
-                display.display(img.render_pallet())
-
-    def save_out(
-        self,
-        i,
-        # img,
-        writer,
-        OUTPATH,
-        base_name,
-        save_every,
-        file_namespace,
-        backups,
-    ):
-        img = self.image_rep
-        # save
-        # if i > 0 and save_every > 0 and i % save_every == 0:
-        if i > 0 and save_every > 0 and (i + 1) % save_every == 0:
-            im = (
-                img.decode_image()
-            )  # let's turn this into a property so decoding is cheap
-            # n = i // save_every
-            n = (i + 1) // save_every
-            filename = f"{OUTPATH}/{file_namespace}/{base_name}_{n}.png"
-            logger.debug(filename)
-            im.save(filename)
-
-            im_np = np.array(im)
-            if writer is not None:
-                writer.add_image(
-                    tag="pytti output",
-                    # img_tensor=filename, # thought this would work?
-                    img_tensor=im_np,
-                    global_step=i,
-                    dataformats="HWC",  # this was the key
-                )
-
-            if backups > 0:
-                filename = f"backup/{file_namespace}/{base_name}_{n}.bak"
-                torch.save(img.state_dict(), filename)
-                if n > backups:
-
-                    # YOOOOOOO let's not start shell processes unnecessarily
-                    # and then execute commands using string interpolation.
-                    # Replace this with a pythonic folder removal, then see
-                    # if we can't deprecate the folder removal entirely. What
-                    # is the purpose of "backups" here? Just use the frames that
-                    # are being written to disk.
-                    subprocess.run(
-                        [
-                            "rm",
-                            f"backup/{file_namespace}/{base_name}_{n-backups}.bak",
-                        ]
-                    )
-
-    def update(
-        self,
-        # params,
-        # move to class
-        i,
-        stage_i,
-    ):
+    def update(self, model, img, i, stage_i, *args, **kwargs):
         """
-        Orchestrates animation transformations and reporting
+        update hook called ever step
         """
-        # logger.debug("model.update called")
-
-        # ... I have regrets.
-        params = self.params
-        writer = self.writer
-        OUTPATH = self.OUTPATH
-        base_name = self.base_name
-        fig = self.fig
-        axs = self.axs
-        video_frames = self.video_frames
-        optical_flows = self.optical_flows
-        stabilization_augs = self.stabilization_augs
-        last_frame_semantic = self.last_frame_semantic
-        semantic_init_prompt = self.semantic_init_prompt
-        init_augs = self.init_augs
-
-        model = self
-        img = self.image_rep
-        embedder = self.embedder
-
-        model.report_out(
-            i=i,
-            stage_i=stage_i,
-            # model=model,
-            writer=writer,
-            fig=fig,  # default to None...
-            axs=axs,  # default to None...
-            clear_every=params.clear_every,
-            display_every=params.display_every,
-            approximate_vram_usage=params.approximate_vram_usage,
-            display_scale=params.display_scale,
-            show_graphs=params.show_graphs,
-            show_palette=params.show_palette,
-        )
-
-        model.save_out(
-            i=i,
-            # img=img,
-            writer=writer,
-            OUTPATH=OUTPATH,
-            base_name=base_name,
-            save_every=params.save_every,
-            file_namespace=params.file_namespace,
-            backups=params.backups,
-        )
-
-        # animate
-        ################
-        ## TO DO: attach T as a class attribute
-        t = (i - params.pre_animation_steps) / (
-            params.steps_per_frame * params.frames_per_second
-        )
-        set_t(t)  # this won't need to be a thing with `t`` attached to the class
-        if i >= params.pre_animation_steps:
-            # next_step_pil = None
-            if (i - params.pre_animation_steps) % params.steps_per_frame == 0:
-                logger.debug(f"Time: {t:.4f} seconds")
-                # update_rotoscopers(
-                ROTOSCOPERS.update_rotoscopers(
-                    ((i - params.pre_animation_steps) // params.steps_per_frame + 1)
-                    * params.frame_stride
-                )
-                if params.reset_lr_each_frame:
-                    model.set_optim(None)
-
-                if params.animation_mode == "2D":
-
-                    next_step_pil = animate_2d(
-                        translate_y=params.translate_y,
-                        translate_x=params.translate_x,
-                        rotate_2d=params.rotate_2d,
-                        zoom_x_2d=params.zoom_x_2d,
-                        zoom_y_2d=params.zoom_y_2d,
-                        infill_mode=params.infill_mode,
-                        sampling_mode=params.sampling_mode,
-                        writer=writer,
-                        i=i,
-                        img=img,
-                        t=t,  # just here for logging
-                    )
-
-                    ###########################
-                elif params.animation_mode == "3D":
-                    try:
-                        im
-                    except NameError:
-                        im = img.decode_image()
-                    with vram_usage_mode("Optical Flow Loss"):
-                        # zoom_3d -> rename to animate_3d or transform_3d
-                        flow, next_step_pil = zoom_3d(
-                            img,
-                            (
-                                params.translate_x,
-                                params.translate_y,
-                                params.translate_z_3d,
-                            ),
-                            params.rotate_3d,
-                            params.field_of_view,
-                            params.near_plane,
-                            params.far_plane,
-                            border_mode=params.infill_mode,
-                            sampling_mode=params.sampling_mode,
-                            stabilize=params.lock_camera,
-                        )
-                        freeze_vram_usage()
-
-                    for optical_flow in optical_flows:
-                        optical_flow.set_last_step(im)
-                        optical_flow.set_target_flow(flow)
-                        optical_flow.set_enabled(True)
-
-                elif params.animation_mode == "Video Source":
-
-                    flow_im, next_step_pil = animate_video_source(
-                        i=i,
-                        img=img,
-                        video_frames=video_frames,
-                        optical_flows=optical_flows,
-                        base_name=base_name,
-                        pre_animation_steps=params.pre_animation_steps,
-                        frame_stride=params.frame_stride,
-                        steps_per_frame=params.steps_per_frame,
-                        file_namespace=params.file_namespace,
-                        reencode_each_frame=params.reencode_each_frame,
-                        lock_palette=params.lock_palette,
-                        save_every=params.save_every,
-                        infill_mode=params.infill_mode,
-                        sampling_mode=params.sampling_mode,
-                    )
-
-                if params.animation_mode != "off":
-                    try:
-                        for aug in stabilization_augs:
-                            aug.set_comp(next_step_pil)
-                            aug.set_enabled(True)
-                        if last_frame_semantic is not None:
-                            last_frame_semantic.set_image(embedder, next_step_pil)
-                            last_frame_semantic.set_enabled(True)
-                        for aug in init_augs:
-                            aug.set_enabled(False)
-                        if semantic_init_prompt is not None:
-                            semantic_init_prompt.set_enabled(False)
-                    except UnboundLocalError:
-                        logger.critical(
-                            "\n\n-----< PYTTI-TOOLS > ------"
-                            "If you are seeing this error, it might mean "
-                            "you are using an option that expects you have "
-                            "provided an init_image or video_file.\n\nIf you "
-                            "think you are seeing this message in error, please "
-                            "file an issue here: "
-                            "https://github.com/pytti-tools/pytti-core/issues/new"
-                            "-----< PYTTI-TOOLS > ------\n\n"
-                        )
-                        raise
+        pass