Akascape / CTkPDFViewer

A simple yet powerfull pdf viewer for customtkinter! (extension/add-on)
MIT License
48 stars 4 forks source link

CTkpdfviewer is taking a lot of memory cuz of ctklabel widget - i give to u a little rework #1

Open MaxNiark opened 1 year ago

MaxNiark commented 1 year ago

hi

i rework some code in your ctkpdfviewer

for some reason, your process create a lot of ctklabel, and don't rly destroy it in memory .. i change this by simple tkinter label. i replace pack by grid, and create a textbox to get the text data. i'll work soon on parser to set a bit the textbox when it's possible with metadata.

configure function is not re-code, and thread disabled cuz i don't undestand how to get one variable dict

also this one is so powerfull, u could make a picture viewer with a same code ;)

"""
CTkPDFViewer is a pdf viewer widget for customtkinter.
Author: Akash Bora
License: MIT
Version 2 Work By MaxNiark
"""

import customtkinter
from tkinter import ttk
from PIL import Image, ImageTk
import fitz as fz
from threading import Thread
import math
import io
import os

class CTkPDFViewer(customtkinter.CTkFrame):

    def __init__(self,
                 master: any,
                 file: str,
                 width: int = 600,
                 height: int = 200,
                 page_width: int = 600,
                 page_height: int = 700,
                 page_separation_height: int = 2,
                 **kwargs):

        super().__init__(master, width=width, height=height,**kwargs)
        print("--------------",self._apply_widget_scaling(self._current_width))
        self._apply_widget_scaling(self._current_width)

        self.width_bouh=50
        def on_window_resize(event):
            width = event.width
            height = event.height

            print(f"Window resized to {width}x{height}")
            if width!=self.width_bouh:
                self.width_bouh=width
               # self.text_box.configure(width=width-950)
          #  SIZE_MAIN=[width,height]
          #  return SIZE_MAIN

        # Bind the resize event to a function
        self.master.bind("<Configure>", on_window_resize)
        self._scrlframe=customtkinter.CTkScrollableFrame(self, width=page_width)
        self._scrlframe.grid(row=0,column=0,sticky="nesw")

        self._scrlframe.grid_columnconfigure(0,weight=1,minsize=200)

        self.text_box=customtkinter.CTkTextbox(self,width=(self._apply_widget_scaling(self._current_width)-page_width))
        self.text_box.grid(row=0, column=1,sticky="nesw")
        self.text_box.grid_columnconfigure(0,weight=1, minsize=120)

        self.page_width = page_width
        self.page_height = page_height
        self.separation = page_separation_height
        self.pdf_images = []
        self.labels = []
        self._text_info=[]
        self._pdf=""

        self._text_info=[]
        self.file = file

        self.percentage_view = 0
        self.percentage_load = customtkinter.StringVar()

        self.loading_message = customtkinter.CTkLabel(self, textvariable=self.percentage_load, justify="center")

        self.loading_bar = customtkinter.CTkProgressBar(self, width=100)
        self.loading_bar.set(0)

        self.grid_columnconfigure((0,1),weight=1, minsize=200)
        self.grid_rowconfigure(0,weight=1, minsize=10)
        self._grid_loading()

    def start_process(self):
       # Thread(target=self._ADD_PAGE(), args=(self._text_info)).start()
        self._ADD_PAGE()
        self._insert_text()
        self._SEARCH()

    def _grid_loading(self):
        self.loading_message.grid(row=0, column=0)
        self.loading_bar.grid(row=0)
        self.after(250, self.start_process)

    def _ADD_PAGE(self)    :

        self.percentage_bar = 0
        pdf = fz.open(self.file)
        count=0
        for page in pdf:
            page_data = page.get_pixmap()

            text_info=page.get_text(),page.get_text_words()

          #  text_word=page.get_text_words()
            pix = fz.Pixmap(page_data, 0) if page_data.alpha else page_data
            img = Image.open(io.BytesIO(pix.tobytes('ppm')))

            # Convertissez l'image en PhotoImage
            label_img = ImageTk.PhotoImage(img,size=(self.page_width+150, self.page_height),width=750)
            self.pdf_images.append(label_img)
            self._text_info.append(text_info)

            self.percentage_bar = self.percentage_bar + 1
            percentage_view = (float(self.percentage_bar) / float(len(pdf)) * float(100))
            self.loading_bar.set(percentage_view)
            self.percentage_load.set(f"Loading {os.path.basename(self.file)} \n{int(math.floor(percentage_view))}%")

        self.loading_bar.grid_forget()
        self.loading_message.grid_forget()

        pdf.close()

        for i in self.pdf_images:
            label=ttk.Label(self._scrlframe,image=i, text="")
            label.grid(row=count, column=0, pady=(0+self.separation), sticky="nesw")
            count+=1
            self.labels.append(label)

        return self._text_info    

    def _insert_text(self):
        self.text_box.delete("1.0", "end")
        count=0
        for i in self._text_info:
            print(i[1])

            self.text_box.insert('end',str(count)+'\n\n'+i[0] +'\n\n')
            count+=1

    def _SEARCH(self,):
        mot_a_rechercher="Site Information"  ## FROM CtkEntry.
        count=0
        for i in self._text_info:
            if mot_a_rechercher in i: 
                print(count)
            count+=1    

    def configure(self, **kwargs):
        """ configurable options """

        if "file" in kwargs:
            self.file = kwargs.pop("file")
            self.pdf_images = []
            self._text_info=[]

          #  self.text_box.destroy()

            for i in self.labels:
                i.destroy()

            self.labels = []
            self.after(250, self._grid_loading)

        if "page_width" in kwargs:
            self.page_width = kwargs.pop("page_width")
            for i in self.pdf_images:
                i.configure(size=(self.page_width, self.page_height))

        if "page_height" in kwargs:
            self.page_height = kwargs.pop("page_height")
            for i in self.pdf_images:
                i.configure(size=(self.page_width, self.page_height))

        if "page_separation_height" in kwargs:
            self.separation = kwargs.pop("page_separation_height")
            for i in self.labels:
                i.pack_forget()
                i.pack(pady=(0,self.separation))

        super().configure(**kwargs)
UlisesToledoH commented 5 months ago

What a job mate! COngratulations it resolved a problem with the scrollbar