refactor: prepare repo for v1.8.1

- add localizations for AutoFP8 - remove unnecessary assets - update CHANGELOG.md - add DownloadThread.py docs
2024-09-04 17:19:54 -07:00 · 2024-09-04 17:19:54 -07:00 · d55cb9ea9b
parent 3adee266ca
commit d55cb9ea9b
8 changed files with 117 additions and 23 deletions
--- a/.env.example
+++ b/.env.example
@ -3,3 +3,6 @@ AUTOGGUF_THEME=
 AUTOGGUF_CHECK_BACKEND=enabled
 AUTOGGUF_CHECK_UPDATE=enabled
 AUTOGGUF_SERVER_API_KEY=
 AUTOGGUF_MODEL_DIR_NAME=models
 AUTOGGUF_OUTPUT_DIR_NAME=quantized_models
 AUTOGGUF_RESIZE_FACTOR=1.1
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@ -1,5 +1,35 @@
 # Changelog
 ## [v1.8.1] - 2024-09-04
 ### Added
 - AutoFP8 quantization classes and window (currently WIP)
 - Minimize/maximize buttons to title bar
 - API key authentication support for the local server
 - HuggingFace upload/download class
 - OpenAPI docs for endpoints
 ### Changed
 - Replaced Flask with FastAPI and Uvicorn for improved performance
 - Moved functions out of AutoGGUF.py into utils.py and TaskListItem.py
 - Updated llama.cpp convert scripts
 - Improved LoRA conversion process:
  - Allow specifying output path in arguments
  - Removed shutil.move operation
  - Increased max number of LoRA layers
 - Changed default port to 7001
 - Now binding to localhost (127.0.0.1) instead of 0.0.0.0
 - Upadted Spanish localizations
 - Updated setuptools requirement from ~=68.2.0 to ~=74.0.0
 ### Fixed
 - Web page not found error
 - Use of proper status in TaskListItem
 - Passing of quant_threads and Logger to TaskListItem
 - Improved window moving smoothness
 - Prevention of moving window below taskbar
 - Optimized imports in various files
 ## [v1.8.0] - 2024-08-26
 ### Added
--- a/assets/icon.RES
+++ b/assets/icon.RES
--- a/assets/icon.rc
+++ b/assets/icon.rc
@ -1 +0,0 @@
 IDI_ICON1 ICON "favicon.ico"
--- a/docs/AutoGGUF.py
+++ b/docs/AutoGGUF.py
@ -1,29 +1,34 @@
 import importlib
 import json
 import re
 import shutil
-import os
+from datetime import datetime
 from functools import partial
 from typing import Any, Dict, List, Tuple
 import requests
 from PySide6.QtCore import *
 from PySide6.QtGui import *
 from PySide6.QtWidgets import *
 from dotenv import load_dotenv
 import lora_conversion
 import presets
 import ui_update
 import utils
 from CustomTitleBar import CustomTitleBar
 from GPUMonitor import GPUMonitor
-from KVOverrideEntry import KVOverrideEntry
+from Localizations import *
 from Logger import Logger
-from ModelInfoDialog import ModelInfoDialog
+from QuantizationThread import QuantizationThread
-from error_handling import show_error, handle_error
+from TaskListItem import TaskListItem
 from error_handling import handle_error, show_error
 from imports_and_globals import (
    ensure_directory,
    open_file_safe,
    resource_path,
    show_about,
    ensure_directory,
 )
 from Localizations import *
 import presets
 import ui_update
 import lora_conversion
 import utils
 class CustomTitleBar(QWidget):
--- a/docs/DownloadThread.py
+++ b/docs/DownloadThread.py
@ -0,0 +1,44 @@
 import os
 import zipfile
 import requests
 from PySide6.QtCore import QThread, Signal
 class DownloadThread(QThread):
    """
    A QThread subclass for downloading and extracting zip files.
    This thread downloads a file from a given URL, saves it to a specified path,
    extracts its contents if it's a zip file, and then removes the original zip file.
    Signals:
        progress_signal (int): Emits the download progress as a percentage.
        finished_signal (str): Emits the path of the extracted directory upon successful completion.
        error_signal (str): Emits an error message if an exception occurs during the process.
    """
    def __init__(self, url: str, save_path: str) -> None:
        """
        Initialize the DownloadThread.
        Args:
            url (str): The URL of the file to download.
            save_path (str): The local path where the file will be saved.
        """
    def run(self) -> None:
        """
        Execute the download, extraction, and cleanup process.
        This method performs the following steps:
        1. Downloads the file from the specified URL.
        2. Saves the file to the specified path.
        3. Extracts the contents if it's a zip file.
        4. Removes the original zip file after extraction.
        5. Emits signals for progress updates, completion, or errors.
        Raises:
            Exception: Any exception that occurs during the process is caught
                       and emitted through the error_signal.
        """
--- a/src/AutoGGUF.py
+++ b/src/AutoGGUF.py
@ -1016,7 +1016,9 @@ def browse_hf_outfile(self) -> None:
            self.hf_outfile.setText(os.path.abspath(outfile))
    def quantize_to_fp8_dynamic(self, model_dir: str, output_dir: str) -> None:
-        self.logger.info(f"Quantizing {os.path.basename(model_dir)} to {output_dir}")
+        self.logger.info(
            QUANTIZING_TO_WITH_AUTOFP8.format(os.path.basename(model_dir), output_dir)
        )
        try:
            command = [
                "python",
@ -1034,7 +1036,7 @@ def quantize_to_fp8_dynamic(self, model_dir: str, output_dir: str) -> None:
            thread = QuantizationThread(command, os.getcwd(), log_file)
            self.quant_threads.append(thread)
-            task_name = f"Quantizing {os.path.basename(model_dir)} with AutoFP8"
+            task_name = QUANTIZING_WITH_AUTOFP8.format(os.path.basename(model_dir))
            task_item = TaskListItem(
                task_name,
                log_file,
@ -1057,12 +1059,12 @@ def quantize_to_fp8_dynamic(self, model_dir: str, output_dir: str) -> None:
            thread.start()
        except Exception as e:
-            show_error(self.logger, f"Error starting AutoFP8 quantization: {e}")
+            show_error(self.logger, f"{ERROR_STARTING_AUTOFP8_QUANTIZATION}: {e}")
-        self.logger.info("AutoFP8 quantization task started")
+        self.logger.info(AUTOFP8_QUANTIZATION_TASK_STARTED)
    def show_autofp8_window(self):
        dialog = QDialog(self)
-        dialog.setWindowTitle("Quantize to FP8 Dynamic")
+        dialog.setWindowTitle(QUANTIZE_TO_FP8_DYNAMIC)
        dialog.setFixedWidth(500)
        layout = QVBoxLayout()
@ -1072,10 +1074,10 @@ def show_autofp8_window(self):
        input_button = QPushButton(BROWSE)
        input_button.clicked.connect(
            lambda: self.fp8_input.setText(
-                QFileDialog.getExistingDirectory(self, "Open Model Folder")
+                QFileDialog.getExistingDirectory(self, OPEN_MODEL_FOLDER)
            )
        )
-        input_layout.addWidget(QLabel("Input Model:"))
+        input_layout.addWidget(QLabel(INPUT_MODEL))
        input_layout.addWidget(self.fp8_input)
        input_layout.addWidget(input_button)
        layout.addLayout(input_layout)
@ -1086,16 +1088,16 @@ def show_autofp8_window(self):
        output_button = QPushButton(BROWSE)
        output_button.clicked.connect(
            lambda: self.fp8_output.setText(
-                QFileDialog.getExistingDirectory(self, "Open Model Folder")
+                QFileDialog.getExistingDirectory(self, OPEN_MODEL_FOLDER)
            )
        )
-        output_layout.addWidget(QLabel("Output Path:"))
+        output_layout.addWidget(QLabel(OUTPUT))
        output_layout.addWidget(self.fp8_output)
        output_layout.addWidget(output_button)
        layout.addLayout(output_layout)
        # Quantize button
-        quantize_button = QPushButton("Quantize")
+        quantize_button = QPushButton(QUANTIZE)
        quantize_button.clicked.connect(
            lambda: self.quantize_to_fp8_dynamic(
                self.fp8_input.text(), self.fp8_output.text()
--- a/src/Localizations.py
+++ b/src/Localizations.py
@ -1,6 +1,6 @@
 import os
-AUTOGGUF_VERSION = "v1.8.0"
+AUTOGGUF_VERSION = "v1.8.1"
 class _Localization:
@ -34,6 +34,17 @@ def __init__(self):
        self.IMPORTING_MODEL = "Importing model"
        self.IMPORTED_MODEL_TOOLTIP = "Imported model: {}"
        # AutoFP8 Quantization
        self.AUTOFP8_QUANTIZATION_TASK_STARTED = "AutoFP8 quantization task started"
        self.ERROR_STARTING_AUTOFP8_QUANTIZATION = "Error starting AutoFP8 quantization"
        self.QUANTIZING_WITH_AUTOFP8 = "Quantizing {0} with AutoFP8"
        self.QUANTIZING_TO_WITH_AUTOFP8 = "Quantizing {0} to {1}"
        self.QUANTIZE_TO_FP8_DYNAMIC = "Quantize to FP8 Dynamic"
        self.OPEN_MODEL_FOLDER = "Open Model Folder"
        self.QUANTIZE = "Quantize"
        self.OPEN_MODEL_FOLDER = "Open Model Folder"
        self.INPUT_MODEL = "Input Model:"
        # GGUF Verification
        self.INVALID_GGUF_FILE = "Invalid GGUF file: {}"
        self.SHARDED_MODEL_NAME = "{} (Sharded)"