feat(core): add verification to manual import + concatenated file support

- verify GGUFs on manual import
- show a warning when dealing with concatenated files such as mradermacher's split GGUFs (partXofX)
2024-08-22 15:57:21 -07:00 · 2024-08-22 15:57:21 -07:00 · 4f2c8057e1
parent 88875e3d67
commit 4f2c8057e1
2 changed files with 75 additions and 22 deletions
--- a/src/AutoGGUF.py
+++ b/src/AutoGGUF.py
@ -1156,6 +1156,14 @@ def create_label(self, text, tooltip):
        label.setToolTip(tooltip)
        return label
    def verify_gguf(self, file_path):
        """Check whether a file starts with the ``GGUF`` magic bytes.

        Args:
            file_path: Path of the file to inspect; it is opened in binary
                read mode.

        Returns:
            True when the first four bytes of the file are exactly
            ``b"GGUF"``. False when they differ (including files shorter
            than four bytes) or when opening/reading the file raises any
            ``Exception``.
        """
        expected_magic = b"GGUF"
        try:
            with open(file_path, "rb") as gguf_file:
                # Only the leading signature is read; the rest of the file
                # is never touched.
                header = gguf_file.read(len(expected_magic))
        except Exception:
            # Best-effort check: an unreadable path is reported as "not GGUF"
            # rather than propagating the error to the caller.
            return False
        return header == expected_magic
    def load_models(self):
        self.logger.info(LOADING_MODELS)
        models_dir = self.models_input.text()
@ -1164,34 +1172,48 @@ def load_models(self):
        sharded_models = {}
        single_models = []
        concatenated_models = []
        # Regex pattern to match sharded model filenames
        shard_pattern = re.compile(r"(.*)-(\d+)-of-(\d+)\.gguf$")
        concat_pattern = re.compile(r"(.*)\.gguf\.part(\d+)of(\d+)$")
        # Load models from the models directory
        for file in os.listdir(models_dir):
            full_path = os.path.join(models_dir, file)
            if file.endswith(".gguf"):
                if not self.verify_gguf(full_path):
                    show_error(self.logger, INVALID_GGUF_FILE.format(file))
                    continue
                match = shard_pattern.match(file)
                if match:
                    # This is a sharded model
                    base_name, shard_num, total_shards = match.groups()
                    if base_name not in sharded_models:
                        sharded_models[base_name] = []
                    sharded_models[base_name].append((int(shard_num), file))
                else:
                    single_models.append(file)
            else:
                match = concat_pattern.match(file)
                if match:
                    concatenated_models.append(file)
        # Add imported models
        if hasattr(self, "imported_models"):
            for imported_model in self.imported_models:
                file_name = os.path.basename(imported_model)
-                if file_name not in single_models:
+                if (
                    file_name not in single_models
                    and file_name not in concatenated_models
                ):
                    if self.verify_gguf(imported_model):
                        single_models.append(file_name)
                    else:
                        show_error(
                            self.logger, INVALID_GGUF_FILE.format(imported_model)
                        )
        # Add sharded models to the tree
        for base_name, shards in sharded_models.items():
            parent_item = QTreeWidgetItem(self.model_tree)
-            parent_item.setText(0, f"{base_name} ({SHARDED})")
+            parent_item.setText(0, SHARDED_MODEL_NAME.format(base_name))
            first_shard = sorted(shards, key=lambda x: x[0])[0][1]
            parent_item.setData(0, Qt.ItemDataRole.UserRole, first_shard)
            for _, shard_file in sorted(shards):
@ -1199,8 +1221,26 @@ def load_models(self):
                child_item.setText(0, shard_file)
                child_item.setData(0, Qt.ItemDataRole.UserRole, shard_file)
        # Add single models to the tree
        for model in sorted(single_models):
            self.add_model_to_tree(model)
        for model in sorted(concatenated_models):
            item = self.add_model_to_tree(model)
            item.setForeground(0, Qt.gray)
            item.setToolTip(0, CONCATENATED_FILE_WARNING)
        self.model_tree.expandAll()
        self.logger.info(
            LOADED_MODELS.format(
                len(single_models) + len(sharded_models) + len(concatenated_models)
            )
        )
        if concatenated_models:
            self.logger.warning(
                CONCATENATED_FILES_FOUND.format(len(concatenated_models))
            )
    def add_model_to_tree(self, model):
        item = QTreeWidgetItem(self.model_tree)
        item.setText(0, model)
        if hasattr(self, "imported_models") and model in [
@ -1213,9 +1253,7 @@ def load_models(self):
            item.setToolTip(0, IMPORTED_MODEL_TOOLTIP.format(full_path))
        else:
            item.setData(0, Qt.ItemDataRole.UserRole, model)
-
+        return item
        self.model_tree.expandAll()
        self.logger.info(LOADED_MODELS.format(len(single_models) + len(sharded_models)))
    def validate_quantization_inputs(self):
        self.logger.debug(VALIDATING_QUANTIZATION_INPUTS)
@ -1469,6 +1507,12 @@ def import_model(self):
        )
        if file_path:
            file_name = os.path.basename(file_path)
            # Verify GGUF file
            if not self.verify_gguf(file_path):
                show_error(self.logger, INVALID_GGUF_FILE.format(file_name))
                return
            reply = QMessageBox.question(
                self,
                CONFIRM_IMPORT,
--- a/src/Localizations.py
+++ b/src/Localizations.py
@ -34,6 +34,15 @@ def __init__(self):
        self.IMPORTING_MODEL = "Importing model"
        self.IMPORTED_MODEL_TOOLTIP = "Imported model: {}"
        # GGUF Verification
        self.INVALID_GGUF_FILE = "Invalid GGUF file: {}"
        self.SHARDED_MODEL_NAME = "{} (Sharded)"
        self.IMPORTED_MODEL_TOOLTIP = "Imported model: {}"
        self.CONCATENATED_FILE_WARNING = "This is a concatenated file part. It will not work with llama-quantize; please concat the file first."
        self.CONCATENATED_FILES_FOUND = (
            "Found {} concatenated file parts. Please concat the files first."
        )
        # GPU Monitoring
        self.GPU_USAGE = "GPU Usage:"
        self.GPU_USAGE_FORMAT = "GPU: {:.1f}% | VRAM: {:.1f}% ({} MB / {} MB)"