ttttdiva committed (verified)
Commit fc1d399 · 1 Parent(s): a7e29db

Update main.py

Files changed (1):
  1. main.py +246 -313

main.py CHANGED
@@ -16,7 +16,6 @@ from fake_useragent import UserAgent
16
  from fastapi import FastAPI
17
  from huggingface_hub import HfApi, create_repo, hf_hub_download, login
18
 
19
- # Logging configuration
20
  logging.basicConfig(level=logging.INFO)
21
  logger = logging.getLogger(__name__)
22
 
@@ -49,7 +48,6 @@ class Config:
49
 
50
  # ===== Additional settings for rclone =====
51
  RCLONE_CONF_BASE64 = os.environ.get("RCLONE_CONF_BASE64", "")
52
- # Local directory where the encrypted files are written (the backing directory for cryptLocal:)
53
  ENCRYPTED_DIR = "/home/user/app/encrypted"
54
 
55
 
@@ -63,61 +61,50 @@ class CivitAICrawler:
63
  self.repo_ids = self.config.REPO_IDS.copy()
64
  self.jst = self.config.JST
65
 
66
- # Set up rclone
67
  self.setup_rclone_conf()
68
 
69
  self.setup_routes()
70
 
71
  def setup_routes(self):
72
- """Configure the FastAPI routes."""
73
  @self.app.get("/")
74
  def read_root():
75
  now = str(datetime.datetime.now(self.jst))
76
- description = f"""
77
- This Space periodically crawls CivitAI and backs up new models to {self.repo_ids['current']}.
78
- model_list.log and civitai_backup.log are uploaded without encryption.
79
- Model folders and files are encrypted before upload.
80
- Status: {now} + currently running :D
81
- """
82
  return description
83
 
84
  @self.app.on_event("startup")
85
  async def startup_event():
86
  asyncio.create_task(self.crawl())
87
 
88
- # =============================================================================
89
- # rclone configuration & encrypted upload handling
90
- # =============================================================================
91
  def setup_rclone_conf(self):
92
- """Generate rclone.conf from the RCLONE_CONF_BASE64 environment variable and set RCLONE_CONFIG to point at it"""
93
  if not self.config.RCLONE_CONF_BASE64:
94
  logger.warning("[WARN] RCLONE_CONF_BASE64 is empty. rclone may fail.")
95
  return
96
-
97
  os.makedirs(".rclone_config", exist_ok=True)
98
  conf_path = os.path.join(".rclone_config", "rclone.conf")
99
  with open(conf_path, "wb") as f:
100
  f.write(base64.b64decode(self.config.RCLONE_CONF_BASE64))
101
-
102
  os.environ["RCLONE_CONFIG"] = conf_path
103
  logger.info(f"[INFO] rclone.conf created at: {conf_path}")
104
 
105
  def encrypt_with_rclone(self, local_path: str):
106
- """
107
- Copy the given file or directory to cryptLocal:.
108
- Folder structure and file names are encrypted according to rclone's filename_encryption setting.
109
- """
110
  if not os.path.exists(local_path):
111
  raise FileNotFoundError(f"[ERROR] Local path not found: {local_path}")
112
-
113
  # Clean up the encryption output directory beforehand
114
  if os.path.isdir(self.config.ENCRYPTED_DIR):
115
  shutil.rmtree(self.config.ENCRYPTED_DIR, ignore_errors=True)
116
 
117
- top_level_name = os.path.basename(local_path.rstrip("/"))
118
- if not top_level_name:
119
- top_level_name = "unnamed"
120
-
121
  cmd = ["rclone", "copy", local_path, f"cryptLocal:{top_level_name}", "-v"]
122
  logger.info(f"[INFO] Running: {' '.join(cmd)}")
123
  subprocess.run(cmd, check=True)
@@ -128,15 +115,14 @@ class CivitAICrawler:
128
  f"[ERROR] {self.config.ENCRYPTED_DIR} not found. Check your rclone config."
129
  )
130
 
131
- # Example: retry handling inside upload_encrypted_files
132
  def upload_encrypted_files(self, repo_id: str, base_path_in_repo: str = ""):
 
133
  max_retries = 5
134
  for root, dirs, files in os.walk(self.config.ENCRYPTED_DIR):
135
  for fn in files:
136
  encrypted_file_path = os.path.join(root, fn)
137
  if not os.path.isfile(encrypted_file_path):
138
  continue
139
-
140
  relative_path = os.path.relpath(encrypted_file_path, self.config.ENCRYPTED_DIR)
141
  upload_path_in_repo = os.path.join(base_path_in_repo, relative_path)
142
 
@@ -150,37 +136,26 @@ class CivitAICrawler:
150
  )
151
  logger.info(f"[OK] Uploaded => {repo_id}/{upload_path_in_repo}")
152
  break
153
-
154
  except Exception as e:
155
  attempt += 1
156
  error_message = str(e)
157
-
158
- # ================================
159
- # Added detection of 429 rate-limit responses
160
- # ================================
161
- # "You have been rate-limited; you can retry this action in 31 minutes."
162
- # Extract the wait time from messages like the one above, wait that many minutes plus one, then retry
163
  if "rate-limited" in error_message and "minutes" in error_message:
164
  import re
165
  match = re.search(r"in (\d+) minutes?", error_message)
166
  if match:
167
- minutes = int(match.group(1))
168
- # Add one minute and wait
169
- minutes += 1
170
- logger.warning(f"Rate-limited. Waiting {minutes} minutes before retry...")
171
  time.sleep(minutes * 60)
172
- attempt -= 1  # retry with the same attempt count
173
  continue
174
-
175
- # ================================
176
- # Existing 1-hour wait handling
177
- # ================================
178
  if "you can retry this action in about 1 hour" in error_message:
179
- logger.warning("Encountered 'retry in 1 hour' error. Waiting 1 hour before retrying...")
180
  time.sleep(3600)
181
- attempt -= 1  # continue the loop without consuming a retry
182
  continue
183
-
184
  if "over the limit of 100000 files" in error_message:
185
  logger.warning("Repository file limit exceeded. Creating a new repository...")
186
  self.repo_ids['current'] = self.increment_repo_name(self.repo_ids['current'])
@@ -189,7 +164,6 @@ class CivitAICrawler:
189
  repo_id = self.repo_ids['current']
190
  continue
191
 
192
- # Any other error
193
  if attempt < max_retries:
194
  logger.warning(
195
  f"Failed to upload {encrypted_file_path}, retry {attempt}/{max_retries}..."
@@ -200,148 +174,6 @@ class CivitAICrawler:
200
  )
201
  raise
202
 
203
- @staticmethod
204
- def get_filename_from_cd(content_disposition: Optional[str], default_name: str) -> str:
205
- if content_disposition:
206
- parts = content_disposition.split(';')
207
- for part in parts:
208
- if "filename=" in part:
209
- return part.split("=")[1].strip().strip('"')
210
- return default_name
211
-
212
- def download_file(self, url: str, destination_folder: str, default_name: str):
213
- try:
214
- response = requests.get(url, headers=self.config.HEADERS, stream=True)
215
- response.raise_for_status()
216
- except requests.RequestException as e:
217
- logger.error(f"Failed to download file from {url}: {e}")
218
- return
219
-
220
- filename = self.get_filename_from_cd(response.headers.get('content-disposition'), default_name)
221
- file_path = os.path.join(destination_folder, filename)
222
-
223
- with open(file_path, 'wb') as file:
224
- for chunk in response.iter_content(chunk_size=8192):
225
- file.write(chunk)
226
- logger.info(f"Download completed: {file_path}")
227
-
228
- def get_model_info(self, model_id: str) -> dict:
229
- try:
230
- response = requests.get(self.config.URLS["modelId"] + str(model_id), headers=self.config.HEADERS)
231
- response.raise_for_status()
232
- return response.json()
233
- except requests.RequestException as e:
234
- logger.error(f"Failed to retrieve model info for ID {model_id}: {e}")
235
-
236
- def download_model(self, model_versions: list, folder: str, existing_old_version_files: list = []):
237
- latest_version = model_versions[0]
238
- latest_files = latest_version["files"]
239
- for file_info in latest_files:
240
- download_url = file_info["downloadUrl"]
241
- file_name = file_info["name"]
242
- login_detected_count = 0
243
-
244
- while login_detected_count < 5:
245
- try:
246
- self.download_file(download_url, folder, file_name)
247
- except Exception as e:
248
- logger.error(f"Exception occurred while downloading {file_name}: {e}")
249
- login_detected_count += 1
250
- continue
251
-
252
- if "login" in os.listdir(folder):
253
- login_detected_count += 1
254
- logger.warning(f"'login' file found. Will try again. ({login_detected_count}/5)")
255
- os.remove(os.path.join(folder, "login"))
256
- else:
257
- logger.info(f"Successfully downloaded {file_name}")
258
- break
259
-
260
- if login_detected_count >= 5:
261
- dummy_file_name = f"{file_name}.download_failed"
262
- dummy_file_path = os.path.join(folder, dummy_file_name)
263
- try:
264
- with open(dummy_file_path, "w") as f:
265
- f.write("Download failed after 5 attempts.")
266
- logger.error(f"Failed to download {file_name}. Created dummy file {dummy_file_name}. URL: {download_url}")
267
- except Exception as e:
268
- logger.error(f"Failed to create dummy file for {file_name}: {e}")
269
-
270
- # Download old versions
271
- if len(model_versions) > 1:
272
- old_versions_folder = os.path.join(folder, "old_versions")
273
- os.makedirs(old_versions_folder, exist_ok=True)
274
- for version in model_versions[1:]:
275
- for file_info in version["files"]:
276
- file_name = file_info["name"]
277
- if file_name in existing_old_version_files:
278
- logger.info(f"Skipping download of existing old version file: {file_name}")
279
- continue
280
- download_url = file_info["downloadUrl"]
281
- local_file_path = os.path.join(old_versions_folder, file_name)
282
- login_detected_count = 0
283
-
284
- while login_detected_count < 5:
285
- try:
286
- self.download_file(download_url, old_versions_folder, file_name)
287
- except Exception as e:
288
- logger.error(f"Exception occurred while downloading {file_name}: {e}")
289
- login_detected_count += 1
290
- continue
291
-
292
- if "login" in os.listdir(old_versions_folder):
293
- login_detected_count += 1
294
- logger.warning(f"'login' file found while downloading {file_name}. Will try again. ({login_detected_count}/5)")
295
- os.remove(os.path.join(old_versions_folder, "login"))
296
- else:
297
- logger.info(f"Successfully downloaded {file_name}")
298
- break
299
-
300
- if login_detected_count >= 5:
301
- dummy_file_name = f"{file_name}.download_failed"
302
- dummy_file_path = os.path.join(old_versions_folder, dummy_file_name)
303
- try:
304
- with open(dummy_file_path, "w") as f:
305
- f.write("Download failed after 5 attempts.")
306
- logger.error(f"Failed to download {file_name}. Created dummy file {dummy_file_name}. URL: {download_url}")
307
- except Exception as e:
308
- logger.error(f"Failed to create dummy file for {file_name}: {e}")
309
-
310
- def download_images(self, model_versions: list, folder: str):
311
- images_folder = os.path.join(folder, "images")
312
- os.makedirs(images_folder, exist_ok=True)
313
-
314
- images = []
315
- for version in model_versions:
316
- for img in version.get("images", []):
317
- image_url = img["url"]
318
- images.append(image_url)
319
-
320
- for image_url in images:
321
- image_name = image_url.split("/")[-1]
322
- try:
323
- response = requests.get(image_url)
324
- response.raise_for_status()
325
- with open(os.path.join(images_folder, f"{image_name}.png"), "wb") as file:
326
- file.write(response.content)
327
- except requests.RequestException as e:
328
- logger.error(f"Error downloading image {image_url}: {e}")
329
-
330
- def save_html_content(self, url: str, folder: str):
331
- try:
332
- response = requests.get(url)
333
- response.raise_for_status()
334
- html_path = os.path.join(folder, f"{folder}.html")
335
- with open(html_path, 'w', encoding='utf-8') as file:
336
- file.write(response.text)
337
- except Exception as e:
338
- logger.error(f"Error saving HTML content for URL {url}: {e}")
339
-
340
- @staticmethod
341
- def save_model_info(model_info: dict, folder: str):
342
- with open(os.path.join(folder, "model_info.json"), "w") as file:
343
- json.dump(model_info, file, indent=2)
344
-
345
  @staticmethod
346
  def increment_repo_name(repo_id: str) -> str:
347
  match = re.search(r'(\d+)$', repo_id)
@@ -351,15 +183,38 @@ class CivitAICrawler:
351
  else:
352
  return f"{repo_id}1"
353
 
354
- # =============================================================================
355
- # Unencrypted uploads (for logs and model_list.log)
356
- # =============================================================================
357
- def upload_file_raw(
358
  self,
359
- file_path: str,
360
  repo_id: Optional[str] = None,
361
- path_in_repo: Optional[str] = None
362
  ):
 
 
 
 
 
 
363
  if repo_id is None:
364
  repo_id = self.repo_ids['current']
365
  if path_in_repo is None:
@@ -387,7 +242,7 @@ class CivitAICrawler:
387
  repo_id = self.repo_ids['current']
388
  continue
389
  elif "you can retry this action in about 1 hour" in error_message:
390
- logger.warning("Encountered 'retry in 1 hour' error. Waiting 1 hour before retrying...")
391
  time.sleep(3600)
392
  attempt -= 1
393
  else:
@@ -397,67 +252,150 @@ class CivitAICrawler:
397
  logger.error(f"Failed to upload raw file after {max_retries} attempts: {file_path}")
398
  raise
399
 
400
- # =============================================================================
401
- # Encrypt and upload (single file)
402
- # =============================================================================
403
- def upload_file_encrypted(
404
- self,
405
- file_path: str,
406
- repo_id: Optional[str] = None,
407
- path_in_repo: Optional[str] = None
408
- ):
409
- if repo_id is None:
410
- repo_id = self.repo_ids['current']
411
- base_path = path_in_repo or ""
412
 
413
- self.encrypt_with_rclone(file_path)
414
- self.upload_encrypted_files(repo_id=repo_id, base_path_in_repo=base_path)
 
 
 
 
 
415
 
416
- if os.path.isdir(self.config.ENCRYPTED_DIR):
417
- shutil.rmtree(self.config.ENCRYPTED_DIR, ignore_errors=True)
418
 
419
- # =============================================================================
420
- # Encrypt and upload (folder)
421
- # =============================================================================
422
- def upload_folder_encrypted(
423
- self,
424
- folder_path: str,
425
- repo_id: Optional[str] = None,
426
- path_in_repo: Optional[str] = None
427
- ) -> str:
428
- if repo_id is None:
429
- repo_id = self.repo_ids['current']
430
- base_path = path_in_repo or ""
431
 
432
- self.encrypt_with_rclone(folder_path)
 
433
 
434
- top_levels = [
435
- d for d in os.listdir(self.config.ENCRYPTED_DIR)
436
- if os.path.isdir(os.path.join(self.config.ENCRYPTED_DIR, d))
437
- ]
438
- if not top_levels:
439
- raise RuntimeError("No top-level folder found after rclone encryption.")
440
- if len(top_levels) > 1:
441
- logger.warning(f"Multiple top-level folders found after encryption? {top_levels}. Using the first one.")
 
 
 
 
442
 
443
- encrypted_top_name = top_levels[0]
 
 
 
 
444
 
445
- self.upload_encrypted_files(repo_id=repo_id, base_path_in_repo=base_path)
 
 
 
446
 
447
- if os.path.isdir(self.config.ENCRYPTED_DIR):
448
- shutil.rmtree(self.config.ENCRYPTED_DIR, ignore_errors=True)
 
 
 
 
 
 
 
449
 
450
- return encrypted_top_name
 
 
451
 
452
- # =============================================================================
453
- # Changed model_list.log reads/writes to use the "model_id: model_hf_url" format
454
- # =============================================================================
455
- def read_model_list(self):
 
 
 
 
 
 
456
  """
457
- Read each line of model_list.log in the format
458
- "123456: https://huggingface.co/...encrypted_folder_name"
459
- and return a dict of the form { "123456": "https://huggingface.co/..." }
460
  """
 
 
 
 
 
 
461
  model_list = {}
462
  try:
463
  with open(self.config.LIST_FILE, "r", encoding="utf-8") as f:
@@ -469,95 +407,103 @@ class CivitAICrawler:
469
  if len(parts) == 2:
470
  stored_id, stored_url = parts
471
  model_list[stored_id] = stored_url
472
- return model_list
473
  except Exception as e:
474
  logger.error(f"Failed to read model list: {e}")
475
- return {}
476
 
477
  def process_model(self, model_url: str):
478
- """Process the given model URL."""
479
  try:
480
  model_id = model_url.rstrip("/").split("/")[-1]
481
  model_info = self.get_model_info(model_id)
482
-
 
 
 
483
  latest_version = model_info.get("modelVersions", [])[0]
484
  model_file = next(
485
- (file for file in latest_version["files"] if file.get('type') == 'Model'),
486
  None
487
  )
488
  if model_file:
489
- latest_filename = model_file['name']
490
  folder = os.path.splitext(latest_filename)[0]
491
  else:
 
492
  first_file = latest_version["files"][0]
493
- latest_filename = first_file['name']
494
  folder = os.path.splitext(latest_filename)[0]
495
- logger.warning(f"No 'Model' type file found for model ID {model_id}. Using first file's name.")
496
-
 
497
  os.makedirs(folder, exist_ok=True)
498
-
499
- # Load model_list
500
  model_list = self.read_model_list()
501
-
502
- # Example of checking whether a model with the same name (model page name) has already been uploaded:
503
- # Note: decide whether to key on modelpage_name (= model_info["name"])
504
- # or on model_id (str), depending on how you run this.
505
- # As an example, the flow below checks using modelpage_name as the key:
506
- modelpage_name = model_info.get("name", "Unnamed Model")
507
-
508
  if modelpage_name in model_list.values():
509
- # The same model page name has already been uploaded; decide here whether to skip, overwrite, etc.
510
- logger.info(f"Model '{modelpage_name}' is already listed in model_list. Skipping re-upload.")
511
- # If you do not want to force a re-upload, end processing with return:
512
- # return
513
- # Alternatively you could force the upload but only add new versions, and so on.
514
- # Here we deliberately continue; adjust as needed.
515
-
516
- # Download files and save images
517
- existing_old_version_files = []
518
- self.download_model(model_info["modelVersions"], folder, existing_old_version_files)
519
- self.download_images(model_info["modelVersions"], folder)
520
- self.save_html_content(model_url, folder)
521
- self.save_model_info(model_info, folder)
522
-
523
- # ========== Upload the encrypted folder with rclone ==========
524
- encrypted_top_name = self.upload_folder_encrypted(folder)
525
-
526
- # URL of the model uploaded this time
527
- model_hf_url = f"https://huggingface.co/{self.repo_ids['current']}/tree/main/{encrypted_top_name}"
528
-
529
- # Append to model_list.log in the "modelpage_name: model_hf_url" format
530
- with open(self.config.LIST_FILE, "a", encoding="utf-8") as f:
531
- f.write(f"{modelpage_name}: {model_hf_url}\n")
532
-
533
- # Delete the local folder
 
 
534
  if os.path.exists(folder):
535
  shutil.rmtree(folder)
536
-
 
 
 
 
 
 
 
 
537
  except Exception as e:
538
  logger.error(f"Unexpected error processing model ({model_url}): {e}")
539
 
540
 
541
  async def crawl(self):
542
- """Periodically check for and process new models."""
543
  while True:
544
  try:
545
  login(token=self.config.HUGGINGFACE_API_KEY, add_to_git_credential=True)
546
 
547
- # Fetch model_list.log & civitai_backup.log
548
  model_list_path = hf_hub_download(repo_id=self.repo_ids['model_list'], filename=self.config.LIST_FILE)
549
  shutil.copyfile(model_list_path, f"./{self.config.LIST_FILE}")
550
 
551
  local_file_path = hf_hub_download(repo_id=self.repo_ids["log"], filename=self.config.LOG_FILE)
552
  shutil.copyfile(local_file_path, f"./{self.config.LOG_FILE}")
553
 
554
- # Read the log
555
  with open(self.config.LOG_FILE, "r", encoding="utf-8") as file:
556
  lines = file.read().splitlines()
557
  old_models = json.loads(lines[0]) if len(lines) > 0 else []
558
  self.repo_ids["current"] = lines[1] if len(lines) > 1 else ""
559
 
560
- # Check for new models
561
  response = requests.get(self.config.URLS["latest"], headers=self.config.HEADERS)
562
  response.raise_for_status()
563
  latest_models = response.json().get("items", [])
@@ -570,6 +516,7 @@ class CivitAICrawler:
570
  logger.info(f"New models found: {new_models}")
571
  model_id = new_models[0]
572
 
 
573
  for attempt in range(1, 6):
574
  try:
575
  self.process_model(f"{self.config.URLS['modelId']}{model_id}")
@@ -581,43 +528,29 @@ class CivitAICrawler:
581
  else:
582
  await asyncio.sleep(2)
583
  else:
584
- # No new models
585
  with open(self.config.LOG_FILE, "w", encoding="utf-8") as f:
586
  f.write(json.dumps(latest_model_ids) + "\n")
587
  f.write(f"{self.repo_ids['current']}\n")
588
  logger.info(f"Updated log file: {self.config.LOG_FILE}")
589
 
590
- self.upload_file_raw(
591
- file_path=self.config.LOG_FILE,
592
- repo_id=self.repo_ids["log"],
593
- path_in_repo=self.config.LOG_FILE
594
- )
595
  logger.info("Uploaded log file to repository (unencrypted).")
596
 
597
  logger.info("No new models found.")
598
  await asyncio.sleep(60)
599
  continue
600
 
601
- # Add the processed model ID to old_models
602
  old_models.append(model_id)
603
-
604
- # Update the log file
605
  with open(self.config.LOG_FILE, "w", encoding="utf-8") as f:
606
  f.write(json.dumps(old_models) + "\n")
607
  f.write(f"{self.repo_ids['current']}\n")
608
  logger.info(f"Updated log file with new model ID: {model_id}")
609
 
610
- # Upload the log and model_list.log
611
- self.upload_file_raw(
612
- file_path=self.config.LOG_FILE,
613
- repo_id=self.repo_ids["log"],
614
- path_in_repo=self.config.LOG_FILE
615
- )
616
- self.upload_file_raw(
617
- file_path=self.config.LIST_FILE,
618
- repo_id=self.repo_ids["model_list"],
619
- path_in_repo=self.config.LIST_FILE
620
- )
621
 
622
  except Exception as e:
623
  logger.error(f"Error during crawling: {e}")
 
16
  from fastapi import FastAPI
17
  from huggingface_hub import HfApi, create_repo, hf_hub_download, login
18
 
 
19
  logging.basicConfig(level=logging.INFO)
20
  logger = logging.getLogger(__name__)
21
 
 
48
 
49
  # ===== Additional settings for rclone =====
50
  RCLONE_CONF_BASE64 = os.environ.get("RCLONE_CONF_BASE64", "")
 
51
  ENCRYPTED_DIR = "/home/user/app/encrypted"
52
 
53
 
 
61
  self.repo_ids = self.config.REPO_IDS.copy()
62
  self.jst = self.config.JST
63
 
64
+ # Set up rclone
65
  self.setup_rclone_conf()
66
 
67
  self.setup_routes()
68
 
69
  def setup_routes(self):
 
70
  @self.app.get("/")
71
  def read_root():
72
  now = str(datetime.datetime.now(self.jst))
73
+ description = (
74
+ f"This Space periodically crawls CivitAI and backs up new models to {self.repo_ids['current']}.\n"
75
+ f"model_list.log and civitai_backup.log are uploaded without encryption.\n"
76
+ f"Model folders and files are encrypted before upload.\n"
77
+ f"Status: {now} + currently running :D\n"
78
+ )
79
  return description
80
 
81
  @self.app.on_event("startup")
82
  async def startup_event():
83
  asyncio.create_task(self.crawl())
84
 
85
+ # ============================================================================
86
+ # rclone configuration & encrypted upload handling
87
+ # ============================================================================
88
  def setup_rclone_conf(self):
 
89
  if not self.config.RCLONE_CONF_BASE64:
90
  logger.warning("[WARN] RCLONE_CONF_BASE64 is empty. rclone may fail.")
91
  return
 
92
  os.makedirs(".rclone_config", exist_ok=True)
93
  conf_path = os.path.join(".rclone_config", "rclone.conf")
94
  with open(conf_path, "wb") as f:
95
  f.write(base64.b64decode(self.config.RCLONE_CONF_BASE64))
 
96
  os.environ["RCLONE_CONFIG"] = conf_path
97
  logger.info(f"[INFO] rclone.conf created at: {conf_path}")
98
 
99
  def encrypt_with_rclone(self, local_path: str):
100
+ """Copy a single file or directory to cryptLocal: and encrypt it"""
 
 
 
101
  if not os.path.exists(local_path):
102
  raise FileNotFoundError(f"[ERROR] Local path not found: {local_path}")
 
103
  # Clean up the encryption output directory beforehand
104
  if os.path.isdir(self.config.ENCRYPTED_DIR):
105
  shutil.rmtree(self.config.ENCRYPTED_DIR, ignore_errors=True)
106
 
107
+ top_level_name = os.path.basename(local_path.rstrip("/")) or "unnamed"
 
 
 
108
  cmd = ["rclone", "copy", local_path, f"cryptLocal:{top_level_name}", "-v"]
109
  logger.info(f"[INFO] Running: {' '.join(cmd)}")
110
  subprocess.run(cmd, check=True)
 
115
  f"[ERROR] {self.config.ENCRYPTED_DIR} not found. Check your rclone config."
116
  )
117
 
 
118
  def upload_encrypted_files(self, repo_id: str, base_path_in_repo: str = ""):
119
+ """Recursively upload the encrypted files under self.config.ENCRYPTED_DIR"""
120
  max_retries = 5
121
  for root, dirs, files in os.walk(self.config.ENCRYPTED_DIR):
122
  for fn in files:
123
  encrypted_file_path = os.path.join(root, fn)
124
  if not os.path.isfile(encrypted_file_path):
125
  continue
 
126
  relative_path = os.path.relpath(encrypted_file_path, self.config.ENCRYPTED_DIR)
127
  upload_path_in_repo = os.path.join(base_path_in_repo, relative_path)
128
 
 
136
  )
137
  logger.info(f"[OK] Uploaded => {repo_id}/{upload_path_in_repo}")
138
  break
 
139
  except Exception as e:
140
  attempt += 1
141
  error_message = str(e)
142
+ # 429 Rate-limit (31 minutes)
 
 
 
 
 
143
  if "rate-limited" in error_message and "minutes" in error_message:
144
  import re
145
  match = re.search(r"in (\d+) minutes?", error_message)
146
  if match:
147
+ minutes = int(match.group(1)) + 1
148
+ logger.warning(f"Rate-limited. Waiting {minutes} minutes...")
 
 
149
  time.sleep(minutes * 60)
150
+ attempt -= 1
151
  continue
152
+ # 1-hour wait pattern
 
 
 
153
  if "you can retry this action in about 1 hour" in error_message:
154
+ logger.warning("Encountered 'retry in 1 hour' error. Waiting 1 hour...")
155
  time.sleep(3600)
156
+ attempt -= 1
157
  continue
158
+ # 100k-file limit
159
  if "over the limit of 100000 files" in error_message:
160
  logger.warning("Repository file limit exceeded. Creating a new repository...")
161
  self.repo_ids['current'] = self.increment_repo_name(self.repo_ids['current'])
 
164
  repo_id = self.repo_ids['current']
165
  continue
166
 
 
167
  if attempt < max_retries:
168
  logger.warning(
169
  f"Failed to upload {encrypted_file_path}, retry {attempt}/{max_retries}..."
 
174
  )
175
  raise
176
 
 
 
 
 
 
 
177
  @staticmethod
178
  def increment_repo_name(repo_id: str) -> str:
179
  match = re.search(r'(\d+)$', repo_id)
 
183
  else:
184
  return f"{repo_id}1"
185
 
186
+ # ============================================================================
187
+ # Encrypted upload of a single file, then local deletion
188
+ # ============================================================================
189
+ def upload_file_encrypted_one_by_one(
190
  self,
191
+ local_path: str,
192
  repo_id: Optional[str] = None,
193
+ path_in_repo: str = ""
194
  ):
195
+ """
196
+ Encrypt and upload a single file (or folder), then delete the local copy.
197
+ """
198
+ if not repo_id:
199
+ repo_id = self.repo_ids['current']
200
+
201
+ self.encrypt_with_rclone(local_path)
202
+ self.upload_encrypted_files(repo_id=repo_id, base_path_in_repo=path_in_repo)
203
+
204
+ # Remove the ENCRYPTED_DIR used for encryption
205
+ if os.path.isdir(self.config.ENCRYPTED_DIR):
206
+ shutil.rmtree(self.config.ENCRYPTED_DIR, ignore_errors=True)
207
+
208
+ # Also delete the original local file
209
+ if os.path.isfile(local_path):
210
+ os.remove(local_path)
211
+ elif os.path.isdir(local_path):
212
+ shutil.rmtree(local_path, ignore_errors=True)
213
+
214
+ # ============================================================================
215
+ # Raw (unencrypted) file upload (logs, etc.)
216
+ # ============================================================================
217
+ def upload_file_raw(self, file_path: str, repo_id: Optional[str] = None, path_in_repo: Optional[str] = None):
218
  if repo_id is None:
219
  repo_id = self.repo_ids['current']
220
  if path_in_repo is None:
 
242
  repo_id = self.repo_ids['current']
243
  continue
244
  elif "you can retry this action in about 1 hour" in error_message:
245
+ logger.warning("Encountered 'retry in 1 hour' error. Waiting 1 hour...")
246
  time.sleep(3600)
247
  attempt -= 1
248
  else:
 
252
  logger.error(f"Failed to upload raw file after {max_retries} attempts: {file_path}")
253
  raise
254
 
255
+ # ============================================================================
256
+ # Download helpers
257
+ # ============================================================================
258
+ @staticmethod
259
+ def get_filename_from_cd(content_disposition: Optional[str], default_name: str) -> str:
260
+ if content_disposition:
261
+ parts = content_disposition.split(';')
262
+ for part in parts:
263
+ if "filename=" in part:
264
+ return part.split("=")[1].strip().strip('"')
265
+ return default_name
 
266
 
267
+ def download_file(self, url: str, destination_folder: str, default_name: str):
268
+ try:
269
+ response = requests.get(url, headers=self.config.HEADERS, stream=True)
270
+ response.raise_for_status()
271
+ except requests.RequestException as e:
272
+ logger.error(f"Failed to download file from {url}: {e}")
273
+ return None
274
 
275
+ filename = self.get_filename_from_cd(response.headers.get('content-disposition'), default_name)
276
+ file_path = os.path.join(destination_folder, filename)
277
 
278
+ with open(file_path, 'wb') as file:
279
+ for chunk in response.iter_content(chunk_size=8192):
280
+ file.write(chunk)
 
 
 
 
281
 
282
+ logger.info(f"Download completed: {file_path}")
283
+ return file_path  # ★ now returns the path of the downloaded file
284
 
285
+ # ============================================================================
286
+ # (★Changed) Download → encrypt → upload → delete, one file at a time
287
+ # ============================================================================
288
+ def process_latest_files_one_by_one(self, version_data: dict, model_folder: str, encrypted_folder_name: str):
289
+ """
290
+ Download the latest version's files one at a time → encrypted upload → delete locally.
291
+ path_in_repo is based on "{encrypted_folder_name}/".
292
+ """
293
+ files = version_data.get("files", [])
294
+ for file_info in files:
295
+ download_url = file_info["downloadUrl"]
296
+ file_name = file_info["name"]
297
 
298
+ # Download
299
+ local_path = self.download_file(download_url, model_folder, file_name)
300
+ if not local_path or not os.path.exists(local_path):
301
+ logger.warning(f"Skip because file not found locally: {local_path}")
302
+ continue
303
 
304
+ # Encrypted upload
305
+ # e.g. "myModelName/filename"
306
+ in_repo_path = os.path.join(encrypted_folder_name, file_name)
307
+ self.upload_file_encrypted_one_by_one(local_path, repo_id=self.repo_ids['current'], path_in_repo=in_repo_path)
308
 
309
+ def process_images_one_by_one(self, version_list: list, model_folder: str, encrypted_folder_name: str):
310
+ """
311
+ Download all images one at a time → encrypted upload → delete.
312
+ path_in_repo is "{encrypted_folder_name}/images/".
313
+ """
314
+ images = []
315
+ for version in version_list:
316
+ for img_info in version.get("images", []):
317
+ images.append(img_info["url"])
318
 
319
+ for image_url in images:
320
+ image_name = image_url.split("/")[-1] + ".png"
321
+ local_path = os.path.join(model_folder, image_name)
322
 
323
+ # Download
324
+ try:
325
+ resp = requests.get(image_url, stream=True)
326
+ resp.raise_for_status()
327
+ with open(local_path, "wb") as f:
328
+ for chunk in resp.iter_content(chunk_size=8192):
329
+ f.write(chunk)
330
+ logger.info(f"Downloaded image: {local_path}")
331
+ except Exception as e:
332
+ logger.error(f"Error downloading image {image_url}: {e}")
333
+ continue
334
+
335
+ # Upload
336
+ in_repo_path = os.path.join(encrypted_folder_name, "images", image_name)
337
+ self.upload_file_encrypted_one_by_one(local_path, self.repo_ids['current'], in_repo_path)
338
+
339
+ def process_old_versions_one_by_one(self, version_list: list, model_folder: str, encrypted_folder_name: str):
340
  """
341
+ Download the files of old versions (index >= 1) one at a time → encrypted upload → delete.
342
+ path_in_repo is "{encrypted_folder_name}/old_versions/{versionID_orName}/filename".
 
343
  """
344
+ if len(version_list) <= 1:
345
+ return
346
+
347
+ for old_version in version_list[1:]:
348
+ # どんな名前でフォルダを区別するか(バージョンIDやバージョン名など)
349
+ version_id_or_name = str(old_version.get("id", "old_ver"))
350
+ files = old_version.get("files", [])
351
+ for file_info in files:
352
+ download_url = file_info["downloadUrl"]
353
+ file_name = file_info["name"]
354
+
355
+ # ダウンロード
356
+ local_path = self.download_file(download_url, model_folder, file_name)
357
+ if not local_path or not os.path.exists(local_path):
358
+ logger.warning(f"Skip because file not found locally: {local_path}")
359
+ continue
360
+
361
+ # 暗号化アップロード
362
+ in_repo_path = os.path.join(
363
+ encrypted_folder_name,
364
+ "old_versions",
365
+ version_id_or_name,
366
+ file_name
367
+ )
368
+ self.upload_file_encrypted_one_by_one(local_path, self.repo_ids['current'], in_repo_path)
369
+
370
+ # ============================================================================
371
+ # HTML & model_info.json は軽量なので一括DL→アップロードでもOK
372
+ # ============================================================================
373
+ def save_html_content(self, url: str, folder: str):
374
+ try:
375
+ response = requests.get(url)
376
+ response.raise_for_status()
377
+ html_path = os.path.join(folder, os.path.basename(folder) + ".html")
378
+ with open(html_path, 'w', encoding='utf-8') as file:
379
+ file.write(response.text)
380
+ return html_path
381
+ except Exception as e:
382
+ logger.error(f"Error saving HTML content for URL {url}: {e}")
383
+ return None
384
+
385
+ def save_model_info(self, model_info: dict, folder: str):
386
+ json_path = os.path.join(folder, "model_info.json")
387
+ try:
388
+ with open(json_path, "w", encoding="utf-8") as file:
389
+ json.dump(model_info, file, indent=2)
390
+ return json_path
391
+ except Exception as e:
392
+ logger.error(f"Error saving model_info.json: {e}")
393
+ return None
394
+
395
+ # ============================================================================
396
+ # model_list.log
397
+ # ============================================================================
398
+ def read_model_list(self):
399
  model_list = {}
400
  try:
401
  with open(self.config.LIST_FILE, "r", encoding="utf-8") as f:
 
407
  if len(parts) == 2:
408
  stored_id, stored_url = parts
409
  model_list[stored_id] = stored_url
 
410
  except Exception as e:
411
  logger.error(f"Failed to read model list: {e}")
412
+ return model_list
413
 
414
  def process_model(self, model_url: str):
415
+ """Process the given model URL (download → upload → delete files one at a time)"""
416
  try:
417
  model_id = model_url.rstrip("/").split("/")[-1]
418
  model_info = self.get_model_info(model_id)
419
+ if not model_info:
420
+ logger.error(f"No model_info returned for {model_id}")
421
+ return
422
+
423
  latest_version = model_info.get("modelVersions", [])[0]
424
  model_file = next(
425
+ (file for file in latest_version.get("files", []) if file.get("type") == "Model"),
426
  None
427
  )
428
  if model_file:
429
+ latest_filename = model_file["name"]
430
  folder = os.path.splitext(latest_filename)[0]
431
  else:
432
+ # If there is no file with type=Model, fall back to the first file's name for the folder name
433
  first_file = latest_version["files"][0]
434
+ latest_filename = first_file["name"]
435
  folder = os.path.splitext(latest_filename)[0]
436
+ logger.warning(f"No 'Model' type file found for {model_id}. Using first file's name.")
437
+
438
+ # Create a temporary local folder
439
  os.makedirs(folder, exist_ok=True)
440
+
441
+ # Duplicate check (read model_list.log and skip if modelpage_name is already present)
442
  model_list = self.read_model_list()
443
+ modelpage_name = model_info.get("name", f"Model_{model_id}")
 
 
 
 
 
 
444
  if modelpage_name in model_list.values():
445
+ logger.info(f"Model '{modelpage_name}' already in model_list. Skipping.")
446
+ # return  # return here if desired
447
+
448
+ # HTML and model_info are small, so save them locally first and then encrypt/upload them as single files
449
+ html_path = self.save_html_content(self.config.URLS["modelPage"] + str(model_id), folder)
450
+ json_path = self.save_model_info(model_info, folder)
451
+
452
+ # Encrypted upload (HTML, JSON, etc.)
453
+ # Example: stored as "{folder}/model_info.json" on HF
454
+ if html_path and os.path.exists(html_path):
455
+ in_repo_path = os.path.join(folder, os.path.basename(html_path))
456
+ self.upload_file_encrypted_one_by_one(html_path, self.repo_ids['current'], in_repo_path)
457
+
458
+ if json_path and os.path.exists(json_path):
459
+ in_repo_path = os.path.join(folder, "model_info.json")
460
+ self.upload_file_encrypted_one_by_one(json_path, self.repo_ids['current'], in_repo_path)
461
+
462
+ # Upload the latest version one file at a time
463
+ self.process_latest_files_one_by_one(latest_version, folder, folder)
464
+
465
+ # Upload images one file at a time
466
+ self.process_images_one_by_one(model_info["modelVersions"], folder, folder)
467
+
468
+ # Upload old versions one file at a time
469
+ self.process_old_versions_one_by_one(model_info["modelVersions"], folder, folder)
470
+
471
+ # The folder is mostly empty by now, but delete it just in case
472
  if os.path.exists(folder):
473
  shutil.rmtree(folder)
474
+
475
+ # Finally, append to model_list.log ("modelpage_name: HF URL")
476
+ # Files are now encrypted individually rather than per folder, so use "folder" as the root name for now
477
+ # Top-level folder URL on Hugging Face:
478
+ # https://huggingface.co/REPO_ID/tree/main/folder
479
+ model_hf_url = f"https://huggingface.co/{self.repo_ids['current']}/tree/main/{folder}"
480
+ with open(self.config.LIST_FILE, "a", encoding="utf-8") as f:
481
+ f.write(f"{modelpage_name}: {model_hf_url}\n")
482
+
483
  except Exception as e:
484
  logger.error(f"Unexpected error processing model ({model_url}): {e}")
485
 
486
 
487
  async def crawl(self):
488
+ """Loop that checks for new models and processes them one at a time"""
489
  while True:
490
  try:
491
  login(token=self.config.HUGGINGFACE_API_KEY, add_to_git_credential=True)
492
 
493
+ # Download the latest model_list.log & civitai_backup.log
494
  model_list_path = hf_hub_download(repo_id=self.repo_ids['model_list'], filename=self.config.LIST_FILE)
495
  shutil.copyfile(model_list_path, f"./{self.config.LIST_FILE}")
496
 
497
  local_file_path = hf_hub_download(repo_id=self.repo_ids["log"], filename=self.config.LOG_FILE)
498
  shutil.copyfile(local_file_path, f"./{self.config.LOG_FILE}")
499
 
500
+ # Read civitai_backup.log
501
  with open(self.config.LOG_FILE, "r", encoding="utf-8") as file:
502
  lines = file.read().splitlines()
503
  old_models = json.loads(lines[0]) if len(lines) > 0 else []
504
  self.repo_ids["current"] = lines[1] if len(lines) > 1 else ""
505
 
506
+ # Check for new models
507
  response = requests.get(self.config.URLS["latest"], headers=self.config.HEADERS)
508
  response.raise_for_status()
509
  latest_models = response.json().get("items", [])
 
516
  logger.info(f"New models found: {new_models}")
517
  model_id = new_models[0]
518
 
519
+ # Up to 5 attempts
520
  for attempt in range(1, 6):
521
  try:
522
  self.process_model(f"{self.config.URLS['modelId']}{model_id}")
 
528
  else:
529
  await asyncio.sleep(2)
530
  else:
531
+ # No new models → update & upload backup.log
532
  with open(self.config.LOG_FILE, "w", encoding="utf-8") as f:
533
  f.write(json.dumps(latest_model_ids) + "\n")
534
  f.write(f"{self.repo_ids['current']}\n")
535
  logger.info(f"Updated log file: {self.config.LOG_FILE}")
536
 
537
+ self.upload_file_raw(self.config.LOG_FILE, self.repo_ids["log"], self.config.LOG_FILE)
 
 
 
 
538
  logger.info("Uploaded log file to repository (unencrypted).")
539
 
540
  logger.info("No new models found.")
541
  await asyncio.sleep(60)
542
  continue
543
 
544
+ # Add the successfully processed model to old_models → update backup.log
545
  old_models.append(model_id)
 
 
546
  with open(self.config.LOG_FILE, "w", encoding="utf-8") as f:
547
  f.write(json.dumps(old_models) + "\n")
548
  f.write(f"{self.repo_ids['current']}\n")
549
  logger.info(f"Updated log file with new model ID: {model_id}")
550
 
551
+ # Upload the log & model_list.log
552
+ self.upload_file_raw(self.config.LOG_FILE, self.repo_ids["log"], self.config.LOG_FILE)
553
+ self.upload_file_raw(self.config.LIST_FILE, self.repo_ids["model_list"], self.config.LIST_FILE)
 
 
 
 
554
 
555
  except Exception as e:
556
  logger.error(f"Error during crawling: {e}")
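Note on the rclone setup this commit relies on: setup_rclone_conf() base64-decodes the RCLONE_CONF_BASE64 secret into .rclone_config/rclone.conf and points RCLONE_CONFIG at it, and encrypt_with_rclone() then runs "rclone copy <local> cryptLocal:<name> -v", expecting the encrypted output to appear under /home/user/app/encrypted. The sketch below is one way such a secret might be produced; the exact rclone.conf contents (the crypt remote's target, filename_encryption, passwords) are assumptions, since the commit only shows that a remote named cryptLocal: must exist and where its encrypted output lands.

    # make_rclone_secret.py -- hypothetical helper, not part of this commit.
    # Assumed rclone.conf layout (values illustrative, passwords elided):
    #
    #   [cryptLocal]
    #   type = crypt
    #   remote = /home/user/app/encrypted   # should match Config.ENCRYPTED_DIR
    #   filename_encryption = standard      # setting mentioned by the old encrypt_with_rclone docstring
    #   password = ...
    #
    # The Space secret is simply the base64 of that file, mirroring the
    # base64.b64decode() call in setup_rclone_conf().
    import base64

    with open("rclone.conf", "rb") as f:            # your local rclone.conf
        secret = base64.b64encode(f.read()).decode()

    print(secret)  # paste this value into the RCLONE_CONF_BASE64 Space secret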