fix: 捕捉处理 ValueError 报错以及修改错字

This commit is contained in:
leantli 2024-05-08 22:26:35 +08:00
parent 57ee8dd63b
commit 43acde240b
5 changed files with 43 additions and 20 deletions

View File

@ -14,7 +14,9 @@ import aiofiles
from base.base_crawler import AbstractStore from base.base_crawler import AbstractStore
from tools import utils from tools import utils
from var import crawler_type_var from var import crawler_type_var
def calculatet_number_of_files(file_store_path: str) -> int:
def calculate_number_of_files(file_store_path: str) -> int:
"""计算数据保存文件的前部分排序数字,支持每次运行代码不写到同一个文件中 """计算数据保存文件的前部分排序数字,支持每次运行代码不写到同一个文件中
Args: Args:
file_store_path; file_store_path;
@ -23,11 +25,14 @@ def calculatet_number_of_files(file_store_path: str) -> int:
""" """
if not os.path.exists(file_store_path): if not os.path.exists(file_store_path):
return 1 return 1
try:
return max([int(file_name.split("_")[0])for file_name in os.listdir(file_store_path)])+1 return max([int(file_name.split("_")[0])for file_name in os.listdir(file_store_path)])+1
except ValueError:
return 1
class BiliCsvStoreImplement(AbstractStore): class BiliCsvStoreImplement(AbstractStore):
csv_store_path: str = "data/bilibili" csv_store_path: str = "data/bilibili"
file_count:int=calculatet_number_of_files(csv_store_path) file_count:int=calculate_number_of_files(csv_store_path)
def make_save_file_name(self, store_type: str) -> str: def make_save_file_name(self, store_type: str) -> str:
""" """
make save file name by store type make save file name by store type
@ -127,7 +132,7 @@ class BiliDbStoreImplement(AbstractStore):
class BiliJsonStoreImplement(AbstractStore): class BiliJsonStoreImplement(AbstractStore):
json_store_path: str = "data/bilibili" json_store_path: str = "data/bilibili"
lock = asyncio.Lock() lock = asyncio.Lock()
file_count:int=calculatet_number_of_files(json_store_path) file_count:int=calculate_number_of_files(json_store_path)
def make_save_file_name(self, store_type: str) -> str: def make_save_file_name(self, store_type: str) -> str:

View File

@ -14,7 +14,9 @@ import aiofiles
from base.base_crawler import AbstractStore from base.base_crawler import AbstractStore
from tools import utils from tools import utils
from var import crawler_type_var from var import crawler_type_var
def calculatet_number_of_files(file_store_path: str) -> int:
def calculate_number_of_files(file_store_path: str) -> int:
"""计算数据保存文件的前部分排序数字,支持每次运行代码不写到同一个文件中 """计算数据保存文件的前部分排序数字,支持每次运行代码不写到同一个文件中
Args: Args:
file_store_path; file_store_path;
@ -23,11 +25,14 @@ def calculatet_number_of_files(file_store_path: str) -> int:
""" """
if not os.path.exists(file_store_path): if not os.path.exists(file_store_path):
return 1 return 1
try:
return max([int(file_name.split("_")[0])for file_name in os.listdir(file_store_path)])+1 return max([int(file_name.split("_")[0])for file_name in os.listdir(file_store_path)])+1
except ValueError:
return 1
class DouyinCsvStoreImplement(AbstractStore): class DouyinCsvStoreImplement(AbstractStore):
csv_store_path: str = "data/douyin" csv_store_path: str = "data/douyin"
file_count:int=calculatet_number_of_files(csv_store_path) file_count:int=calculate_number_of_files(csv_store_path)
def make_save_file_name(self, store_type: str) -> str: def make_save_file_name(self, store_type: str) -> str:
""" """
@ -129,7 +134,7 @@ class DouyinDbStoreImplement(AbstractStore):
class DouyinJsonStoreImplement(AbstractStore): class DouyinJsonStoreImplement(AbstractStore):
json_store_path: str = "data/douyin" json_store_path: str = "data/douyin"
lock = asyncio.Lock() lock = asyncio.Lock()
file_count:int=calculatet_number_of_files(json_store_path) file_count:int=calculate_number_of_files(json_store_path)
def make_save_file_name(self, store_type: str) -> str: def make_save_file_name(self, store_type: str) -> str:
""" """

View File

@ -14,7 +14,9 @@ import aiofiles
from base.base_crawler import AbstractStore from base.base_crawler import AbstractStore
from tools import utils from tools import utils
from var import crawler_type_var from var import crawler_type_var
def calculatet_number_of_files(file_store_path: str) -> int:
def calculate_number_of_files(file_store_path: str) -> int:
"""计算数据保存文件的前部分排序数字,支持每次运行代码不写到同一个文件中 """计算数据保存文件的前部分排序数字,支持每次运行代码不写到同一个文件中
Args: Args:
file_store_path; file_store_path;
@ -23,12 +25,15 @@ def calculatet_number_of_files(file_store_path: str) -> int:
""" """
if not os.path.exists(file_store_path): if not os.path.exists(file_store_path):
return 1 return 1
try:
return max([int(file_name.split("_")[0])for file_name in os.listdir(file_store_path)])+1 return max([int(file_name.split("_")[0])for file_name in os.listdir(file_store_path)])+1
except ValueError:
return 1
class KuaishouCsvStoreImplement(AbstractStore): class KuaishouCsvStoreImplement(AbstractStore):
csv_store_path: str = "data/kuaishou" csv_store_path: str = "data/kuaishou"
file_count:int=calculatet_number_of_files(csv_store_path) file_count:int=calculate_number_of_files(csv_store_path)
def make_save_file_name(self, store_type: str) -> str: def make_save_file_name(self, store_type: str) -> str:
""" """
@ -128,7 +133,7 @@ class KuaishouDbStoreImplement(AbstractStore):
class KuaishouJsonStoreImplement(AbstractStore): class KuaishouJsonStoreImplement(AbstractStore):
json_store_path: str = "data/kuaishou" json_store_path: str = "data/kuaishou"
lock = asyncio.Lock() lock = asyncio.Lock()
file_count:int=calculatet_number_of_files(json_store_path) file_count:int=calculate_number_of_files(json_store_path)
def make_save_file_name(self, store_type: str) -> str: def make_save_file_name(self, store_type: str) -> str:

View File

@ -15,7 +15,8 @@ from base.base_crawler import AbstractStore
from tools import utils from tools import utils
from var import crawler_type_var from var import crawler_type_var
def calculatet_number_of_files(file_store_path: str) -> int:
def calculate_number_of_files(file_store_path: str) -> int:
"""计算数据保存文件的前部分排序数字,支持每次运行代码不写到同一个文件中 """计算数据保存文件的前部分排序数字,支持每次运行代码不写到同一个文件中
Args: Args:
file_store_path; file_store_path;
@ -24,12 +25,15 @@ def calculatet_number_of_files(file_store_path: str) -> int:
""" """
if not os.path.exists(file_store_path): if not os.path.exists(file_store_path):
return 1 return 1
try:
return max([int(file_name.split("_")[0])for file_name in os.listdir(file_store_path)])+1 return max([int(file_name.split("_")[0])for file_name in os.listdir(file_store_path)])+1
except ValueError:
return 1
class WeiboCsvStoreImplement(AbstractStore): class WeiboCsvStoreImplement(AbstractStore):
csv_store_path: str = "data/weibo" csv_store_path: str = "data/weibo"
file_count:int=calculatet_number_of_files(csv_store_path) file_count:int=calculate_number_of_files(csv_store_path)
def make_save_file_name(self, store_type: str) -> str: def make_save_file_name(self, store_type: str) -> str:
""" """
@ -130,7 +134,7 @@ class WeiboDbStoreImplement(AbstractStore):
class WeiboJsonStoreImplement(AbstractStore): class WeiboJsonStoreImplement(AbstractStore):
json_store_path: str = "data/weibo" json_store_path: str = "data/weibo"
lock = asyncio.Lock() lock = asyncio.Lock()
file_count:int=calculatet_number_of_files(json_store_path) file_count:int=calculate_number_of_files(json_store_path)
def make_save_file_name(self, store_type: str) -> str: def make_save_file_name(self, store_type: str) -> str:

View File

@ -15,7 +15,8 @@ from base.base_crawler import AbstractStore
from tools import utils from tools import utils
from var import crawler_type_var from var import crawler_type_var
def calculatet_number_of_files(file_store_path: str) -> int:
def calculate_number_of_files(file_store_path: str) -> int:
"""计算数据保存文件的前部分排序数字,支持每次运行代码不写到同一个文件中 """计算数据保存文件的前部分排序数字,支持每次运行代码不写到同一个文件中
Args: Args:
file_store_path; file_store_path;
@ -24,12 +25,15 @@ def calculatet_number_of_files(file_store_path: str) -> int:
""" """
if not os.path.exists(file_store_path): if not os.path.exists(file_store_path):
return 1 return 1
try:
return max([int(file_name.split("_")[0])for file_name in os.listdir(file_store_path)])+1 return max([int(file_name.split("_")[0])for file_name in os.listdir(file_store_path)])+1
except ValueError:
return 1
class XhsCsvStoreImplement(AbstractStore): class XhsCsvStoreImplement(AbstractStore):
csv_store_path: str = "data/xhs" csv_store_path: str = "data/xhs"
file_count:int=calculatet_number_of_files(csv_store_path) file_count:int=calculate_number_of_files(csv_store_path)
def make_save_file_name(self, store_type: str) -> str: def make_save_file_name(self, store_type: str) -> str:
""" """
@ -159,7 +163,7 @@ class XhsDbStoreImplement(AbstractStore):
class XhsJsonStoreImplement(AbstractStore): class XhsJsonStoreImplement(AbstractStore):
json_store_path: str = "data/xhs" json_store_path: str = "data/xhs"
lock = asyncio.Lock() lock = asyncio.Lock()
file_count:int=calculatet_number_of_files(json_store_path) file_count:int=calculate_number_of_files(json_store_path)
def make_save_file_name(self, store_type: str) -> str: def make_save_file_name(self, store_type: str) -> str:
""" """