# Track, per category, how many items had an empty value and which titles
# those items carried.
def count_add(home, title):
    """Record one empty-value occurrence for category ``home``.

    Increments the counter stored under ``home`` in the module-level
    ``null_cnt_dict`` and appends ``title`` to the list stored under
    ``home`` in the module-level ``null_value_dict``.

    Args:
        home: Category key; must already be present in both dicts.
        title: Title of the item whose value was empty.

    Raises:
        KeyError: If ``home`` is not a key of the dict being updated.
    """
    # Both dicts are only mutated in place (never rebound), so no ``global``
    # declaration is required to reach them from here.
    null_cnt_dict[home] += 1
    null_value_dict[home].append(title)
# Dump the empty-value statistics to a file when the program finishes.
def cnt_null_print():
    """Write the empty-value statistics to ``./520a_com/cnt_null.txt``.

    The file is overwritten with ``str(null_cnt_dict)`` followed by
    ``str(null_value_dict)``, each on its own line, encoded as UTF-8.
    The output directory is created first if it does not exist yet.
    """
    import os  # local import so this function does not rely on file-level imports

    out_dir = "./520a_com/"
    # Without this, open() raises FileNotFoundError when the directory is missing.
    os.makedirs(out_dir, exist_ok=True)
    # Plain "w" is sufficient: the file is only written, never read back.
    with open(out_dir + "cnt_null.txt", "w", encoding="utf-8") as fp:
        # Newline-terminate each dump so the two dicts do not run together.
        fp.write(str(null_cnt_dict) + "\n")
        fp.write(str(null_value_dict) + "\n")
def init_null_trackers(homes):
    """Build fresh empty-value trackers for the given categories.

    Args:
        homes: Iterable of category keys.

    Returns:
        A ``(counts, titles)`` tuple: ``counts`` maps every key to ``0`` and
        ``titles`` maps every key to its own, independent empty list.
    """
    homes = list(homes)  # iterated twice below, so materialize one-shot iterables
    counts = dict.fromkeys(homes, 0)
    # dict.fromkeys(homes, []) would store the SAME list object under every
    # key, so a title appended for one category would appear under all of them.
    titles = {home: [] for home in homes}
    return counts, titles


if __name__ == '__main__':
    # The 10 category names.
    home_list = ["zonghe", "liaotian", "sijiao", "xianxia", "yuehui",
                 "xingxiang", "paishe", "wanhui", "qita", "nvsheng"]
    # Module-level trackers: empty-value count and the titles of the
    # empty-value items, keyed by category.
    null_cnt_dict, null_value_dict = init_null_trackers(home_list)
    # Page count for each category list (presumably in the same order as
    # home_list -- confirm against the code that consumes it).
    page_list = [47, 15, 11, 5, 9, 5, 4, 2, 23, 27]
解释一下:
此代码是一个爬虫程序的一部分:定义了两个 dict 类型的全局变量,分别保存 home_list 中每个分类下值为空的 item 的个数,以及这些空值 item 的 title 列表。
用法:
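在 `if __name__ == '__main__':` 下定义的变量本身就是模块级全局变量,函数里可以直接读取,也可以原地修改(例如 `d[key] = value`、`lst.append(x)`);只有当函数内部需要对变量名本身重新赋值时,才必须先在函数里用 global 关键字声明一下。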



