diff --git a/readme.md b/readme.md deleted file mode 100644 index 60f7544..0000000 --- a/readme.md +++ /dev/null @@ -1,116 +0,0 @@ -# B站关注清理工具 - Scripts 版 - -> 一键命令运行全流程:`python source/scripts/run_pipeline.py` - -python source/scripts/run_pipeline.py --input-json source/resources/export_uids_test5.json - -本工具包含7个步骤的完整流水线: - -1. 抓取视频标题 -2. 分批AI分析 -3. 生成保留关注报告 -4. 生成取关UID列表 -5. 按首字母排序 -6. 提取分组信息 -7. 删除最近10条标题 - -## 快速开始 - -```powershell -# 完整流程(推荐) -python source/scripts/run_pipeline.py - -# 速度优先 -python source/scripts/run_pipeline.py --workers 8 --batch-size 30 --sleep-seconds 0 - -# 试跑30个UP -python source/scripts/run_pipeline.py --max-ups 30 - -# 跳过抓取,使用已有标题报告 -python source/scripts/run_pipeline.py --skip-fetch - -# 跳过分析,仅生成产物 -python source/scripts/run_pipeline.py --skip-analyze - -# 跳过排序/分组/删除 -python source/scripts/run_pipeline.py --skip-sort --skip-group --skip-remove -``` - -## 输出文件 - -| 文件 | 说明 | -|------|------| -| `source/output/reports/1_up_titles_report.md` | 标题抓取报告 | -| `source/output/reports/2_up_analysis_full_auto.md` | AI分析报告(完整) | -| `source/output/reports/3_up_keep_follow_only.md` | 保留关注报告 | -| `source/output/uids/4_unfollow_mids_list.txt` | 取关UID列表 | -| `source/output/reports/5_sorted_up_analysis.md` | 按首字母排序报告 | -| `source/output/reports/6_group_info.md` | 提取分组信息报告 | -| `source/output/reports/7_no_titles.md` | 最终报告(删除最近10条) | - -## 常用参数 - -| 参数 | 默认值 | 说明 | -|------|--------|------| -| `--workers` | 6 | 并发请求数 | -| `--batch-size` | 20 | 每批分析条数 | -| `--max-ups` | 0(全部) | 限制处理UP数量 | -| `--split-size` | 100 | UID拆分大小 | -| `--sleep-seconds` | 0 | 任务间隔秒数 | - -### 跳过参数 - -| 参数 | 说明 | -|------|------| -| `--skip-fetch` | 跳过抓取阶段 | -| `--skip-analyze` | 跳过分析阶段 | -| `--skip-sort` | 跳过排序阶段 | -| `--skip-group` | 跳过提取分组阶段 | -| `--skip-remove` | 跳过删除最近10条阶段 | - -## 分步执行 - -### 步骤1:抓取标题 -```powershell -python source/scripts/analyze_up_content.py --skip-ai -``` - -### 步骤2:分批AI分析 -```powershell -python source/scripts/batch_ai_summary_from_report.py --run-all-batches -``` - -### 步骤3:生成保留关注报告 -```powershell -python source/scripts/extract_keep_follow_doc.py -``` - -### 步骤4:生成取关UID -```powershell -python source/scripts/extract_unfollow_list.py --format mid-only --split-size 100 -``` - -### 步骤5:按首字母排序 -```powershell -python source/scripts/sort_up_main.py -``` - -### 步骤6:提取分组信息 -```powershell -python source/scripts/extract_group_info.py -``` - -### 步骤7:删除最近10条标题 -```powershell -python source/scripts/remove_10content.py -``` - -## 先配置API - -编辑 [source/scripts/analyze_up_content.py](source/scripts/analyze_up_content.py) 顶部配置: - -```python -VOLCENGINE_API_KEY = "你的火山引擎API Key" -VOLCENGINE_MODEL = "deepseek-v3-1-terminus" -VOLCENGINE_BASE_URL = "https://ark.cn-beijing.volces.com/api/v3" -``` \ No newline at end of file diff --git a/source/.all_i_need/export_uids.json b/source/.all_i_need/export_uids.json deleted file mode 100644 index a7165af..0000000 --- a/source/.all_i_need/export_uids.json +++ /dev/null @@ -1 +0,0 @@ -[{"mid":1357612844,"name":"考研英语马天艺老师","tag":[]},{"mid":321583894,"name":"我是蓝同学啊","tag":["实力派"]},{"mid":439478093,"name":"中国食品报融媒体","tag":["纪录片","新闻"]},{"mid":1044673687,"name":"心理述","tag":[]},{"mid":62224043,"name":"栗之from一直夫妇","tag":[]},{"mid":1031543543,"name":"Java面试突击-Mic","tag":[]},{"mid":1481344732,"name":"我们都是社畜","tag":["准备取关"]},{"mid":475443398,"name":"黑毛羊驼","tag":["准备取关"]},{"mid":2026173074,"name":"温竣岩","tag":["准备取关"]},{"mid":1858861103,"name":"迷因水母","tag":["准备取关"]},{"mid":444728505,"name":"小狮日记","tag":["准备取关"]},{"mid":23947287,"name":"小约翰可汗","tag":["准备取关"]},{"mid":35807625,"name":"小凡今天出片了吗","tag":["准备取关"]},{"mid":23791195,"name":"科学透镜","tag":["准备取关"]},{"mid":111714204,"name":"胖胖地球君","tag":["准备取关"]},{"mid":1937308559,"name":"赛博食录","tag":["准备取关"]},{"mid":1587138171,"name":"为一放映室","tag":["准备取关"]},{"mid":440798355,"name":"狗性巧克力","tag":["准备取关"]},{"mid":33291981,"name":"脑洞部长","tag":["准备取关"]},{"mid":648113003,"name":"沈逸老师","tag":["准备取关"]},{"mid":241241407,"name":"第一颗思考的蝌蚪","tag":["准备取关"]},{"mid":2099983410,"name":"电子电工之家","tag":["准备取关"]},{"mid":11914415,"name":"严伯钧","tag":["准备取关"]},{"mid":436700803,"name":"天星教育官方号","tag":["准备取关"]},{"mid":3493282273299102,"name":"奇妙世界GPT","tag":["准备取关"]},{"mid":612593877,"name":"Python_子木","tag":["准备取关"]},{"mid":2125857107,"name":"李大可爱玩","tag":["准备取关"]},{"mid":40433405,"name":"科技狐","tag":["准备取关"]},{"mid":2000819931,"name":"中国国家地理","tag":["准备取关"]},{"mid":2053592854,"name":"造梦小懿","tag":["准备取关"]},{"mid":546189,"name":"小Q不是导盲犬","tag":["准备取关"]},{"mid":507448807,"name":"Beelief","tag":["准备取关"]},{"mid":607281655,"name":"Science科学杂志","tag":["准备取关"]},{"mid":505935166,"name":"语文作文菌","tag":["准备取关"]},{"mid":14524124,"name":"胡诌施佬","tag":["准备取关"]},{"mid":385200931,"name":"MappleZS","tag":["准备取关"]},{"mid":25876945,"name":"极客湾Geekerwan","tag":["准备取关"]},{"mid":669397302,"name":"ZiKa-玩机酷","tag":["准备取关"]},{"mid":1769820463,"name":"百电汇数码生活","tag":["准备取关"]},{"mid":1562896062,"name":"EYEZMAZEvideo","tag":["准备取关"]},{"mid":3493285194632125,"name":"原理视界","tag":["准备取关"]},{"mid":3493264275540254,"name":"单词鲨手","tag":["准备取关"]},{"mid":479424216,"name":"卡尼酱本人","tag":["准备取关"]},{"mid":604710494,"name":"长片短解","tag":["准备取关"]},{"mid":1016523517,"name":"科技公元","tag":["准备取关"]},{"mid":409109266,"name":"陨石张大福","tag":["准备取关"]},{"mid":1428318343,"name":"芸曦小手工","tag":["准备取关"]},{"mid":700817047,"name":"第一推动科普","tag":["准备取关"]},{"mid":1634586116,"name":"中国日报双语新闻","tag":["准备取关"]},{"mid":543931674,"name":"马力在知群","tag":["准备取关"]},{"mid":1590538073,"name":"今日搞钱信息差","tag":["准备取关"]},{"mid":1574721168,"name":"潘教授和Fodil聊口语","tag":["准备取关"]},{"mid":432752294,"name":"晓晨聊大学","tag":["准备取关"]},{"mid":15247078,"name":"小飞蛾好可爱","tag":["准备取关"]},{"mid":499889496,"name":"是爱丽丝_","tag":["准备取关"]},{"mid":506174440,"name":"异星探索","tag":["准备取关"]},{"mid":1784235102,"name":"算法大师兄","tag":["准备取关"]},{"mid":3494376355400290,"name":"DayDay常识","tag":["准备取关"]},{"mid":320819729,"name":"Jonathan彭玉印","tag":["准备取关"]},{"mid":1795221360,"name":"心情瓶中信","tag":["准备取关"]},{"mid":4848323,"name":"数字游牧人","tag":["准备取关"]},{"mid":495224316,"name":"一只萧包子","tag":["准备取关"]},{"mid":397109346,"name":"思维社","tag":["准备取关"]},{"mid":3493258518858434,"name":"西安交通大学沈杨书社","tag":["准备取关"]},{"mid":379247856,"name":"好奇心会社","tag":["准备取关"]},{"mid":32360194,"name":"当下频道","tag":["准备取关"]},{"mid":381653678,"name":"老板懂设计","tag":["准备取关"]},{"mid":393119260,"name":"轻玩科技-老肖","tag":["准备取关"]},{"mid":274928598,"name":"幻想奇术师","tag":["准备取关"]},{"mid":475656605,"name":"超时空采访","tag":["准备取关"]},{"mid":365212208,"name":"Albert英语研习社","tag":["准备取关"]},{"mid":26653094,"name":"Marina0826","tag":["准备取关"]},{"mid":474881660,"name":"英语Snow老师","tag":["准备取关"]},{"mid":3546378525477862,"name":"Joseph的机器","tag":["准备取关"]},{"mid":14484744,"name":"科学小视","tag":["准备取关"]},{"mid":35339643,"name":"超极黑科技","tag":["准备取关"]},{"mid":1747335,"name":"老着急的小两居","tag":["准备取关"]},{"mid":1263990139,"name":"机智朱马马","tag":["准备取关"]},{"mid":3493263038220393,"name":"陆玖无敌","tag":["准备取关"]},{"mid":252075192,"name":"迪哥有点愁","tag":["准备取关"]},{"mid":251642119,"name":"简单柑桔Rw","tag":["准备取关"]},{"mid":387412319,"name":"布白PPT","tag":["准备取关"]},{"mid":508455218,"name":"放羊人_论文指导","tag":["准备取关"]},{"mid":672614938,"name":"英文老师Tanner","tag":["准备取关"]},{"mid":1212367465,"name":"水电知识分享","tag":["准备取关"]},{"mid":3494374235179579,"name":"Blender地势坤","tag":["准备取关"]},{"mid":589747109,"name":"后期老毛","tag":["准备取关"]},{"mid":1025542770,"name":"口语提升训练基地","tag":["准备取关"]},{"mid":23770618,"name":"蛇十六","tag":["准备取关"]},{"mid":3494350482836026,"name":"大道只源","tag":["准备取关"]},{"mid":54091976,"name":"拾镹i","tag":["准备取关"]},{"mid":252028114,"name":"戴博士实验室","tag":["准备取关"]},{"mid":599449178,"name":"槽逻辑","tag":["准备取关"]},{"mid":20826656,"name":"糖果果的未来要发光","tag":["准备取关"]},{"mid":384317271,"name":"易展翅-求职小表姐","tag":["准备取关"]},{"mid":1715594148,"name":"offer锦鲤魏校长","tag":["准备取关"]},{"mid":3493127266503448,"name":"安妮的职场与生活","tag":["准备取关"]},{"mid":1767282898,"name":"探长说电影","tag":["准备取关"]},{"mid":487505057,"name":"池早是我","tag":["准备取关"]},{"mid":630874464,"name":"冷科普","tag":["准备取关"]},{"mid":1264711195,"name":"爱读书的豆豆","tag":["准备取关"]},{"mid":3537118481615036,"name":"琅琊阁之信息差","tag":["准备取关"]},{"mid":319358609,"name":"民族自强不息者","tag":["准备取关"]},{"mid":518742534,"name":"那边那个g蛋","tag":["准备取关"]},{"mid":385172962,"name":"我是阿朱吖","tag":["准备取关"]},{"mid":1999199378,"name":"不略-","tag":[]},{"mid":4401694,"name":"林亦LYi","tag":[]},{"mid":518619340,"name":"想开面包店的Ricky","tag":[]},{"mid":419109033,"name":"科普创世纪","tag":["纪录片","科普","特别关注"]},{"mid":44980991,"name":"会放羊的教书匠","tag":[]},{"mid":474803476,"name":"泡厨房的顾小胖","tag":[]},{"mid":629408291,"name":"今日常识练习","tag":[]},{"mid":2052851329,"name":"律师老韩","tag":[]},{"mid":525382468,"name":"人间放映厅","tag":[]},{"mid":3546595513600180,"name":"松哥打虎","tag":[]},{"mid":1475748134,"name":"精分英教谢尔盖","tag":[]},{"mid":295993972,"name":"爱鼓捣的邢志磊","tag":[]},{"mid":287591832,"name":"丁老师现代英语","tag":[]},{"mid":38061207,"name":"Git源宝","tag":["科普","学习","科技","CODEK"]},{"mid":509905775,"name":"燎结构","tag":[]},{"mid":476819048,"name":"Adam陈老丝","tag":[]},{"mid":21435789,"name":"Kiefan琪凡速写","tag":[]},{"mid":49746395,"name":"GenJi是真想教会你","tag":["特别关注"]},{"mid":419052321,"name":"羊小驼叔叔","tag":[]},{"mid":488218866,"name":"EnglishVista2023","tag":[]},{"mid":1725223092,"name":"科学内幕","tag":[]},{"mid":1067722283,"name":"CG快报","tag":["新闻","ACG"]},{"mid":3494360540777110,"name":"老师好我叫白鼠同学","tag":[]},{"mid":2114928296,"name":"麦说","tag":["科普"]},{"mid":174471602,"name":"阿右科普","tag":[]},{"mid":43584648,"name":"工科男孙老师","tag":["科普"]},{"mid":3493281113573620,"name":"OK语文","tag":[]},{"mid":1480366563,"name":"静止想象研究所","tag":[]},{"mid":3546590293789198,"name":"机械视界J","tag":[]},{"mid":17095888,"name":"Crossin的编程教室","tag":[]},{"mid":391831595,"name":"Rudy英语","tag":[]},{"mid":15862638,"name":"哈密瓜微课","tag":[]},{"mid":295100453,"name":"叶梅梅过家家","tag":[]},{"mid":1305776725,"name":"虎哥教英语","tag":[]},{"mid":3493283187657030,"name":"青衫图解数学","tag":[]},{"mid":25694274,"name":"小五只会一点点","tag":["科普"]},{"mid":14797570,"name":"葆二爺的读心术","tag":["科普"]},{"mid":20998925,"name":"英语何太急","tag":[]},{"mid":166828,"name":"机智的商业生活","tag":[]},{"mid":3546575620016315,"name":"阿鹏哥哥探结构","tag":[]},{"mid":451196839,"name":"专心种花兔","tag":["科普","新闻"]},{"mid":485163549,"name":"大胡子老师-Jesse","tag":[]},{"mid":13260671,"name":"张烟囱","tag":[]},{"mid":385126080,"name":"圆中的猫头鹰","tag":[]},{"mid":3546610074126569,"name":"每天一个最强大脑","tag":[]},{"mid":523603911,"name":"七哥论国际战略-","tag":[]},{"mid":298332602,"name":"亦申凌泽","tag":[]},{"mid":3461582166166488,"name":"识万物_","tag":["科普"]},{"mid":3537120815745590,"name":"精英论坛","tag":["科普","特别关注"]},{"mid":208300745,"name":"小猴哥技术美术","tag":[]},{"mid":489302782,"name":"AI视次方","tag":[]},{"mid":430385404,"name":"设计生听超哥说AI","tag":[]},{"mid":73674032,"name":"小草律师呀","tag":[]},{"mid":1500074803,"name":"一朝春暖花满城","tag":[]},{"mid":488313112,"name":"DcMona迪迪西西","tag":[]},{"mid":68134500,"name":"张大碗子","tag":[]},{"mid":1047158092,"name":"奇妙的世界QAQ","tag":[]},{"mid":3546571071293861,"name":"没事我梨姐","tag":["科普"]},{"mid":1246792669,"name":"勃哥只有一辆车","tag":[]},{"mid":621235564,"name":"涤生大数据","tag":[]},{"mid":124806013,"name":"愚知乐","tag":[]},{"mid":26055664,"name":"张宝塔啊","tag":[]},{"mid":441631812,"name":"咕Job工作室","tag":[]},{"mid":243680430,"name":"金泽每日搞钱信息差","tag":["科普"]},{"mid":601300995,"name":"Mrs腊月小九","tag":[]},{"mid":108526737,"name":"法师马马","tag":[]},{"mid":2100151539,"name":"小义子小","tag":["科普"]},{"mid":3461566464789457,"name":"设计师一修","tag":[]},{"mid":3546603229023143,"name":"舒小车日常","tag":[]},{"mid":628054609,"name":"晶姐职说","tag":[]},{"mid":1749224369,"name":"老司机观察","tag":[]},{"mid":3493133887211865,"name":"环球-论坛记","tag":[]},{"mid":56300844,"name":"张小米粒的简单生活","tag":[]},{"mid":35639011,"name":"余扬捷老师","tag":["科普"]},{"mid":255139870,"name":"柴猫小巫师","tag":[]},{"mid":1029508158,"name":"单位晋升","tag":[]},{"mid":23244398,"name":"三口草莓","tag":[]},{"mid":18562567,"name":"mason英语","tag":[]},{"mid":3493291869866324,"name":"全球宏观FICC","tag":[]},{"mid":3494354444355822,"name":"顾老师商业定位","tag":[]},{"mid":594840903,"name":"带带政治理论","tag":[]},{"mid":3546593938639500,"name":"罗胖罗振宇","tag":[]},{"mid":1618054,"name":"商业启示","tag":[]},{"mid":1098004826,"name":"刘丫丫跳舞","tag":[]},{"mid":94577838,"name":"拾叁生意经","tag":[]},{"mid":21849780,"name":"每日搞钱信息差","tag":[]},{"mid":35105301,"name":"法号观芷","tag":[]},{"mid":423319981,"name":"刘沣学长","tag":[]},{"mid":413276548,"name":"城事堂","tag":[]},{"mid":693654968,"name":"罗罗说说Rossi","tag":[]},{"mid":3493111665789758,"name":"纪录频道Nature","tag":["纪录片"]},{"mid":15520342,"name":"创投学社","tag":[]},{"mid":535023713,"name":"是德科技","tag":["科普"]},{"mid":1321969690,"name":"五道口工匠","tag":[]},{"mid":11555160,"name":"空天同学","tag":[]},{"mid":224560702,"name":"鱼不溜秋","tag":[]},{"mid":17789957,"name":"Amethyst_Star","tag":[]},{"mid":2073606358,"name":"wuli_东哥物理","tag":[]},{"mid":531692757,"name":"初中学业业委会主任","tag":[]},{"mid":1823466601,"name":"English-Power","tag":[]},{"mid":524899324,"name":"小八的数分和高代","tag":[]},{"mid":3546637651675315,"name":"锁匠钥匙批发零售","tag":[]},{"mid":583967110,"name":"今日原理","tag":["科普"]},{"mid":3494361759221832,"name":"财富人生看个性签名拍","tag":[]},{"mid":1640934198,"name":"NewCH-娇哥","tag":[]},{"mid":383587023,"name":"复利的奇迹ETF基金理财","tag":[]},{"mid":1710911403,"name":"刘楠Talia","tag":[]},{"mid":14342271,"name":"遇真纪事","tag":[]},{"mid":2031277323,"name":"科普见闻录","tag":[]},{"mid":520814591,"name":"谈三圈","tag":["科普","科技"]},{"mid":603430640,"name":"涛哥讲期权","tag":["科普"]},{"mid":3546568640694467,"name":"还得是跳爷","tag":["科普"]},{"mid":3546571882892263,"name":"轻玩科技智造家","tag":["科普"]},{"mid":3493140684081255,"name":"新惕姆自动化","tag":["科普"]},{"mid":28535841,"name":"每天都在学东西","tag":["科普"]},{"mid":1741962246,"name":"IT界扛霸子","tag":["学习"]},{"mid":145611758,"name":"游点物理","tag":["科普"]},{"mid":26742637,"name":"方法自习室","tag":["特别关注","科普"]},{"mid":418201063,"name":"影子跟读","tag":["科普","学习"]},{"mid":673614860,"name":"卢麒元的视角","tag":["科普"]},{"mid":1304346514,"name":"张琦大大","tag":["科普"]},{"mid":283389925,"name":"每天一篇外刊精读","tag":["学习"]},{"mid":107861587,"name":"AI大模型全栈","tag":["学习"]},{"mid":1954415159,"name":"TED官方","tag":["科普","学习"]},{"mid":415500574,"name":"B站金融学院","tag":["新闻","科普"]},{"mid":3461575868418125,"name":"哔哩大学政治学院","tag":["科普","学习","新闻"]},{"mid":400258300,"name":"币圈五五开","tag":["科普","信息差"]},{"mid":3546655775263285,"name":"电商小菜鸡呀","tag":["科普","纪录片","信息差"]},{"mid":3546622413768823,"name":"懂一些人情世故","tag":["科普"]},{"mid":102617968,"name":"Amor东山再起","tag":["科普","学习"]},{"mid":217475729,"name":"CSDN","tag":["科普"]},{"mid":685526816,"name":"老魏机械百科","tag":["科普"]},{"mid":3494364269513335,"name":"重案纪实","tag":["学习"]},{"mid":185549749,"name":"bili_185549749","tag":["科普"]},{"mid":502539494,"name":"洞察人性缘","tag":["科普"]},{"mid":73528331,"name":"摩斯神探","tag":["科普"]},{"mid":14004258,"name":"奥德修斯的绳索","tag":["科普"]},{"mid":3546604311152974,"name":"销售学习知识库","tag":["科普"]},{"mid":510767506,"name":"单口喜剧侯智元","tag":["科普"]},{"mid":1169142430,"name":"传播学刘阳","tag":["科普"]},{"mid":1633547470,"name":"林少华林老师","tag":["科普"]},{"mid":1315696773,"name":"韩潇老师讲诗词","tag":["科普"]},{"mid":15741969,"name":"像素范","tag":["学习"]},{"mid":3461579156752681,"name":"常军谈心理","tag":["学习"]},{"mid":238171381,"name":"TED原声英语演讲","tag":["学习"]},{"mid":3546627212052911,"name":"天涯神贴YYDS","tag":["科普"]},{"mid":3546670222543152,"name":"富贵儿很正经","tag":["科普"]},{"mid":448165099,"name":"军情D7处","tag":["新闻"]},{"mid":2233213,"name":"星话大白","tag":["新闻"]},{"mid":1975692083,"name":"军情巴朗","tag":["新闻"]},{"mid":542824499,"name":"军情阿丁","tag":["新闻"]},{"mid":16243913,"name":"Solo审判日","tag":["新闻"]},{"mid":3494354016537425,"name":"A电子爱好者老牛","tag":["科普"]},{"mid":316627722,"name":"世界见闻录","tag":["新闻"]},{"mid":14520423,"name":"传说中的挖掘机","tag":["科普"]},{"mid":3546613639284889,"name":"五点半FiveThirty","tag":["科普"]},{"mid":1944667205,"name":"雷峰网","tag":["新闻"]},{"mid":1433031509,"name":"bili_1433031509","tag":["新闻"]},{"mid":3546662922357356,"name":"52赫兹实验室","tag":["科普","科技"]},{"mid":355155672,"name":"费洛凡","tag":["科普"]},{"mid":506786489,"name":"启眸运动","tag":["科普"]},{"mid":3546387566299549,"name":"达利奥利奥","tag":["科普"]},{"mid":496787581,"name":"SiliconPlanet","tag":["科普","新闻"]},{"mid":3546643550963789,"name":"尝试学习常识","tag":["科普"]},{"mid":515457626,"name":"原版外刊精读社","tag":["科普","学习"]},{"mid":510362725,"name":"赛雷话金","tag":["新闻","科普"]},{"mid":10698584,"name":"唠点历史","tag":["学习","科普","纪录片"]},{"mid":345339963,"name":"光城刺史","tag":["科普"]},{"mid":601612399,"name":"北京卫视档案","tag":["科普"]},{"mid":346563107,"name":"波士顿圆脸","tag":["新闻"]},{"mid":289189019,"name":"戏京同志","tag":["科普","新闻"]},{"mid":1593690059,"name":"李筠教授","tag":["科普"]},{"mid":382423121,"name":"白宫日记","tag":["科普"]},{"mid":600428973,"name":"周侃侃plus","tag":["学习"]},{"mid":430426421,"name":"燕三嘤嘤嘤","tag":["科普","乐子","新闻"]},{"mid":294262027,"name":"奔流映画","tag":["科普","科技"]},{"mid":923477,"name":"无骨者伊瓦尔","tag":["学习"]},{"mid":370982805,"name":"人与地球","tag":["科普"]},{"mid":408179496,"name":"环球地图","tag":["科普"]},{"mid":100785033,"name":"地球知识局","tag":["科普"]},{"mid":3493107370822154,"name":"穿透人性","tag":["科普","抽象派"]},{"mid":325848853,"name":"陇上姚明","tag":["科普","信息差"]},{"mid":22234926,"name":"认真的阿真","tag":["学习","科普"]},{"mid":735958,"name":"胖达粑粑","tag":["科普","学习"]},{"mid":442603088,"name":"三维地图看世界","tag":["科普","学习"]},{"mid":35162124,"name":"hum_hallelujah","tag":["科普","学习"]},{"mid":520819684,"name":"小Lin说","tag":["科普"]},{"mid":613408351,"name":"迷幻枸杞","tag":["科普","学习"]},{"mid":668794433,"name":"哈佛雪梨","tag":["科普"]},{"mid":3546390949005555,"name":"一大杯芋圆啵啵","tag":["学习"]},{"mid":276983285,"name":"你今天学地理了吗","tag":["科普","学习"]},{"mid":34107188,"name":"丘丘的数学之旅","tag":["学习"]},{"mid":385168742,"name":"春霖老师","tag":["学习"]},{"mid":413049762,"name":"高中数学蔡德锦","tag":["学习"]},{"mid":18509044,"name":"Mk数学杀手","tag":["学习"]},{"mid":22511468,"name":"小龙阿卡纳","tag":["学习"]},{"mid":673420980,"name":"韩秀云讲经济","tag":["科普"]},{"mid":478548163,"name":"睡前小声比比","tag":["科普"]},{"mid":563396855,"name":"爱喝碳水的瓦冰","tag":["科普"]},{"mid":357669580,"name":"萌萌战队","tag":["学习","科普"]},{"mid":319176130,"name":"圣诞节南瓜灯","tag":["科普","学习"]},{"mid":3546672034482563,"name":"TED官方科普","tag":["科普"]},{"mid":250584301,"name":"艾伦大大-","tag":["科普"]},{"mid":27022750,"name":"子疯实验室","tag":["纪录片","科普"]},{"mid":485234598,"name":"Emily每日英语听读","tag":["学习"]},{"mid":1555665460,"name":"YouTube政治学院","tag":["纪录片","科普","学习"]},{"mid":1408106571,"name":"柏年说","tag":["科普"]},{"mid":6776617,"name":"安东星老6","tag":["实力派","科普","科技","硬核整活"]},{"mid":30947486,"name":"小椰子专栏","tag":["乐子"]},{"mid":18024796,"name":"橙子登登-","tag":["科普"]},{"mid":2097311046,"name":"产经破壁机","tag":["科普"]},{"mid":296399504,"name":"虎嗅视频","tag":["科普"]},{"mid":3493262402783627,"name":"馋逗儿-","tag":["实力派","纪录片","科普","硬核整活"]},{"mid":487881722,"name":"村花熙熙","tag":["科普"]},{"mid":108709998,"name":"易本正经傅师兄","tag":["科普"]},{"mid":11146869,"name":"黑猫星球","tag":["科普","新闻"]},{"mid":37950062,"name":"硬核资本论","tag":["新闻"]},{"mid":481434238,"name":"Ele实验室","tag":["科普","学习"]},{"mid":437840703,"name":"荒野追剧探长","tag":["纪录片"]},{"mid":598464467,"name":"苏星河牛通","tag":["科普"]},{"mid":611584263,"name":"芯机叔Talk","tag":["科普"]},{"mid":1957113893,"name":"AI光影社","tag":["科普"]},{"mid":496261881,"name":"CNSA中国航天文化","tag":["科普","新闻"]},{"mid":1735615743,"name":"东部战区","tag":["新闻","菌嗜"]},{"mid":687410230,"name":"HexUp","tag":["科普","特别关注","学习"]},{"mid":46880349,"name":"啥都会一点的研究生","tag":["科普","学习"]},{"mid":245869,"name":"尚在天国EX","tag":["科普"]},{"mid":1094131374,"name":"哔哩哔哩超级科学晚","tag":["科普"]},{"mid":28378491,"name":"家有神兽","tag":["学习","菌嗜"]},{"mid":1875198641,"name":"SpaceLens","tag":["科普","学习","菌嗜"]},{"mid":248466804,"name":"百岁山不甜pro","tag":["科普","学习","菌嗜"]},{"mid":1915842925,"name":"一只野飞友","tag":["科普","菌嗜"]},{"mid":67079745,"name":"玄离199","tag":["学习","科普","科技","CODEK"]},{"mid":379889714,"name":"边亮_网络安全","tag":["学习","科普"]},{"mid":14583962,"name":"思维实验室","tag":["科普","学习"]},{"mid":412499953,"name":"Github开源软件-阿轩","tag":["科普","科技","学习"]},{"mid":395188578,"name":"爱上半导体","tag":["科普","科技","学习"]},{"mid":21612876,"name":"电力小子-gtetgeg","tag":["硬核整活"]},{"mid":3494363613104182,"name":"每日英语一点通","tag":["学习"]},{"mid":1980386544,"name":"1号档案馆","tag":["科普","学习"]},{"mid":661141753,"name":"框框老师课堂","tag":["学习","特别关注"]},{"mid":151155077,"name":"天才赵德柱","tag":["科普","科技"]},{"mid":679619486,"name":"国仁全球大学堂","tag":["科普","学习"]},{"mid":52699256,"name":"S亦和","tag":["科普"]},{"mid":67907025,"name":"猴博士爱讲课","tag":["学习"]},{"mid":72270557,"name":"芳斯塔芙","tag":["科普"]},{"mid":3546588897086207,"name":"轻玩科技社","tag":["实力派"]},{"mid":32229576,"name":"算法猪立业","tag":["科普","学习"]},{"mid":3493079826828072,"name":"豌克思","tag":["学习","科普","纪录片","硬核整活","实力派"]},{"mid":96639395,"name":"学院派Academia","tag":["科普"]},{"mid":1606682745,"name":"米哥专升本","tag":["学习"]},{"mid":1534642081,"name":"学习强国","tag":["纪录片","新闻","学习"]},{"mid":21778636,"name":"中国日报","tag":["科普","新闻","学习"]},{"mid":3546752795805831,"name":"国家应急广播","tag":["新闻"]},{"mid":703186600,"name":"麻薯波比呀","tag":["科普","新闻"]},{"mid":415200463,"name":"军迷天花板杰哥","tag":["科普","菌嗜"]},{"mid":33683045,"name":"张召忠","tag":["科普","菌嗜"]},{"mid":569956690,"name":"CGTN","tag":["科普","新闻"]},{"mid":407045223,"name":"二次元的中科院物理所","tag":["科普","新闻","学习"]},{"mid":20259914,"name":"稚晖君","tag":["实力派","科普","科技","硬核整活","学习"]},{"mid":942755,"name":"迷影至下Filmlast","tag":["科普"]},{"mid":205631797,"name":"果壳","tag":["科普"]},{"mid":11270116,"name":"酒痴东梦","tag":["科普","学习"]},{"mid":629101318,"name":"远方的青木","tag":["科普","学习"]},{"mid":321691718,"name":"中国日报网","tag":["科普","新闻"]},{"mid":520097839,"name":"发烧好了呢","tag":["科普","学习"]},{"mid":326427334,"name":"星球研究所","tag":["科普","学习"]},{"mid":452161580,"name":"战忽智库","tag":["学习"]},{"mid":508171633,"name":"思考的熊兄","tag":["学习","特别关注"]},{"mid":26108626,"name":"赛雷三分钟","tag":["科普"]},{"mid":3493089637305282,"name":"中国国家地理景观","tag":["科普"]},{"mid":364654971,"name":"中国国家地理频道","tag":["科普"]},{"mid":335850246,"name":"玉渊谭天","tag":["科普"]},{"mid":519872016,"name":"历史调研室","tag":["科普"]},{"mid":522262428,"name":"不严肃问题研究室","tag":["科普","新闻"]},{"mid":612194373,"name":"沙盘上的战争","tag":["科普","学习"]},{"mid":1839363891,"name":"图解价值","tag":["科普","学习"]},{"mid":743226,"name":"花岗岩工作室","tag":["科普"]},{"mid":374377163,"name":"全球档案馆","tag":["科普","学习"]},{"mid":213845897,"name":"天才简史","tag":["科普"]},{"mid":88461692,"name":"3Blue1Brown","tag":["科普"]},{"mid":94727573,"name":"科学认识论","tag":["科普"]},{"mid":693447092,"name":"超离谱科技","tag":["科普","学习"]},{"mid":65564239,"name":"IT咖啡馆","tag":["科普","科技","学习","CODEK"]},{"mid":323713206,"name":"螳螂捕财","tag":["科普","新闻"]},{"mid":1070859358,"name":"军事博物馆","tag":["科普","学习"]},{"mid":1705267972,"name":"百哥讲网络","tag":["科普","学习"]},{"mid":388576777,"name":"英语的平行世界","tag":["学习"]},{"mid":43219807,"name":"毒舌的南瓜","tag":["科普"]},{"mid":11021614,"name":"我是瑞斯拜","tag":["科普","学习"]},{"mid":70217434,"name":"妈妈不用担心我的英语","tag":["学习"]},{"mid":477671072,"name":"至书-山居五年","tag":["科普","学习"]},{"mid":3494374304385046,"name":"海林A读书","tag":["科普","学习"]},{"mid":390186534,"name":"蜀霞客","tag":["纪录片","科普"]},{"mid":272107494,"name":"7小时解锁新技能","tag":["学习"]},{"mid":514924891,"name":"王德峰","tag":["科普","学习"]},{"mid":435931665,"name":"军武志","tag":["科普","新闻"]},{"mid":1140672573,"name":"小王Albert","tag":["新闻"]},{"mid":14871346,"name":"硬件茶谈","tag":["科普"]},{"mid":3546730316433889,"name":"雷电欧姆","tag":[]},{"mid":622986240,"name":"阿吞啊","tag":["新闻"]},{"mid":69837092,"name":"战争研究所","tag":["科普","新闻"]},{"mid":664086886,"name":"鹏城杰森","tag":["科普","新闻","菌嗜"]},{"mid":439028291,"name":"WU_Eric","tag":["学习"]},{"mid":193147738,"name":"幻海航行","tag":["科普","纪录片"]},{"mid":1773278179,"name":"科幻小凌","tag":["科普"]},{"mid":26606146,"name":"底层原理","tag":["科普"]},{"mid":38598226,"name":"医学科普联盟","tag":["科普"]},{"mid":3546656899336980,"name":"冯无畏","tag":["科普"]},{"mid":430856432,"name":"囚水不盐","tag":["科普"]},{"mid":2039176794,"name":"奇异脑博士","tag":["科普"]},{"mid":485356818,"name":"医学边界","tag":["科普"]},{"mid":67141499,"name":"大漠叔叔","tag":[]},{"mid":1270632901,"name":"我是思屹","tag":["纪录片","科普"]},{"mid":103261012,"name":"歪设长","tag":[]},{"mid":353816116,"name":"大猫超人英语工作室","tag":[]},{"mid":457983079,"name":"math也是柠檬精","tag":["学习"]},{"mid":239688446,"name":"硬核的HeyMatt","tag":["特别关注"]},{"mid":3546821062298417,"name":"框框老师课堂_资料号","tag":["学习"]},{"mid":391930545,"name":"Maki的完美算术教室","tag":["科普","学习"]},{"mid":1632276842,"name":"Ayumu爱讲数学","tag":["科普","特别关注"]},{"mid":27415479,"name":"Victius","tag":["科普"]},{"mid":266765166,"name":"漫士沉思录","tag":["科普"]},{"mid":22072692,"name":"喜欢数学的ayumu","tag":["学习"]},{"mid":394252131,"name":"绩满满","tag":["学习"]},{"mid":320203065,"name":"深蓝学院","tag":[]},{"mid":11023521,"name":"letmedream","tag":["科普","创意","艺术"]},{"mid":446630510,"name":"道长的思维铺子","tag":[]},{"mid":318331,"name":"ForgotFun","tag":["科普","社会"]},{"mid":285027361,"name":"爱研究的小阿楠","tag":[]},{"mid":114366178,"name":"从0开始数","tag":[]},{"mid":1575688490,"name":"CLS同学","tag":[]},{"mid":108753930,"name":"降星驰","tag":["科普","零食关注"]},{"mid":95256449,"name":"遇见狂神说","tag":[]},{"mid":203983793,"name":"Linux中国","tag":[]},{"mid":3546647317448859,"name":"NotOnlySuccess","tag":[]},{"mid":39665558,"name":"偶尔有点小迷糊","tag":[]},{"mid":34786453,"name":"康文昌","tag":[]},{"mid":302417610,"name":"尚硅谷","tag":[]},{"mid":518514395,"name":"今天晚放学","tag":[]},{"mid":322683393,"name":"丘比特的帽子","tag":["学习"]},{"mid":519266610,"name":"会AI的哈利波特","tag":[]},{"mid":1271953419,"name":"大模型微调","tag":[]},{"mid":1283676771,"name":"不加醋的氨基酸","tag":["学习"]},{"mid":367678065,"name":"费曼学徒冬瓜","tag":["学习"]},{"mid":386643440,"name":"我是7788_","tag":["学习"]},{"mid":1965933018,"name":"Python大本营","tag":[]},{"mid":470624011,"name":"动物治愈馆","tag":[]},{"mid":3546583482239276,"name":"故史里","tag":[]},{"mid":3493281239402498,"name":"大发程序员","tag":["学习"]},{"mid":3546886008998093,"name":"雍俊海","tag":["学习"]},{"mid":1791942573,"name":"徐宿的经验书","tag":[]},{"mid":35868098,"name":"长河劫","tag":["科普"]},{"mid":2056649750,"name":"哔哩大学计算机学院","tag":[]},{"mid":30646569,"name":"华语辩坛老友赛","tag":[]},{"mid":157504840,"name":"郝英俊和易道云","tag":[]},{"mid":146668655,"name":"千锋教育","tag":[]},{"mid":1475977561,"name":"今天也要努力哦o","tag":[]},{"mid":2016676980,"name":"北京艾雷克斯企业管理","tag":[]},{"mid":12890453,"name":"程序员鱼皮","tag":[]},{"mid":1209319826,"name":"小锅聊攻防","tag":[]},{"mid":1577562848,"name":"Python万能胶","tag":[]},{"mid":1335124945,"name":"百万亚瑟王x","tag":[]},{"mid":37974444,"name":"黑马程序员","tag":[]},{"mid":416206486,"name":"千锋python","tag":[]},{"mid":3546768587360615,"name":"乌昂大叔","tag":[]},{"mid":129860965,"name":"记忆宫殿宁梓亦","tag":[]},{"mid":371846699,"name":"图灵的猫","tag":[]},{"mid":3493129770502861,"name":"社恐内向昭爷爷","tag":[]},{"mid":1780480185,"name":"飓多多StormCrew","tag":[]},{"mid":472747194,"name":"巫师财经","tag":["科普","社会"]},{"mid":18706318,"name":"龙女之声","tag":[]},{"mid":1809567655,"name":"何大爷课堂","tag":[]},{"mid":1253030023,"name":"一身剑气荡江","tag":["现实"]},{"mid":8157388,"name":"幼稚园大队长丨","tag":[]},{"mid":245645656,"name":"码农高天","tag":["科普"]},{"mid":1871365234,"name":"大问题Dialectic","tag":["科普","特别关注"]},{"mid":1937416537,"name":"陈一枝你坐下","tag":["特别关注"]},{"mid":593251783,"name":"本子在隔壁","tag":[]},{"mid":102584256,"name":"浪花姜","tag":[]},{"mid":1060544882,"name":"东洋雪莲","tag":[]},{"mid":1335713025,"name":"知了解压萌物","tag":[]},{"mid":3546617688886097,"name":"多奇探秘","tag":[]},{"mid":302188068,"name":"小白debug","tag":[]},{"mid":16433002,"name":"隔壁的程序员老王","tag":["学习"]},{"mid":3546752326044595,"name":"啊光小哥哥","tag":[]},{"mid":3546613148551357,"name":"Josh老师和菜鸟小编","tag":[]},{"mid":570064,"name":"章北海official","tag":[]},{"mid":652060948,"name":"童晶老师","tag":[]},{"mid":2116071253,"name":"高考蓝哥","tag":[]},{"mid":97407861,"name":"狼肉好吃","tag":[]},{"mid":3546908731639909,"name":"第三眼日记","tag":[]},{"mid":673835935,"name":"码农的荒岛求生","tag":[]},{"mid":3546693165386233,"name":"挽风的技术教程","tag":[]},{"mid":102438649,"name":"GeekHour","tag":[]},{"mid":325864133,"name":"飞天闪客","tag":["CODEK"]},{"mid":278761367,"name":"唯一讲述者","tag":[]},{"mid":130763764,"name":"三太子敖丙","tag":[]},{"mid":162183,"name":"原子能","tag":[]},{"mid":544451485,"name":"吾爱破解论坛","tag":[]},{"mid":323588182,"name":"毒舌电影编辑部","tag":[]},{"mid":281120100,"name":"我是阿众","tag":["程序员","科普","技术"]},{"mid":668097429,"name":"轩辕的编程宇宙","tag":[]},{"mid":486989780,"name":"老麦的工具库","tag":[]},{"mid":316183842,"name":"技术爬爬虾","tag":["学习","科普","技术"]},{"mid":412704776,"name":"不高兴就喝水","tag":[]},{"mid":3494353494345852,"name":"南哥教恋爱","tag":[]},{"mid":298711658,"name":"路克纪录","tag":[]},{"mid":327247876,"name":"技术蛋老师","tag":[]},{"mid":96609715,"name":"小黑屋的貘_mo","tag":[]},{"mid":623448014,"name":"TIANYU2FM","tag":[]},{"mid":264869770,"name":"丰言疯话","tag":["学习"]},{"mid":3493075691243699,"name":"老戴Donald","tag":["学习"]},{"mid":478849208,"name":"樊登读书上海运营中心","tag":[]},{"mid":3546945542948869,"name":"_美梦守护者_","tag":["现实"]},{"mid":1464874349,"name":"打工人代表巍哥","tag":["科普","信息差"]},{"mid":1679822121,"name":"大唐怪奇笔记","tag":[]},{"mid":19414347,"name":"卡皮巴拉大王拼豆版","tag":[]},{"mid":3493127314737312,"name":"鲶鱼夜话","tag":[]},{"mid":702915816,"name":"云顶数模","tag":[]},{"mid":3546638236781247,"name":"小Lin竖着说","tag":["科普"]},{"mid":15397613,"name":"张云翼_like","tag":["学习"]},{"mid":372313671,"name":"Ross-Ning","tag":[]},{"mid":482867012,"name":"吴悠讲编程","tag":[]},{"mid":3546969421122388,"name":"梦见过彩虹","tag":[]},{"mid":522976477,"name":"Eden说产品","tag":[]},{"mid":1669112799,"name":"产品老兵杰哥","tag":[]},{"mid":3546590214097572,"name":"秀明说","tag":[]},{"mid":3546937947064751,"name":"清华豆师","tag":[]},{"mid":489640651,"name":"新石器公园","tag":["科普"]},{"mid":2100388025,"name":"宇宙世界0","tag":[]},{"mid":254463269,"name":"毕导","tag":[]},{"mid":673779175,"name":"量子位","tag":[]},{"mid":491691175,"name":"C哥聊科技","tag":[]},{"mid":1049078946,"name":"Chris老师即食英语","tag":[]},{"mid":501642082,"name":"萧一白呀","tag":[]},{"mid":3690987316578579,"name":"计算机大白呀","tag":[]},{"mid":458165375,"name":"哔哩哔哩课堂","tag":[]},{"mid":3546662484052067,"name":"娃娃卡哇伊捏","tag":[]},{"mid":481153145,"name":"进击的铁木君","tag":[]},{"mid":1159873315,"name":"大豪夫妇","tag":[]},{"mid":258944527,"name":"陶渊xiao明","tag":[]},{"mid":1037607360,"name":"YOMeeDoll小企鹅窝窝","tag":[]},{"mid":3546857594685834,"name":"陈木白啊","tag":[]},{"mid":1508100119,"name":"零7大王","tag":[]},{"mid":37858284,"name":"网络小白_Uncle城","tag":["技术","科技"]},{"mid":301388587,"name":"Shiki实验室","tag":["学习"]},{"mid":504164656,"name":"科学辟谣","tag":["科普"]},{"mid":111900,"name":"Toka-MK","tag":["零食关注"]},{"mid":1112568165,"name":"汤山老王","tag":[]},{"mid":3690978099595618,"name":"小老板营业中","tag":[]},{"mid":572139281,"name":"鲁本芭娜娜banana","tag":["学习"]},{"mid":3546830396721763,"name":"第四种黑猩猩CHIMP","tag":[]},{"mid":1815948385,"name":"马克的技术工作坊","tag":["学习"]},{"mid":495257108,"name":"小林爱研究","tag":["学习"]},{"mid":385047828,"name":"认知便利店M","tag":["学习"]},{"mid":319526152,"name":"超级TANG-","tag":["科普"]},{"mid":1732848825,"name":"耿同学讲故事","tag":[]},{"mid":276483261,"name":"DeeparchWorks","tag":["程序员","科普","技术"]},{"mid":503577829,"name":"海盗CG","tag":[]},{"mid":3546606469123022,"name":"一觉醒来发生啥","tag":["信息差"]},{"mid":491155397,"name":"信息差猎手","tag":["信息差"]},{"mid":1297136809,"name":"宝藏女嗨沈幼楚","tag":[]},{"mid":270471501,"name":"文文黎","tag":[]},{"mid":106685726,"name":"二二酸酸","tag":["科普"]},{"mid":31341757,"name":"捭阖哗","tag":["特别关注","科普"]},{"mid":490494088,"name":"动动枪DongDongGun","tag":[]},{"mid":1511660367,"name":"西一昂叨叨版","tag":[]}] \ No newline at end of file diff --git a/source/.all_i_need/export_uids.txt b/source/.all_i_need/export_uids.txt deleted file mode 100644 index 1251370..0000000 --- a/source/.all_i_need/export_uids.txt +++ /dev/null @@ -1 +0,0 @@ -1357612844,321583894,439478093,1044673687,62224043,1031543543,1481344732,475443398,2026173074,1858861103,444728505,23947287,35807625,23791195,111714204,1937308559,1587138171,440798355,33291981,648113003,241241407,2099983410,11914415,436700803,3493282273299102,612593877,2125857107,40433405,2000819931,2053592854,546189,507448807,607281655,505935166,14524124,385200931,25876945,669397302,1769820463,1562896062,3493285194632125,3493264275540254,479424216,604710494,1016523517,409109266,1428318343,700817047,1634586116,543931674,1590538073,1574721168,432752294,15247078,499889496,506174440,1784235102,3494376355400290,320819729,1795221360,4848323,495224316,397109346,3493258518858434,379247856,32360194,381653678,393119260,274928598,475656605,365212208,26653094,474881660,3546378525477862,14484744,35339643,1747335,1263990139,3493263038220393,252075192,251642119,387412319,508455218,672614938,1212367465,3494374235179579,589747109,1025542770,23770618,3494350482836026,54091976,252028114,599449178,20826656,384317271,1715594148,3493127266503448,1767282898,487505057,630874464,1264711195,3537118481615036,319358609,518742534,385172962,1999199378,4401694,518619340,419109033,44980991,474803476,629408291,2052851329,525382468,3546595513600180,1475748134,295993972,287591832,38061207,509905775,476819048,21435789,49746395,419052321,488218866,1725223092,1067722283,3494360540777110,2114928296,174471602,43584648,3493281113573620,1480366563,3546590293789198,17095888,391831595,15862638,295100453,1305776725,3493283187657030,25694274,14797570,20998925,166828,3546575620016315,451196839,485163549,13260671,385126080,3546610074126569,523603911,298332602,3461582166166488,3537120815745590,208300745,489302782,430385404,73674032,1500074803,488313112,68134500,1047158092,3546571071293861,1246792669,621235564,124806013,26055664,441631812,243680430,601300995,108526737,2100151539,3461566464789457,3546603229023143,628054609,1749224369,3493133887211865,56300844,35639011,255139870,1029508158,23244398,18562567,3493291869866324,3494354444355822,594840903,3546593938639500,1618054,1098004826,94577838,21849780,35105301,423319981,413276548,693654968,3493111665789758,15520342,535023713,1321969690,11555160,224560702,17789957,2073606358,531692757,1823466601,524899324,3546637651675315,583967110,3494361759221832,1640934198,383587023,1710911403,14342271,2031277323,520814591,603430640,3546568640694467,3546571882892263,3493140684081255,28535841,1741962246,145611758,26742637,418201063,673614860,1304346514,283389925,107861587,1954415159,415500574,3461575868418125,400258300,3546655775263285,3546622413768823,102617968,217475729,685526816,3494364269513335,185549749,502539494,73528331,14004258,3546604311152974,510767506,1169142430,1633547470,1315696773,15741969,3461579156752681,238171381,3546627212052911,3546670222543152,448165099,2233213,1975692083,542824499,16243913,3494354016537425,316627722,14520423,3546613639284889,1944667205,1433031509,3546662922357356,355155672,506786489,3546387566299549,496787581,3546643550963789,515457626,510362725,10698584,345339963,601612399,346563107,289189019,1593690059,382423121,600428973,430426421,294262027,923477,370982805,408179496,100785033,3493107370822154,325848853,22234926,735958,442603088,35162124,520819684,613408351,668794433,3546390949005555,276983285,34107188,385168742,413049762,18509044,22511468,673420980,478548163,563396855,357669580,319176130,3546672034482563,250584301,27022750,485234598,1555665460,1408106571,6776617,30947486,18024796,2097311046,296399504,3493262402783627,487881722,108709998,11146869,37950062,481434238,437840703,598464467,611584263,1957113893,496261881,1735615743,687410230,46880349,245869,1094131374,28378491,1875198641,248466804,1915842925,67079745,379889714,14583962,412499953,395188578,21612876,3494363613104182,1980386544,661141753,151155077,679619486,52699256,67907025,72270557,3546588897086207,32229576,3493079826828072,96639395,1606682745,1534642081,21778636,3546752795805831,703186600,415200463,33683045,569956690,407045223,20259914,942755,205631797,11270116,629101318,321691718,520097839,326427334,452161580,508171633,26108626,3493089637305282,364654971,335850246,519872016,522262428,612194373,1839363891,743226,374377163,213845897,88461692,94727573,693447092,65564239,323713206,1070859358,1705267972,388576777,43219807,11021614,70217434,477671072,3494374304385046,390186534,272107494,514924891,435931665,1140672573,14871346,3546730316433889,622986240,69837092,664086886,439028291,193147738,1773278179,26606146,38598226,3546656899336980,430856432,2039176794,485356818,67141499,1270632901,103261012,353816116,457983079,239688446,3546821062298417,391930545,1632276842,27415479,266765166,22072692,394252131,320203065,11023521,446630510,318331,285027361,114366178,1575688490,108753930,95256449,203983793,3546647317448859,39665558,34786453,302417610,518514395,322683393,519266610,1271953419,1283676771,367678065,386643440,1965933018,470624011,3546583482239276,3493281239402498,3546886008998093,1791942573,35868098,2056649750,30646569,157504840,146668655,1475977561,2016676980,12890453,1209319826,1577562848,1335124945,37974444,416206486,3546768587360615,129860965,371846699,3493129770502861,1780480185,472747194,18706318,1809567655,1253030023,8157388,245645656,1871365234,1937416537,593251783,102584256,1060544882,1335713025,3546617688886097,302188068,16433002,3546752326044595,3546613148551357,570064,652060948,2116071253,97407861,3546908731639909,673835935,3546693165386233,102438649,325864133,278761367,130763764,162183,544451485,323588182,281120100,668097429,486989780,316183842,412704776,3494353494345852,298711658,327247876,96609715,623448014,264869770,3493075691243699,478849208,3546945542948869,1464874349,1679822121,19414347,3493127314737312,702915816,3546638236781247,15397613,372313671,482867012,3546969421122388,522976477,1669112799,3546590214097572,3546937947064751,489640651,2100388025,254463269,673779175,491691175,1049078946,501642082,3690987316578579,458165375,3546662484052067,481153145,1159873315,258944527,1037607360,3546857594685834,1508100119,37858284,301388587,504164656,111900,1112568165,3690978099595618,572139281,3546830396721763,1815948385,495257108,385047828,319526152,1732848825,276483261,503577829,3546606469123022,491155397,1297136809,270471501,106685726,31341757,490494088,1511660367 \ No newline at end of file diff --git a/source/.all_i_need/unfollow_mids_list.txt b/source/.all_i_need/unfollow_mids_list.txt deleted file mode 100644 index d906f72..0000000 --- a/source/.all_i_need/unfollow_mids_list.txt +++ /dev/null @@ -1 +0,0 @@ -1044673687,1481344732,1858861103,444728505,23947287,35807625,111714204,1587138171,440798355,33291981,11914415,436700803,3493282273299102,612593877,2125857107,2000819931,507448807,505935166,14524124,385200931,1769820463,1562896062,3493285194632125,3493264275540254,479424216,604710494,1016523517,1428318343,700817047,543931674,1590538073,1574721168,432752294,3494376355400290,1795221360,4848323,495224316,3493258518858434,379247856,32360194,381653678,274928598,475656605,365212208,3546378525477862,35339643,1747335,1263990139,3493263038220393,251642119,387412319,1212367465,589747109,1025542770,23770618,3494350482836026,54091976,599449178,1715594148,3493127266503448,1767282898,487505057,630874464,1264711195,3537118481615036,319358609,518742534,385172962,4401694,474803476,525382468,3546595513600180,295993972,476819048,21435789,1725223092,2114928296,174471602,1480366563,17095888,295100453,1305776725,25694274,14797570,166828,385126080,3461582166166488,3537120815745590,489302782,73674032,1500074803,68134500,1047158092,3546571071293861,124806013,26055664,441631812,243680430,601300995,108526737,2100151539,3546603229023143,1749224369,3493133887211865,56300844,255139870,23244398,3493291869866324,3494354444355822,3546593938639500,1098004826,94577838,21849780,35105301,423319981,535023713,224560702,3546637651675315,3494361759221832,1640934198,1710911403,14342271,2031277323,603430640,3546568640694467,1741962246,1304346514,283389925,3461575868418125,3546622413768823,3494364269513335,185549749,502539494,73528331,510767506,3461579156752681,238171381,3546627212052911,448165099,1975692083,542824499,16243913,3494354016537425,316627722,1944667205,1433031509,3546387566299549,496787581,3546643550963789,382423121,600428973,430426421,325848853,735958,35162124,668794433,3546390949005555,478548163,3546672034482563,250584301,485234598,1555665460,6776617,108709998,437840703,28378491,67079745,1606682745,629101318,452161580,3493089637305282,374377163,213845897,323713206,272107494,622986240,1773278179,3546656899336980,67141499,318331,285027361,114366178,203983793,1283676771,1965933018,470624011,3546583482239276,3493281239402498,1475977561,2016676980,1209319826,1335124945,416206486,129860965,1780480185,1809567655,245645656,1937416537,1060544882,1335713025,3546617688886097,3546752326044595,3546613148551357,652060948,2116071253,97407861,3546908731639909,3546693165386233,278761367,323588182,486989780,3494353494345852,96609715,264869770,478849208,1679822121,19414347,3493127314737312,702915816,482867012,3546969421122388,3546590214097572,501642082,458165375,3546662484052067,481153145,1159873315,3546857594685834,1508100119,111900,1732848825,3546606469123022,106685726,490494088,1511660367 \ No newline at end of file diff --git a/source/.all_i_need/unfollow_mids_list_1.txt b/source/.all_i_need/unfollow_mids_list_1.txt deleted file mode 100644 index 33a6fcf..0000000 --- a/source/.all_i_need/unfollow_mids_list_1.txt +++ /dev/null @@ -1 +0,0 @@ -1044673687,1481344732,1858861103,444728505,23947287,35807625,111714204,1587138171,440798355,33291981,11914415,436700803,3493282273299102,612593877,2125857107,2000819931,507448807,505935166,14524124,385200931,1769820463,1562896062,3493285194632125,3493264275540254,479424216,604710494,1016523517,1428318343,700817047,543931674,1590538073,1574721168,432752294,3494376355400290,1795221360,4848323,495224316,3493258518858434,379247856,32360194,381653678,274928598,475656605,365212208,3546378525477862,35339643,1747335,1263990139,3493263038220393,251642119,387412319,1212367465,589747109,1025542770,23770618,3494350482836026,54091976,599449178,1715594148,3493127266503448,1767282898,487505057,630874464,1264711195,3537118481615036,319358609,518742534,385172962,4401694,474803476,525382468,3546595513600180,295993972,476819048,21435789,1725223092,2114928296,174471602,1480366563,17095888,295100453,1305776725,25694274,14797570,166828,385126080,3461582166166488,3537120815745590,489302782,73674032,1500074803,68134500,1047158092,3546571071293861,124806013,26055664,441631812,243680430,601300995,108526737 \ No newline at end of file diff --git a/source/.all_i_need/unfollow_mids_list_2.txt b/source/.all_i_need/unfollow_mids_list_2.txt deleted file mode 100644 index 30ec6a1..0000000 --- a/source/.all_i_need/unfollow_mids_list_2.txt +++ /dev/null @@ -1 +0,0 @@ -2100151539,3546603229023143,1749224369,3493133887211865,56300844,255139870,23244398,3493291869866324,3494354444355822,3546593938639500,1098004826,94577838,21849780,35105301,423319981,535023713,224560702,3546637651675315,3494361759221832,1640934198,1710911403,14342271,2031277323,603430640,3546568640694467,1741962246,1304346514,283389925,3461575868418125,3546622413768823,3494364269513335,185549749,502539494,73528331,510767506,3461579156752681,238171381,3546627212052911,448165099,1975692083,542824499,16243913,3494354016537425,316627722,1944667205,1433031509,3546387566299549,496787581,3546643550963789,382423121,600428973,430426421,325848853,735958,35162124,668794433,3546390949005555,478548163,3546672034482563,250584301,485234598,1555665460,6776617,108709998,437840703,28378491,67079745,1606682745,629101318,452161580,3493089637305282,374377163,213845897,323713206,272107494,622986240,1773278179,3546656899336980,67141499,318331,285027361,114366178,203983793,1283676771,1965933018,470624011,3546583482239276,3493281239402498,1475977561,2016676980,1209319826,1335124945,416206486,129860965,1780480185,1809567655,245645656,1937416537,1060544882,1335713025 \ No newline at end of file diff --git a/source/.all_i_need/unfollow_mids_list_3.txt b/source/.all_i_need/unfollow_mids_list_3.txt deleted file mode 100644 index 04a491c..0000000 --- a/source/.all_i_need/unfollow_mids_list_3.txt +++ /dev/null @@ -1 +0,0 @@ -3546617688886097,3546752326044595,3546613148551357,652060948,2116071253,97407861,3546908731639909,3546693165386233,278761367,323588182,486989780,3494353494345852,96609715,264869770,478849208,1679822121,19414347,3493127314737312,702915816,482867012,3546969421122388,3546590214097572,501642082,458165375,3546662484052067,481153145,1159873315,3546857594685834,1508100119,111900,1732848825,3546606469123022,106685726,490494088,1511660367 \ No newline at end of file diff --git a/source/.gitignore b/source/.gitignore deleted file mode 100644 index 89d3008..0000000 --- a/source/.gitignore +++ /dev/null @@ -1,91 +0,0 @@ -# 1. 忽略操作系统自动生成的文件 -.DS_Store -Thumbs.db -*.lnk - -# 2. 忽略编译/构建产物 -__pycache__/ -*.py[cod] -*$py.class -*.so -.Python -build/ -develop-eggs/ -dist/ -downloads/ -eggs/ -.eggs/ -lib/ -lib64/ -parts/ -sdist/ -var/ -wheels/ -*.egg-info/ -.installed.cfg -*.egg -MANIFEST - -# 3. 忽略IDE配置 -.vscode/ -.idea/ -*.swp -*.swo -*~ - -# 4. 忽略日志文件 -*.log -*.tmp -*.temp -*.md -source/all_i_need/ - - -# 5. 忽略敏感数据 -*.env -*.key -*.pem -*.cert -config.yaml -secrets/ - -# 6. 忽略大型媒体文件 -*.mp4 -*.mov -*.avi -*.wav -*.mp3 -*.zip -*.tar -*.gz -*.7z -*.rar - -# 7. 忽略数据分析/机器学习特有 -*.model -*.h5 -*.pkl -*.joblib -.ipynb_checkpoints/ - -# 8. 忽略你项目中的自动生成目录 -# 根据你的目录结构,忽略source/output/和source/reports/下的所有文件 -# 但保留目录结构本身(可以添加空的.gitkeep文件来保持空目录) -source/output/**/* -!source/output/.gitkeep -source/reports/**/* -!source/reports/.gitkeep -source/.note -source/.test_output/ -source/.note -source/.test_output/ -source/all_i_need/**/* -source/.*/ -source/all_i_need/**/*.txt -source/all_i_need/**/*.json -source/.all_i_need/export_uids.json -source/.all_i_need/export_uids.txt -source/.all_i_need/unfollow_mids_list_1.txt -source/.all_i_need/unfollow_mids_list_2.txt -source/.all_i_need/unfollow_mids_list_3.txt -source/.all_i_need/unfollow_mids_list.txt \ No newline at end of file diff --git a/source/output/uids/4_unfollow_mids_list.txt b/source/output/uids/4_unfollow_mids_list.txt deleted file mode 100644 index 4934e4f..0000000 --- a/source/output/uids/4_unfollow_mids_list.txt +++ /dev/null @@ -1 +0,0 @@ -321583894,439478093,1044673687,1031543543,1481344732 \ No newline at end of file diff --git a/source/output/uids/4_unfollow_mids_list_1.txt b/source/output/uids/4_unfollow_mids_list_1.txt deleted file mode 100644 index 4934e4f..0000000 --- a/source/output/uids/4_unfollow_mids_list_1.txt +++ /dev/null @@ -1 +0,0 @@ -321583894,439478093,1044673687,1031543543,1481344732 \ No newline at end of file diff --git a/source/output/uids/unfollow_mids_list.txt b/source/output/uids/unfollow_mids_list.txt deleted file mode 100644 index d906f72..0000000 --- a/source/output/uids/unfollow_mids_list.txt +++ /dev/null @@ -1 +0,0 @@ -1044673687,1481344732,1858861103,444728505,23947287,35807625,111714204,1587138171,440798355,33291981,11914415,436700803,3493282273299102,612593877,2125857107,2000819931,507448807,505935166,14524124,385200931,1769820463,1562896062,3493285194632125,3493264275540254,479424216,604710494,1016523517,1428318343,700817047,543931674,1590538073,1574721168,432752294,3494376355400290,1795221360,4848323,495224316,3493258518858434,379247856,32360194,381653678,274928598,475656605,365212208,3546378525477862,35339643,1747335,1263990139,3493263038220393,251642119,387412319,1212367465,589747109,1025542770,23770618,3494350482836026,54091976,599449178,1715594148,3493127266503448,1767282898,487505057,630874464,1264711195,3537118481615036,319358609,518742534,385172962,4401694,474803476,525382468,3546595513600180,295993972,476819048,21435789,1725223092,2114928296,174471602,1480366563,17095888,295100453,1305776725,25694274,14797570,166828,385126080,3461582166166488,3537120815745590,489302782,73674032,1500074803,68134500,1047158092,3546571071293861,124806013,26055664,441631812,243680430,601300995,108526737,2100151539,3546603229023143,1749224369,3493133887211865,56300844,255139870,23244398,3493291869866324,3494354444355822,3546593938639500,1098004826,94577838,21849780,35105301,423319981,535023713,224560702,3546637651675315,3494361759221832,1640934198,1710911403,14342271,2031277323,603430640,3546568640694467,1741962246,1304346514,283389925,3461575868418125,3546622413768823,3494364269513335,185549749,502539494,73528331,510767506,3461579156752681,238171381,3546627212052911,448165099,1975692083,542824499,16243913,3494354016537425,316627722,1944667205,1433031509,3546387566299549,496787581,3546643550963789,382423121,600428973,430426421,325848853,735958,35162124,668794433,3546390949005555,478548163,3546672034482563,250584301,485234598,1555665460,6776617,108709998,437840703,28378491,67079745,1606682745,629101318,452161580,3493089637305282,374377163,213845897,323713206,272107494,622986240,1773278179,3546656899336980,67141499,318331,285027361,114366178,203983793,1283676771,1965933018,470624011,3546583482239276,3493281239402498,1475977561,2016676980,1209319826,1335124945,416206486,129860965,1780480185,1809567655,245645656,1937416537,1060544882,1335713025,3546617688886097,3546752326044595,3546613148551357,652060948,2116071253,97407861,3546908731639909,3546693165386233,278761367,323588182,486989780,3494353494345852,96609715,264869770,478849208,1679822121,19414347,3493127314737312,702915816,482867012,3546969421122388,3546590214097572,501642082,458165375,3546662484052067,481153145,1159873315,3546857594685834,1508100119,111900,1732848825,3546606469123022,106685726,490494088,1511660367 \ No newline at end of file diff --git a/source/output/uids/unfollow_mids_list_1.txt b/source/output/uids/unfollow_mids_list_1.txt deleted file mode 100644 index 33a6fcf..0000000 --- a/source/output/uids/unfollow_mids_list_1.txt +++ /dev/null @@ -1 +0,0 @@ -1044673687,1481344732,1858861103,444728505,23947287,35807625,111714204,1587138171,440798355,33291981,11914415,436700803,3493282273299102,612593877,2125857107,2000819931,507448807,505935166,14524124,385200931,1769820463,1562896062,3493285194632125,3493264275540254,479424216,604710494,1016523517,1428318343,700817047,543931674,1590538073,1574721168,432752294,3494376355400290,1795221360,4848323,495224316,3493258518858434,379247856,32360194,381653678,274928598,475656605,365212208,3546378525477862,35339643,1747335,1263990139,3493263038220393,251642119,387412319,1212367465,589747109,1025542770,23770618,3494350482836026,54091976,599449178,1715594148,3493127266503448,1767282898,487505057,630874464,1264711195,3537118481615036,319358609,518742534,385172962,4401694,474803476,525382468,3546595513600180,295993972,476819048,21435789,1725223092,2114928296,174471602,1480366563,17095888,295100453,1305776725,25694274,14797570,166828,385126080,3461582166166488,3537120815745590,489302782,73674032,1500074803,68134500,1047158092,3546571071293861,124806013,26055664,441631812,243680430,601300995,108526737 \ No newline at end of file diff --git a/source/output/uids/unfollow_mids_list_2.txt b/source/output/uids/unfollow_mids_list_2.txt deleted file mode 100644 index 30ec6a1..0000000 --- a/source/output/uids/unfollow_mids_list_2.txt +++ /dev/null @@ -1 +0,0 @@ -2100151539,3546603229023143,1749224369,3493133887211865,56300844,255139870,23244398,3493291869866324,3494354444355822,3546593938639500,1098004826,94577838,21849780,35105301,423319981,535023713,224560702,3546637651675315,3494361759221832,1640934198,1710911403,14342271,2031277323,603430640,3546568640694467,1741962246,1304346514,283389925,3461575868418125,3546622413768823,3494364269513335,185549749,502539494,73528331,510767506,3461579156752681,238171381,3546627212052911,448165099,1975692083,542824499,16243913,3494354016537425,316627722,1944667205,1433031509,3546387566299549,496787581,3546643550963789,382423121,600428973,430426421,325848853,735958,35162124,668794433,3546390949005555,478548163,3546672034482563,250584301,485234598,1555665460,6776617,108709998,437840703,28378491,67079745,1606682745,629101318,452161580,3493089637305282,374377163,213845897,323713206,272107494,622986240,1773278179,3546656899336980,67141499,318331,285027361,114366178,203983793,1283676771,1965933018,470624011,3546583482239276,3493281239402498,1475977561,2016676980,1209319826,1335124945,416206486,129860965,1780480185,1809567655,245645656,1937416537,1060544882,1335713025 \ No newline at end of file diff --git a/source/output/uids/unfollow_mids_list_3.txt b/source/output/uids/unfollow_mids_list_3.txt deleted file mode 100644 index 04a491c..0000000 --- a/source/output/uids/unfollow_mids_list_3.txt +++ /dev/null @@ -1 +0,0 @@ -3546617688886097,3546752326044595,3546613148551357,652060948,2116071253,97407861,3546908731639909,3546693165386233,278761367,323588182,486989780,3494353494345852,96609715,264869770,478849208,1679822121,19414347,3493127314737312,702915816,482867012,3546969421122388,3546590214097572,501642082,458165375,3546662484052067,481153145,1159873315,3546857594685834,1508100119,111900,1732848825,3546606469123022,106685726,490494088,1511660367 \ No newline at end of file diff --git a/source/resources/export_uids.json b/source/resources/export_uids.json deleted file mode 100644 index a7165af..0000000 --- a/source/resources/export_uids.json +++ /dev/null @@ -1 +0,0 @@ -[{"mid":1357612844,"name":"考研英语马天艺老师","tag":[]},{"mid":321583894,"name":"我是蓝同学啊","tag":["实力派"]},{"mid":439478093,"name":"中国食品报融媒体","tag":["纪录片","新闻"]},{"mid":1044673687,"name":"心理述","tag":[]},{"mid":62224043,"name":"栗之from一直夫妇","tag":[]},{"mid":1031543543,"name":"Java面试突击-Mic","tag":[]},{"mid":1481344732,"name":"我们都是社畜","tag":["准备取关"]},{"mid":475443398,"name":"黑毛羊驼","tag":["准备取关"]},{"mid":2026173074,"name":"温竣岩","tag":["准备取关"]},{"mid":1858861103,"name":"迷因水母","tag":["准备取关"]},{"mid":444728505,"name":"小狮日记","tag":["准备取关"]},{"mid":23947287,"name":"小约翰可汗","tag":["准备取关"]},{"mid":35807625,"name":"小凡今天出片了吗","tag":["准备取关"]},{"mid":23791195,"name":"科学透镜","tag":["准备取关"]},{"mid":111714204,"name":"胖胖地球君","tag":["准备取关"]},{"mid":1937308559,"name":"赛博食录","tag":["准备取关"]},{"mid":1587138171,"name":"为一放映室","tag":["准备取关"]},{"mid":440798355,"name":"狗性巧克力","tag":["准备取关"]},{"mid":33291981,"name":"脑洞部长","tag":["准备取关"]},{"mid":648113003,"name":"沈逸老师","tag":["准备取关"]},{"mid":241241407,"name":"第一颗思考的蝌蚪","tag":["准备取关"]},{"mid":2099983410,"name":"电子电工之家","tag":["准备取关"]},{"mid":11914415,"name":"严伯钧","tag":["准备取关"]},{"mid":436700803,"name":"天星教育官方号","tag":["准备取关"]},{"mid":3493282273299102,"name":"奇妙世界GPT","tag":["准备取关"]},{"mid":612593877,"name":"Python_子木","tag":["准备取关"]},{"mid":2125857107,"name":"李大可爱玩","tag":["准备取关"]},{"mid":40433405,"name":"科技狐","tag":["准备取关"]},{"mid":2000819931,"name":"中国国家地理","tag":["准备取关"]},{"mid":2053592854,"name":"造梦小懿","tag":["准备取关"]},{"mid":546189,"name":"小Q不是导盲犬","tag":["准备取关"]},{"mid":507448807,"name":"Beelief","tag":["准备取关"]},{"mid":607281655,"name":"Science科学杂志","tag":["准备取关"]},{"mid":505935166,"name":"语文作文菌","tag":["准备取关"]},{"mid":14524124,"name":"胡诌施佬","tag":["准备取关"]},{"mid":385200931,"name":"MappleZS","tag":["准备取关"]},{"mid":25876945,"name":"极客湾Geekerwan","tag":["准备取关"]},{"mid":669397302,"name":"ZiKa-玩机酷","tag":["准备取关"]},{"mid":1769820463,"name":"百电汇数码生活","tag":["准备取关"]},{"mid":1562896062,"name":"EYEZMAZEvideo","tag":["准备取关"]},{"mid":3493285194632125,"name":"原理视界","tag":["准备取关"]},{"mid":3493264275540254,"name":"单词鲨手","tag":["准备取关"]},{"mid":479424216,"name":"卡尼酱本人","tag":["准备取关"]},{"mid":604710494,"name":"长片短解","tag":["准备取关"]},{"mid":1016523517,"name":"科技公元","tag":["准备取关"]},{"mid":409109266,"name":"陨石张大福","tag":["准备取关"]},{"mid":1428318343,"name":"芸曦小手工","tag":["准备取关"]},{"mid":700817047,"name":"第一推动科普","tag":["准备取关"]},{"mid":1634586116,"name":"中国日报双语新闻","tag":["准备取关"]},{"mid":543931674,"name":"马力在知群","tag":["准备取关"]},{"mid":1590538073,"name":"今日搞钱信息差","tag":["准备取关"]},{"mid":1574721168,"name":"潘教授和Fodil聊口语","tag":["准备取关"]},{"mid":432752294,"name":"晓晨聊大学","tag":["准备取关"]},{"mid":15247078,"name":"小飞蛾好可爱","tag":["准备取关"]},{"mid":499889496,"name":"是爱丽丝_","tag":["准备取关"]},{"mid":506174440,"name":"异星探索","tag":["准备取关"]},{"mid":1784235102,"name":"算法大师兄","tag":["准备取关"]},{"mid":3494376355400290,"name":"DayDay常识","tag":["准备取关"]},{"mid":320819729,"name":"Jonathan彭玉印","tag":["准备取关"]},{"mid":1795221360,"name":"心情瓶中信","tag":["准备取关"]},{"mid":4848323,"name":"数字游牧人","tag":["准备取关"]},{"mid":495224316,"name":"一只萧包子","tag":["准备取关"]},{"mid":397109346,"name":"思维社","tag":["准备取关"]},{"mid":3493258518858434,"name":"西安交通大学沈杨书社","tag":["准备取关"]},{"mid":379247856,"name":"好奇心会社","tag":["准备取关"]},{"mid":32360194,"name":"当下频道","tag":["准备取关"]},{"mid":381653678,"name":"老板懂设计","tag":["准备取关"]},{"mid":393119260,"name":"轻玩科技-老肖","tag":["准备取关"]},{"mid":274928598,"name":"幻想奇术师","tag":["准备取关"]},{"mid":475656605,"name":"超时空采访","tag":["准备取关"]},{"mid":365212208,"name":"Albert英语研习社","tag":["准备取关"]},{"mid":26653094,"name":"Marina0826","tag":["准备取关"]},{"mid":474881660,"name":"英语Snow老师","tag":["准备取关"]},{"mid":3546378525477862,"name":"Joseph的机器","tag":["准备取关"]},{"mid":14484744,"name":"科学小视","tag":["准备取关"]},{"mid":35339643,"name":"超极黑科技","tag":["准备取关"]},{"mid":1747335,"name":"老着急的小两居","tag":["准备取关"]},{"mid":1263990139,"name":"机智朱马马","tag":["准备取关"]},{"mid":3493263038220393,"name":"陆玖无敌","tag":["准备取关"]},{"mid":252075192,"name":"迪哥有点愁","tag":["准备取关"]},{"mid":251642119,"name":"简单柑桔Rw","tag":["准备取关"]},{"mid":387412319,"name":"布白PPT","tag":["准备取关"]},{"mid":508455218,"name":"放羊人_论文指导","tag":["准备取关"]},{"mid":672614938,"name":"英文老师Tanner","tag":["准备取关"]},{"mid":1212367465,"name":"水电知识分享","tag":["准备取关"]},{"mid":3494374235179579,"name":"Blender地势坤","tag":["准备取关"]},{"mid":589747109,"name":"后期老毛","tag":["准备取关"]},{"mid":1025542770,"name":"口语提升训练基地","tag":["准备取关"]},{"mid":23770618,"name":"蛇十六","tag":["准备取关"]},{"mid":3494350482836026,"name":"大道只源","tag":["准备取关"]},{"mid":54091976,"name":"拾镹i","tag":["准备取关"]},{"mid":252028114,"name":"戴博士实验室","tag":["准备取关"]},{"mid":599449178,"name":"槽逻辑","tag":["准备取关"]},{"mid":20826656,"name":"糖果果的未来要发光","tag":["准备取关"]},{"mid":384317271,"name":"易展翅-求职小表姐","tag":["准备取关"]},{"mid":1715594148,"name":"offer锦鲤魏校长","tag":["准备取关"]},{"mid":3493127266503448,"name":"安妮的职场与生活","tag":["准备取关"]},{"mid":1767282898,"name":"探长说电影","tag":["准备取关"]},{"mid":487505057,"name":"池早是我","tag":["准备取关"]},{"mid":630874464,"name":"冷科普","tag":["准备取关"]},{"mid":1264711195,"name":"爱读书的豆豆","tag":["准备取关"]},{"mid":3537118481615036,"name":"琅琊阁之信息差","tag":["准备取关"]},{"mid":319358609,"name":"民族自强不息者","tag":["准备取关"]},{"mid":518742534,"name":"那边那个g蛋","tag":["准备取关"]},{"mid":385172962,"name":"我是阿朱吖","tag":["准备取关"]},{"mid":1999199378,"name":"不略-","tag":[]},{"mid":4401694,"name":"林亦LYi","tag":[]},{"mid":518619340,"name":"想开面包店的Ricky","tag":[]},{"mid":419109033,"name":"科普创世纪","tag":["纪录片","科普","特别关注"]},{"mid":44980991,"name":"会放羊的教书匠","tag":[]},{"mid":474803476,"name":"泡厨房的顾小胖","tag":[]},{"mid":629408291,"name":"今日常识练习","tag":[]},{"mid":2052851329,"name":"律师老韩","tag":[]},{"mid":525382468,"name":"人间放映厅","tag":[]},{"mid":3546595513600180,"name":"松哥打虎","tag":[]},{"mid":1475748134,"name":"精分英教谢尔盖","tag":[]},{"mid":295993972,"name":"爱鼓捣的邢志磊","tag":[]},{"mid":287591832,"name":"丁老师现代英语","tag":[]},{"mid":38061207,"name":"Git源宝","tag":["科普","学习","科技","CODEK"]},{"mid":509905775,"name":"燎结构","tag":[]},{"mid":476819048,"name":"Adam陈老丝","tag":[]},{"mid":21435789,"name":"Kiefan琪凡速写","tag":[]},{"mid":49746395,"name":"GenJi是真想教会你","tag":["特别关注"]},{"mid":419052321,"name":"羊小驼叔叔","tag":[]},{"mid":488218866,"name":"EnglishVista2023","tag":[]},{"mid":1725223092,"name":"科学内幕","tag":[]},{"mid":1067722283,"name":"CG快报","tag":["新闻","ACG"]},{"mid":3494360540777110,"name":"老师好我叫白鼠同学","tag":[]},{"mid":2114928296,"name":"麦说","tag":["科普"]},{"mid":174471602,"name":"阿右科普","tag":[]},{"mid":43584648,"name":"工科男孙老师","tag":["科普"]},{"mid":3493281113573620,"name":"OK语文","tag":[]},{"mid":1480366563,"name":"静止想象研究所","tag":[]},{"mid":3546590293789198,"name":"机械视界J","tag":[]},{"mid":17095888,"name":"Crossin的编程教室","tag":[]},{"mid":391831595,"name":"Rudy英语","tag":[]},{"mid":15862638,"name":"哈密瓜微课","tag":[]},{"mid":295100453,"name":"叶梅梅过家家","tag":[]},{"mid":1305776725,"name":"虎哥教英语","tag":[]},{"mid":3493283187657030,"name":"青衫图解数学","tag":[]},{"mid":25694274,"name":"小五只会一点点","tag":["科普"]},{"mid":14797570,"name":"葆二爺的读心术","tag":["科普"]},{"mid":20998925,"name":"英语何太急","tag":[]},{"mid":166828,"name":"机智的商业生活","tag":[]},{"mid":3546575620016315,"name":"阿鹏哥哥探结构","tag":[]},{"mid":451196839,"name":"专心种花兔","tag":["科普","新闻"]},{"mid":485163549,"name":"大胡子老师-Jesse","tag":[]},{"mid":13260671,"name":"张烟囱","tag":[]},{"mid":385126080,"name":"圆中的猫头鹰","tag":[]},{"mid":3546610074126569,"name":"每天一个最强大脑","tag":[]},{"mid":523603911,"name":"七哥论国际战略-","tag":[]},{"mid":298332602,"name":"亦申凌泽","tag":[]},{"mid":3461582166166488,"name":"识万物_","tag":["科普"]},{"mid":3537120815745590,"name":"精英论坛","tag":["科普","特别关注"]},{"mid":208300745,"name":"小猴哥技术美术","tag":[]},{"mid":489302782,"name":"AI视次方","tag":[]},{"mid":430385404,"name":"设计生听超哥说AI","tag":[]},{"mid":73674032,"name":"小草律师呀","tag":[]},{"mid":1500074803,"name":"一朝春暖花满城","tag":[]},{"mid":488313112,"name":"DcMona迪迪西西","tag":[]},{"mid":68134500,"name":"张大碗子","tag":[]},{"mid":1047158092,"name":"奇妙的世界QAQ","tag":[]},{"mid":3546571071293861,"name":"没事我梨姐","tag":["科普"]},{"mid":1246792669,"name":"勃哥只有一辆车","tag":[]},{"mid":621235564,"name":"涤生大数据","tag":[]},{"mid":124806013,"name":"愚知乐","tag":[]},{"mid":26055664,"name":"张宝塔啊","tag":[]},{"mid":441631812,"name":"咕Job工作室","tag":[]},{"mid":243680430,"name":"金泽每日搞钱信息差","tag":["科普"]},{"mid":601300995,"name":"Mrs腊月小九","tag":[]},{"mid":108526737,"name":"法师马马","tag":[]},{"mid":2100151539,"name":"小义子小","tag":["科普"]},{"mid":3461566464789457,"name":"设计师一修","tag":[]},{"mid":3546603229023143,"name":"舒小车日常","tag":[]},{"mid":628054609,"name":"晶姐职说","tag":[]},{"mid":1749224369,"name":"老司机观察","tag":[]},{"mid":3493133887211865,"name":"环球-论坛记","tag":[]},{"mid":56300844,"name":"张小米粒的简单生活","tag":[]},{"mid":35639011,"name":"余扬捷老师","tag":["科普"]},{"mid":255139870,"name":"柴猫小巫师","tag":[]},{"mid":1029508158,"name":"单位晋升","tag":[]},{"mid":23244398,"name":"三口草莓","tag":[]},{"mid":18562567,"name":"mason英语","tag":[]},{"mid":3493291869866324,"name":"全球宏观FICC","tag":[]},{"mid":3494354444355822,"name":"顾老师商业定位","tag":[]},{"mid":594840903,"name":"带带政治理论","tag":[]},{"mid":3546593938639500,"name":"罗胖罗振宇","tag":[]},{"mid":1618054,"name":"商业启示","tag":[]},{"mid":1098004826,"name":"刘丫丫跳舞","tag":[]},{"mid":94577838,"name":"拾叁生意经","tag":[]},{"mid":21849780,"name":"每日搞钱信息差","tag":[]},{"mid":35105301,"name":"法号观芷","tag":[]},{"mid":423319981,"name":"刘沣学长","tag":[]},{"mid":413276548,"name":"城事堂","tag":[]},{"mid":693654968,"name":"罗罗说说Rossi","tag":[]},{"mid":3493111665789758,"name":"纪录频道Nature","tag":["纪录片"]},{"mid":15520342,"name":"创投学社","tag":[]},{"mid":535023713,"name":"是德科技","tag":["科普"]},{"mid":1321969690,"name":"五道口工匠","tag":[]},{"mid":11555160,"name":"空天同学","tag":[]},{"mid":224560702,"name":"鱼不溜秋","tag":[]},{"mid":17789957,"name":"Amethyst_Star","tag":[]},{"mid":2073606358,"name":"wuli_东哥物理","tag":[]},{"mid":531692757,"name":"初中学业业委会主任","tag":[]},{"mid":1823466601,"name":"English-Power","tag":[]},{"mid":524899324,"name":"小八的数分和高代","tag":[]},{"mid":3546637651675315,"name":"锁匠钥匙批发零售","tag":[]},{"mid":583967110,"name":"今日原理","tag":["科普"]},{"mid":3494361759221832,"name":"财富人生看个性签名拍","tag":[]},{"mid":1640934198,"name":"NewCH-娇哥","tag":[]},{"mid":383587023,"name":"复利的奇迹ETF基金理财","tag":[]},{"mid":1710911403,"name":"刘楠Talia","tag":[]},{"mid":14342271,"name":"遇真纪事","tag":[]},{"mid":2031277323,"name":"科普见闻录","tag":[]},{"mid":520814591,"name":"谈三圈","tag":["科普","科技"]},{"mid":603430640,"name":"涛哥讲期权","tag":["科普"]},{"mid":3546568640694467,"name":"还得是跳爷","tag":["科普"]},{"mid":3546571882892263,"name":"轻玩科技智造家","tag":["科普"]},{"mid":3493140684081255,"name":"新惕姆自动化","tag":["科普"]},{"mid":28535841,"name":"每天都在学东西","tag":["科普"]},{"mid":1741962246,"name":"IT界扛霸子","tag":["学习"]},{"mid":145611758,"name":"游点物理","tag":["科普"]},{"mid":26742637,"name":"方法自习室","tag":["特别关注","科普"]},{"mid":418201063,"name":"影子跟读","tag":["科普","学习"]},{"mid":673614860,"name":"卢麒元的视角","tag":["科普"]},{"mid":1304346514,"name":"张琦大大","tag":["科普"]},{"mid":283389925,"name":"每天一篇外刊精读","tag":["学习"]},{"mid":107861587,"name":"AI大模型全栈","tag":["学习"]},{"mid":1954415159,"name":"TED官方","tag":["科普","学习"]},{"mid":415500574,"name":"B站金融学院","tag":["新闻","科普"]},{"mid":3461575868418125,"name":"哔哩大学政治学院","tag":["科普","学习","新闻"]},{"mid":400258300,"name":"币圈五五开","tag":["科普","信息差"]},{"mid":3546655775263285,"name":"电商小菜鸡呀","tag":["科普","纪录片","信息差"]},{"mid":3546622413768823,"name":"懂一些人情世故","tag":["科普"]},{"mid":102617968,"name":"Amor东山再起","tag":["科普","学习"]},{"mid":217475729,"name":"CSDN","tag":["科普"]},{"mid":685526816,"name":"老魏机械百科","tag":["科普"]},{"mid":3494364269513335,"name":"重案纪实","tag":["学习"]},{"mid":185549749,"name":"bili_185549749","tag":["科普"]},{"mid":502539494,"name":"洞察人性缘","tag":["科普"]},{"mid":73528331,"name":"摩斯神探","tag":["科普"]},{"mid":14004258,"name":"奥德修斯的绳索","tag":["科普"]},{"mid":3546604311152974,"name":"销售学习知识库","tag":["科普"]},{"mid":510767506,"name":"单口喜剧侯智元","tag":["科普"]},{"mid":1169142430,"name":"传播学刘阳","tag":["科普"]},{"mid":1633547470,"name":"林少华林老师","tag":["科普"]},{"mid":1315696773,"name":"韩潇老师讲诗词","tag":["科普"]},{"mid":15741969,"name":"像素范","tag":["学习"]},{"mid":3461579156752681,"name":"常军谈心理","tag":["学习"]},{"mid":238171381,"name":"TED原声英语演讲","tag":["学习"]},{"mid":3546627212052911,"name":"天涯神贴YYDS","tag":["科普"]},{"mid":3546670222543152,"name":"富贵儿很正经","tag":["科普"]},{"mid":448165099,"name":"军情D7处","tag":["新闻"]},{"mid":2233213,"name":"星话大白","tag":["新闻"]},{"mid":1975692083,"name":"军情巴朗","tag":["新闻"]},{"mid":542824499,"name":"军情阿丁","tag":["新闻"]},{"mid":16243913,"name":"Solo审判日","tag":["新闻"]},{"mid":3494354016537425,"name":"A电子爱好者老牛","tag":["科普"]},{"mid":316627722,"name":"世界见闻录","tag":["新闻"]},{"mid":14520423,"name":"传说中的挖掘机","tag":["科普"]},{"mid":3546613639284889,"name":"五点半FiveThirty","tag":["科普"]},{"mid":1944667205,"name":"雷峰网","tag":["新闻"]},{"mid":1433031509,"name":"bili_1433031509","tag":["新闻"]},{"mid":3546662922357356,"name":"52赫兹实验室","tag":["科普","科技"]},{"mid":355155672,"name":"费洛凡","tag":["科普"]},{"mid":506786489,"name":"启眸运动","tag":["科普"]},{"mid":3546387566299549,"name":"达利奥利奥","tag":["科普"]},{"mid":496787581,"name":"SiliconPlanet","tag":["科普","新闻"]},{"mid":3546643550963789,"name":"尝试学习常识","tag":["科普"]},{"mid":515457626,"name":"原版外刊精读社","tag":["科普","学习"]},{"mid":510362725,"name":"赛雷话金","tag":["新闻","科普"]},{"mid":10698584,"name":"唠点历史","tag":["学习","科普","纪录片"]},{"mid":345339963,"name":"光城刺史","tag":["科普"]},{"mid":601612399,"name":"北京卫视档案","tag":["科普"]},{"mid":346563107,"name":"波士顿圆脸","tag":["新闻"]},{"mid":289189019,"name":"戏京同志","tag":["科普","新闻"]},{"mid":1593690059,"name":"李筠教授","tag":["科普"]},{"mid":382423121,"name":"白宫日记","tag":["科普"]},{"mid":600428973,"name":"周侃侃plus","tag":["学习"]},{"mid":430426421,"name":"燕三嘤嘤嘤","tag":["科普","乐子","新闻"]},{"mid":294262027,"name":"奔流映画","tag":["科普","科技"]},{"mid":923477,"name":"无骨者伊瓦尔","tag":["学习"]},{"mid":370982805,"name":"人与地球","tag":["科普"]},{"mid":408179496,"name":"环球地图","tag":["科普"]},{"mid":100785033,"name":"地球知识局","tag":["科普"]},{"mid":3493107370822154,"name":"穿透人性","tag":["科普","抽象派"]},{"mid":325848853,"name":"陇上姚明","tag":["科普","信息差"]},{"mid":22234926,"name":"认真的阿真","tag":["学习","科普"]},{"mid":735958,"name":"胖达粑粑","tag":["科普","学习"]},{"mid":442603088,"name":"三维地图看世界","tag":["科普","学习"]},{"mid":35162124,"name":"hum_hallelujah","tag":["科普","学习"]},{"mid":520819684,"name":"小Lin说","tag":["科普"]},{"mid":613408351,"name":"迷幻枸杞","tag":["科普","学习"]},{"mid":668794433,"name":"哈佛雪梨","tag":["科普"]},{"mid":3546390949005555,"name":"一大杯芋圆啵啵","tag":["学习"]},{"mid":276983285,"name":"你今天学地理了吗","tag":["科普","学习"]},{"mid":34107188,"name":"丘丘的数学之旅","tag":["学习"]},{"mid":385168742,"name":"春霖老师","tag":["学习"]},{"mid":413049762,"name":"高中数学蔡德锦","tag":["学习"]},{"mid":18509044,"name":"Mk数学杀手","tag":["学习"]},{"mid":22511468,"name":"小龙阿卡纳","tag":["学习"]},{"mid":673420980,"name":"韩秀云讲经济","tag":["科普"]},{"mid":478548163,"name":"睡前小声比比","tag":["科普"]},{"mid":563396855,"name":"爱喝碳水的瓦冰","tag":["科普"]},{"mid":357669580,"name":"萌萌战队","tag":["学习","科普"]},{"mid":319176130,"name":"圣诞节南瓜灯","tag":["科普","学习"]},{"mid":3546672034482563,"name":"TED官方科普","tag":["科普"]},{"mid":250584301,"name":"艾伦大大-","tag":["科普"]},{"mid":27022750,"name":"子疯实验室","tag":["纪录片","科普"]},{"mid":485234598,"name":"Emily每日英语听读","tag":["学习"]},{"mid":1555665460,"name":"YouTube政治学院","tag":["纪录片","科普","学习"]},{"mid":1408106571,"name":"柏年说","tag":["科普"]},{"mid":6776617,"name":"安东星老6","tag":["实力派","科普","科技","硬核整活"]},{"mid":30947486,"name":"小椰子专栏","tag":["乐子"]},{"mid":18024796,"name":"橙子登登-","tag":["科普"]},{"mid":2097311046,"name":"产经破壁机","tag":["科普"]},{"mid":296399504,"name":"虎嗅视频","tag":["科普"]},{"mid":3493262402783627,"name":"馋逗儿-","tag":["实力派","纪录片","科普","硬核整活"]},{"mid":487881722,"name":"村花熙熙","tag":["科普"]},{"mid":108709998,"name":"易本正经傅师兄","tag":["科普"]},{"mid":11146869,"name":"黑猫星球","tag":["科普","新闻"]},{"mid":37950062,"name":"硬核资本论","tag":["新闻"]},{"mid":481434238,"name":"Ele实验室","tag":["科普","学习"]},{"mid":437840703,"name":"荒野追剧探长","tag":["纪录片"]},{"mid":598464467,"name":"苏星河牛通","tag":["科普"]},{"mid":611584263,"name":"芯机叔Talk","tag":["科普"]},{"mid":1957113893,"name":"AI光影社","tag":["科普"]},{"mid":496261881,"name":"CNSA中国航天文化","tag":["科普","新闻"]},{"mid":1735615743,"name":"东部战区","tag":["新闻","菌嗜"]},{"mid":687410230,"name":"HexUp","tag":["科普","特别关注","学习"]},{"mid":46880349,"name":"啥都会一点的研究生","tag":["科普","学习"]},{"mid":245869,"name":"尚在天国EX","tag":["科普"]},{"mid":1094131374,"name":"哔哩哔哩超级科学晚","tag":["科普"]},{"mid":28378491,"name":"家有神兽","tag":["学习","菌嗜"]},{"mid":1875198641,"name":"SpaceLens","tag":["科普","学习","菌嗜"]},{"mid":248466804,"name":"百岁山不甜pro","tag":["科普","学习","菌嗜"]},{"mid":1915842925,"name":"一只野飞友","tag":["科普","菌嗜"]},{"mid":67079745,"name":"玄离199","tag":["学习","科普","科技","CODEK"]},{"mid":379889714,"name":"边亮_网络安全","tag":["学习","科普"]},{"mid":14583962,"name":"思维实验室","tag":["科普","学习"]},{"mid":412499953,"name":"Github开源软件-阿轩","tag":["科普","科技","学习"]},{"mid":395188578,"name":"爱上半导体","tag":["科普","科技","学习"]},{"mid":21612876,"name":"电力小子-gtetgeg","tag":["硬核整活"]},{"mid":3494363613104182,"name":"每日英语一点通","tag":["学习"]},{"mid":1980386544,"name":"1号档案馆","tag":["科普","学习"]},{"mid":661141753,"name":"框框老师课堂","tag":["学习","特别关注"]},{"mid":151155077,"name":"天才赵德柱","tag":["科普","科技"]},{"mid":679619486,"name":"国仁全球大学堂","tag":["科普","学习"]},{"mid":52699256,"name":"S亦和","tag":["科普"]},{"mid":67907025,"name":"猴博士爱讲课","tag":["学习"]},{"mid":72270557,"name":"芳斯塔芙","tag":["科普"]},{"mid":3546588897086207,"name":"轻玩科技社","tag":["实力派"]},{"mid":32229576,"name":"算法猪立业","tag":["科普","学习"]},{"mid":3493079826828072,"name":"豌克思","tag":["学习","科普","纪录片","硬核整活","实力派"]},{"mid":96639395,"name":"学院派Academia","tag":["科普"]},{"mid":1606682745,"name":"米哥专升本","tag":["学习"]},{"mid":1534642081,"name":"学习强国","tag":["纪录片","新闻","学习"]},{"mid":21778636,"name":"中国日报","tag":["科普","新闻","学习"]},{"mid":3546752795805831,"name":"国家应急广播","tag":["新闻"]},{"mid":703186600,"name":"麻薯波比呀","tag":["科普","新闻"]},{"mid":415200463,"name":"军迷天花板杰哥","tag":["科普","菌嗜"]},{"mid":33683045,"name":"张召忠","tag":["科普","菌嗜"]},{"mid":569956690,"name":"CGTN","tag":["科普","新闻"]},{"mid":407045223,"name":"二次元的中科院物理所","tag":["科普","新闻","学习"]},{"mid":20259914,"name":"稚晖君","tag":["实力派","科普","科技","硬核整活","学习"]},{"mid":942755,"name":"迷影至下Filmlast","tag":["科普"]},{"mid":205631797,"name":"果壳","tag":["科普"]},{"mid":11270116,"name":"酒痴东梦","tag":["科普","学习"]},{"mid":629101318,"name":"远方的青木","tag":["科普","学习"]},{"mid":321691718,"name":"中国日报网","tag":["科普","新闻"]},{"mid":520097839,"name":"发烧好了呢","tag":["科普","学习"]},{"mid":326427334,"name":"星球研究所","tag":["科普","学习"]},{"mid":452161580,"name":"战忽智库","tag":["学习"]},{"mid":508171633,"name":"思考的熊兄","tag":["学习","特别关注"]},{"mid":26108626,"name":"赛雷三分钟","tag":["科普"]},{"mid":3493089637305282,"name":"中国国家地理景观","tag":["科普"]},{"mid":364654971,"name":"中国国家地理频道","tag":["科普"]},{"mid":335850246,"name":"玉渊谭天","tag":["科普"]},{"mid":519872016,"name":"历史调研室","tag":["科普"]},{"mid":522262428,"name":"不严肃问题研究室","tag":["科普","新闻"]},{"mid":612194373,"name":"沙盘上的战争","tag":["科普","学习"]},{"mid":1839363891,"name":"图解价值","tag":["科普","学习"]},{"mid":743226,"name":"花岗岩工作室","tag":["科普"]},{"mid":374377163,"name":"全球档案馆","tag":["科普","学习"]},{"mid":213845897,"name":"天才简史","tag":["科普"]},{"mid":88461692,"name":"3Blue1Brown","tag":["科普"]},{"mid":94727573,"name":"科学认识论","tag":["科普"]},{"mid":693447092,"name":"超离谱科技","tag":["科普","学习"]},{"mid":65564239,"name":"IT咖啡馆","tag":["科普","科技","学习","CODEK"]},{"mid":323713206,"name":"螳螂捕财","tag":["科普","新闻"]},{"mid":1070859358,"name":"军事博物馆","tag":["科普","学习"]},{"mid":1705267972,"name":"百哥讲网络","tag":["科普","学习"]},{"mid":388576777,"name":"英语的平行世界","tag":["学习"]},{"mid":43219807,"name":"毒舌的南瓜","tag":["科普"]},{"mid":11021614,"name":"我是瑞斯拜","tag":["科普","学习"]},{"mid":70217434,"name":"妈妈不用担心我的英语","tag":["学习"]},{"mid":477671072,"name":"至书-山居五年","tag":["科普","学习"]},{"mid":3494374304385046,"name":"海林A读书","tag":["科普","学习"]},{"mid":390186534,"name":"蜀霞客","tag":["纪录片","科普"]},{"mid":272107494,"name":"7小时解锁新技能","tag":["学习"]},{"mid":514924891,"name":"王德峰","tag":["科普","学习"]},{"mid":435931665,"name":"军武志","tag":["科普","新闻"]},{"mid":1140672573,"name":"小王Albert","tag":["新闻"]},{"mid":14871346,"name":"硬件茶谈","tag":["科普"]},{"mid":3546730316433889,"name":"雷电欧姆","tag":[]},{"mid":622986240,"name":"阿吞啊","tag":["新闻"]},{"mid":69837092,"name":"战争研究所","tag":["科普","新闻"]},{"mid":664086886,"name":"鹏城杰森","tag":["科普","新闻","菌嗜"]},{"mid":439028291,"name":"WU_Eric","tag":["学习"]},{"mid":193147738,"name":"幻海航行","tag":["科普","纪录片"]},{"mid":1773278179,"name":"科幻小凌","tag":["科普"]},{"mid":26606146,"name":"底层原理","tag":["科普"]},{"mid":38598226,"name":"医学科普联盟","tag":["科普"]},{"mid":3546656899336980,"name":"冯无畏","tag":["科普"]},{"mid":430856432,"name":"囚水不盐","tag":["科普"]},{"mid":2039176794,"name":"奇异脑博士","tag":["科普"]},{"mid":485356818,"name":"医学边界","tag":["科普"]},{"mid":67141499,"name":"大漠叔叔","tag":[]},{"mid":1270632901,"name":"我是思屹","tag":["纪录片","科普"]},{"mid":103261012,"name":"歪设长","tag":[]},{"mid":353816116,"name":"大猫超人英语工作室","tag":[]},{"mid":457983079,"name":"math也是柠檬精","tag":["学习"]},{"mid":239688446,"name":"硬核的HeyMatt","tag":["特别关注"]},{"mid":3546821062298417,"name":"框框老师课堂_资料号","tag":["学习"]},{"mid":391930545,"name":"Maki的完美算术教室","tag":["科普","学习"]},{"mid":1632276842,"name":"Ayumu爱讲数学","tag":["科普","特别关注"]},{"mid":27415479,"name":"Victius","tag":["科普"]},{"mid":266765166,"name":"漫士沉思录","tag":["科普"]},{"mid":22072692,"name":"喜欢数学的ayumu","tag":["学习"]},{"mid":394252131,"name":"绩满满","tag":["学习"]},{"mid":320203065,"name":"深蓝学院","tag":[]},{"mid":11023521,"name":"letmedream","tag":["科普","创意","艺术"]},{"mid":446630510,"name":"道长的思维铺子","tag":[]},{"mid":318331,"name":"ForgotFun","tag":["科普","社会"]},{"mid":285027361,"name":"爱研究的小阿楠","tag":[]},{"mid":114366178,"name":"从0开始数","tag":[]},{"mid":1575688490,"name":"CLS同学","tag":[]},{"mid":108753930,"name":"降星驰","tag":["科普","零食关注"]},{"mid":95256449,"name":"遇见狂神说","tag":[]},{"mid":203983793,"name":"Linux中国","tag":[]},{"mid":3546647317448859,"name":"NotOnlySuccess","tag":[]},{"mid":39665558,"name":"偶尔有点小迷糊","tag":[]},{"mid":34786453,"name":"康文昌","tag":[]},{"mid":302417610,"name":"尚硅谷","tag":[]},{"mid":518514395,"name":"今天晚放学","tag":[]},{"mid":322683393,"name":"丘比特的帽子","tag":["学习"]},{"mid":519266610,"name":"会AI的哈利波特","tag":[]},{"mid":1271953419,"name":"大模型微调","tag":[]},{"mid":1283676771,"name":"不加醋的氨基酸","tag":["学习"]},{"mid":367678065,"name":"费曼学徒冬瓜","tag":["学习"]},{"mid":386643440,"name":"我是7788_","tag":["学习"]},{"mid":1965933018,"name":"Python大本营","tag":[]},{"mid":470624011,"name":"动物治愈馆","tag":[]},{"mid":3546583482239276,"name":"故史里","tag":[]},{"mid":3493281239402498,"name":"大发程序员","tag":["学习"]},{"mid":3546886008998093,"name":"雍俊海","tag":["学习"]},{"mid":1791942573,"name":"徐宿的经验书","tag":[]},{"mid":35868098,"name":"长河劫","tag":["科普"]},{"mid":2056649750,"name":"哔哩大学计算机学院","tag":[]},{"mid":30646569,"name":"华语辩坛老友赛","tag":[]},{"mid":157504840,"name":"郝英俊和易道云","tag":[]},{"mid":146668655,"name":"千锋教育","tag":[]},{"mid":1475977561,"name":"今天也要努力哦o","tag":[]},{"mid":2016676980,"name":"北京艾雷克斯企业管理","tag":[]},{"mid":12890453,"name":"程序员鱼皮","tag":[]},{"mid":1209319826,"name":"小锅聊攻防","tag":[]},{"mid":1577562848,"name":"Python万能胶","tag":[]},{"mid":1335124945,"name":"百万亚瑟王x","tag":[]},{"mid":37974444,"name":"黑马程序员","tag":[]},{"mid":416206486,"name":"千锋python","tag":[]},{"mid":3546768587360615,"name":"乌昂大叔","tag":[]},{"mid":129860965,"name":"记忆宫殿宁梓亦","tag":[]},{"mid":371846699,"name":"图灵的猫","tag":[]},{"mid":3493129770502861,"name":"社恐内向昭爷爷","tag":[]},{"mid":1780480185,"name":"飓多多StormCrew","tag":[]},{"mid":472747194,"name":"巫师财经","tag":["科普","社会"]},{"mid":18706318,"name":"龙女之声","tag":[]},{"mid":1809567655,"name":"何大爷课堂","tag":[]},{"mid":1253030023,"name":"一身剑气荡江","tag":["现实"]},{"mid":8157388,"name":"幼稚园大队长丨","tag":[]},{"mid":245645656,"name":"码农高天","tag":["科普"]},{"mid":1871365234,"name":"大问题Dialectic","tag":["科普","特别关注"]},{"mid":1937416537,"name":"陈一枝你坐下","tag":["特别关注"]},{"mid":593251783,"name":"本子在隔壁","tag":[]},{"mid":102584256,"name":"浪花姜","tag":[]},{"mid":1060544882,"name":"东洋雪莲","tag":[]},{"mid":1335713025,"name":"知了解压萌物","tag":[]},{"mid":3546617688886097,"name":"多奇探秘","tag":[]},{"mid":302188068,"name":"小白debug","tag":[]},{"mid":16433002,"name":"隔壁的程序员老王","tag":["学习"]},{"mid":3546752326044595,"name":"啊光小哥哥","tag":[]},{"mid":3546613148551357,"name":"Josh老师和菜鸟小编","tag":[]},{"mid":570064,"name":"章北海official","tag":[]},{"mid":652060948,"name":"童晶老师","tag":[]},{"mid":2116071253,"name":"高考蓝哥","tag":[]},{"mid":97407861,"name":"狼肉好吃","tag":[]},{"mid":3546908731639909,"name":"第三眼日记","tag":[]},{"mid":673835935,"name":"码农的荒岛求生","tag":[]},{"mid":3546693165386233,"name":"挽风的技术教程","tag":[]},{"mid":102438649,"name":"GeekHour","tag":[]},{"mid":325864133,"name":"飞天闪客","tag":["CODEK"]},{"mid":278761367,"name":"唯一讲述者","tag":[]},{"mid":130763764,"name":"三太子敖丙","tag":[]},{"mid":162183,"name":"原子能","tag":[]},{"mid":544451485,"name":"吾爱破解论坛","tag":[]},{"mid":323588182,"name":"毒舌电影编辑部","tag":[]},{"mid":281120100,"name":"我是阿众","tag":["程序员","科普","技术"]},{"mid":668097429,"name":"轩辕的编程宇宙","tag":[]},{"mid":486989780,"name":"老麦的工具库","tag":[]},{"mid":316183842,"name":"技术爬爬虾","tag":["学习","科普","技术"]},{"mid":412704776,"name":"不高兴就喝水","tag":[]},{"mid":3494353494345852,"name":"南哥教恋爱","tag":[]},{"mid":298711658,"name":"路克纪录","tag":[]},{"mid":327247876,"name":"技术蛋老师","tag":[]},{"mid":96609715,"name":"小黑屋的貘_mo","tag":[]},{"mid":623448014,"name":"TIANYU2FM","tag":[]},{"mid":264869770,"name":"丰言疯话","tag":["学习"]},{"mid":3493075691243699,"name":"老戴Donald","tag":["学习"]},{"mid":478849208,"name":"樊登读书上海运营中心","tag":[]},{"mid":3546945542948869,"name":"_美梦守护者_","tag":["现实"]},{"mid":1464874349,"name":"打工人代表巍哥","tag":["科普","信息差"]},{"mid":1679822121,"name":"大唐怪奇笔记","tag":[]},{"mid":19414347,"name":"卡皮巴拉大王拼豆版","tag":[]},{"mid":3493127314737312,"name":"鲶鱼夜话","tag":[]},{"mid":702915816,"name":"云顶数模","tag":[]},{"mid":3546638236781247,"name":"小Lin竖着说","tag":["科普"]},{"mid":15397613,"name":"张云翼_like","tag":["学习"]},{"mid":372313671,"name":"Ross-Ning","tag":[]},{"mid":482867012,"name":"吴悠讲编程","tag":[]},{"mid":3546969421122388,"name":"梦见过彩虹","tag":[]},{"mid":522976477,"name":"Eden说产品","tag":[]},{"mid":1669112799,"name":"产品老兵杰哥","tag":[]},{"mid":3546590214097572,"name":"秀明说","tag":[]},{"mid":3546937947064751,"name":"清华豆师","tag":[]},{"mid":489640651,"name":"新石器公园","tag":["科普"]},{"mid":2100388025,"name":"宇宙世界0","tag":[]},{"mid":254463269,"name":"毕导","tag":[]},{"mid":673779175,"name":"量子位","tag":[]},{"mid":491691175,"name":"C哥聊科技","tag":[]},{"mid":1049078946,"name":"Chris老师即食英语","tag":[]},{"mid":501642082,"name":"萧一白呀","tag":[]},{"mid":3690987316578579,"name":"计算机大白呀","tag":[]},{"mid":458165375,"name":"哔哩哔哩课堂","tag":[]},{"mid":3546662484052067,"name":"娃娃卡哇伊捏","tag":[]},{"mid":481153145,"name":"进击的铁木君","tag":[]},{"mid":1159873315,"name":"大豪夫妇","tag":[]},{"mid":258944527,"name":"陶渊xiao明","tag":[]},{"mid":1037607360,"name":"YOMeeDoll小企鹅窝窝","tag":[]},{"mid":3546857594685834,"name":"陈木白啊","tag":[]},{"mid":1508100119,"name":"零7大王","tag":[]},{"mid":37858284,"name":"网络小白_Uncle城","tag":["技术","科技"]},{"mid":301388587,"name":"Shiki实验室","tag":["学习"]},{"mid":504164656,"name":"科学辟谣","tag":["科普"]},{"mid":111900,"name":"Toka-MK","tag":["零食关注"]},{"mid":1112568165,"name":"汤山老王","tag":[]},{"mid":3690978099595618,"name":"小老板营业中","tag":[]},{"mid":572139281,"name":"鲁本芭娜娜banana","tag":["学习"]},{"mid":3546830396721763,"name":"第四种黑猩猩CHIMP","tag":[]},{"mid":1815948385,"name":"马克的技术工作坊","tag":["学习"]},{"mid":495257108,"name":"小林爱研究","tag":["学习"]},{"mid":385047828,"name":"认知便利店M","tag":["学习"]},{"mid":319526152,"name":"超级TANG-","tag":["科普"]},{"mid":1732848825,"name":"耿同学讲故事","tag":[]},{"mid":276483261,"name":"DeeparchWorks","tag":["程序员","科普","技术"]},{"mid":503577829,"name":"海盗CG","tag":[]},{"mid":3546606469123022,"name":"一觉醒来发生啥","tag":["信息差"]},{"mid":491155397,"name":"信息差猎手","tag":["信息差"]},{"mid":1297136809,"name":"宝藏女嗨沈幼楚","tag":[]},{"mid":270471501,"name":"文文黎","tag":[]},{"mid":106685726,"name":"二二酸酸","tag":["科普"]},{"mid":31341757,"name":"捭阖哗","tag":["特别关注","科普"]},{"mid":490494088,"name":"动动枪DongDongGun","tag":[]},{"mid":1511660367,"name":"西一昂叨叨版","tag":[]}] \ No newline at end of file diff --git a/source/resources/export_uids.txt b/source/resources/export_uids.txt deleted file mode 100644 index 1251370..0000000 --- a/source/resources/export_uids.txt +++ /dev/null @@ -1 +0,0 @@ -1357612844,321583894,439478093,1044673687,62224043,1031543543,1481344732,475443398,2026173074,1858861103,444728505,23947287,35807625,23791195,111714204,1937308559,1587138171,440798355,33291981,648113003,241241407,2099983410,11914415,436700803,3493282273299102,612593877,2125857107,40433405,2000819931,2053592854,546189,507448807,607281655,505935166,14524124,385200931,25876945,669397302,1769820463,1562896062,3493285194632125,3493264275540254,479424216,604710494,1016523517,409109266,1428318343,700817047,1634586116,543931674,1590538073,1574721168,432752294,15247078,499889496,506174440,1784235102,3494376355400290,320819729,1795221360,4848323,495224316,397109346,3493258518858434,379247856,32360194,381653678,393119260,274928598,475656605,365212208,26653094,474881660,3546378525477862,14484744,35339643,1747335,1263990139,3493263038220393,252075192,251642119,387412319,508455218,672614938,1212367465,3494374235179579,589747109,1025542770,23770618,3494350482836026,54091976,252028114,599449178,20826656,384317271,1715594148,3493127266503448,1767282898,487505057,630874464,1264711195,3537118481615036,319358609,518742534,385172962,1999199378,4401694,518619340,419109033,44980991,474803476,629408291,2052851329,525382468,3546595513600180,1475748134,295993972,287591832,38061207,509905775,476819048,21435789,49746395,419052321,488218866,1725223092,1067722283,3494360540777110,2114928296,174471602,43584648,3493281113573620,1480366563,3546590293789198,17095888,391831595,15862638,295100453,1305776725,3493283187657030,25694274,14797570,20998925,166828,3546575620016315,451196839,485163549,13260671,385126080,3546610074126569,523603911,298332602,3461582166166488,3537120815745590,208300745,489302782,430385404,73674032,1500074803,488313112,68134500,1047158092,3546571071293861,1246792669,621235564,124806013,26055664,441631812,243680430,601300995,108526737,2100151539,3461566464789457,3546603229023143,628054609,1749224369,3493133887211865,56300844,35639011,255139870,1029508158,23244398,18562567,3493291869866324,3494354444355822,594840903,3546593938639500,1618054,1098004826,94577838,21849780,35105301,423319981,413276548,693654968,3493111665789758,15520342,535023713,1321969690,11555160,224560702,17789957,2073606358,531692757,1823466601,524899324,3546637651675315,583967110,3494361759221832,1640934198,383587023,1710911403,14342271,2031277323,520814591,603430640,3546568640694467,3546571882892263,3493140684081255,28535841,1741962246,145611758,26742637,418201063,673614860,1304346514,283389925,107861587,1954415159,415500574,3461575868418125,400258300,3546655775263285,3546622413768823,102617968,217475729,685526816,3494364269513335,185549749,502539494,73528331,14004258,3546604311152974,510767506,1169142430,1633547470,1315696773,15741969,3461579156752681,238171381,3546627212052911,3546670222543152,448165099,2233213,1975692083,542824499,16243913,3494354016537425,316627722,14520423,3546613639284889,1944667205,1433031509,3546662922357356,355155672,506786489,3546387566299549,496787581,3546643550963789,515457626,510362725,10698584,345339963,601612399,346563107,289189019,1593690059,382423121,600428973,430426421,294262027,923477,370982805,408179496,100785033,3493107370822154,325848853,22234926,735958,442603088,35162124,520819684,613408351,668794433,3546390949005555,276983285,34107188,385168742,413049762,18509044,22511468,673420980,478548163,563396855,357669580,319176130,3546672034482563,250584301,27022750,485234598,1555665460,1408106571,6776617,30947486,18024796,2097311046,296399504,3493262402783627,487881722,108709998,11146869,37950062,481434238,437840703,598464467,611584263,1957113893,496261881,1735615743,687410230,46880349,245869,1094131374,28378491,1875198641,248466804,1915842925,67079745,379889714,14583962,412499953,395188578,21612876,3494363613104182,1980386544,661141753,151155077,679619486,52699256,67907025,72270557,3546588897086207,32229576,3493079826828072,96639395,1606682745,1534642081,21778636,3546752795805831,703186600,415200463,33683045,569956690,407045223,20259914,942755,205631797,11270116,629101318,321691718,520097839,326427334,452161580,508171633,26108626,3493089637305282,364654971,335850246,519872016,522262428,612194373,1839363891,743226,374377163,213845897,88461692,94727573,693447092,65564239,323713206,1070859358,1705267972,388576777,43219807,11021614,70217434,477671072,3494374304385046,390186534,272107494,514924891,435931665,1140672573,14871346,3546730316433889,622986240,69837092,664086886,439028291,193147738,1773278179,26606146,38598226,3546656899336980,430856432,2039176794,485356818,67141499,1270632901,103261012,353816116,457983079,239688446,3546821062298417,391930545,1632276842,27415479,266765166,22072692,394252131,320203065,11023521,446630510,318331,285027361,114366178,1575688490,108753930,95256449,203983793,3546647317448859,39665558,34786453,302417610,518514395,322683393,519266610,1271953419,1283676771,367678065,386643440,1965933018,470624011,3546583482239276,3493281239402498,3546886008998093,1791942573,35868098,2056649750,30646569,157504840,146668655,1475977561,2016676980,12890453,1209319826,1577562848,1335124945,37974444,416206486,3546768587360615,129860965,371846699,3493129770502861,1780480185,472747194,18706318,1809567655,1253030023,8157388,245645656,1871365234,1937416537,593251783,102584256,1060544882,1335713025,3546617688886097,302188068,16433002,3546752326044595,3546613148551357,570064,652060948,2116071253,97407861,3546908731639909,673835935,3546693165386233,102438649,325864133,278761367,130763764,162183,544451485,323588182,281120100,668097429,486989780,316183842,412704776,3494353494345852,298711658,327247876,96609715,623448014,264869770,3493075691243699,478849208,3546945542948869,1464874349,1679822121,19414347,3493127314737312,702915816,3546638236781247,15397613,372313671,482867012,3546969421122388,522976477,1669112799,3546590214097572,3546937947064751,489640651,2100388025,254463269,673779175,491691175,1049078946,501642082,3690987316578579,458165375,3546662484052067,481153145,1159873315,258944527,1037607360,3546857594685834,1508100119,37858284,301388587,504164656,111900,1112568165,3690978099595618,572139281,3546830396721763,1815948385,495257108,385047828,319526152,1732848825,276483261,503577829,3546606469123022,491155397,1297136809,270471501,106685726,31341757,490494088,1511660367 \ No newline at end of file diff --git a/source/resources/export_uids_test5.json b/source/resources/export_uids_test5.json deleted file mode 100644 index 5fc2001..0000000 --- a/source/resources/export_uids_test5.json +++ /dev/null @@ -1 +0,0 @@ -[{"mid":1357612844,"name":"考研英语马天艺老师","tag":[]},{"mid":321583894,"name":"我是蓝同学啊","tag":["实力派"]},{"mid":439478093,"name":"中国食品报融媒体","tag":["纪录片","新闻"]},{"mid":1044673687,"name":"心理述","tag":[]},{"mid":62224043,"name":"栗之from一直夫妇","tag":[]},{"mid":1031543543,"name":"Java面试突击-Mic","tag":[]},{"mid":1481344732,"name":"我们都是社畜","tag":["准备取关"]},{"mid":475443398,"name":"黑毛羊驼","tag":["准备取关"]}] diff --git a/source/resources/export_uids_test5.txt b/source/resources/export_uids_test5.txt deleted file mode 100644 index 5f948bd..0000000 --- a/source/resources/export_uids_test5.txt +++ /dev/null @@ -1 +0,0 @@ -1357612844,321583894,439478093,1044673687,62224043 \ No newline at end of file diff --git a/source/scripts/analyze_up_content.py b/source/scripts/analyze_up_content.py deleted file mode 100644 index fb7c973..0000000 --- a/source/scripts/analyze_up_content.py +++ /dev/null @@ -1,690 +0,0 @@ -#!/usr/bin/env python3 -"""Fetch recent Bilibili video titles for UIDs and analyze with Volcengine API. - -Input JSON format (list of objects): -[ - {"mid": 12345, "name": "UP Name", "tag": ["准备取关"]} -] -""" - -from __future__ import annotations - -import argparse -import hashlib -import html -import json -import random -import re -import sys -import time -from dataclasses import dataclass -from pathlib import Path -from typing import Any -from urllib import error, parse, request - - -BILIBILI_API = "https://api.bilibili.com/x/space/arc/search" -BILIBILI_WBI_API = "https://api.bilibili.com/x/space/wbi/arc/search" -BILIBILI_NAV_API = "https://api.bilibili.com/x/web-interface/nav" -# 可选:如果仍频繁触发412,可填浏览器里复制的Cookie字符串。 -BILIBILI_COOKIE = "buvid3=5D02D792-070F-79D0-4243-4F75C6277EC022345infoc; b_nut=1765807422; _uuid=1796ECEE-451E-E1B7-1D9A-5D7F5CCCDA5822634infoc; buvid_fp=993faeece85f3e3119d8331a4e5bf683; buvid4=785EC013-0E2C-BC9F-5CBD-B8B00C76D13024715-025121522-ba1d0oh5R0Q47E2dVDisZg%3D%3D; SESSDATA=875331b4%2C1781359476%2C70459%2Ac1CjAXAQicR89csAHVVl-X8yAIy0-eko5ey69tJAyAXIbHhSU5HaUgth-E2fW1e9ij0MESVll2anVrYXVOYkc3VzZ2RmtFQlZzUnNoR0JOdUNZYldWSXh4Y3NZVlVWc1lOaC04M2JRQ3VKZ0x5b2RMbXl1MWpCSE1XMjd2UjVDTUJoUko1bU96aE9BIIEC; bili_jct=2e6b55fe6837ee753c69cd477c1b1ac6; DedeUserID=440102691; DedeUserID__ckMd5=42ab71f1395d8071; theme-tip-show=SHOWED; rpdid=|(u~RklkYm)u0J'u~Yl)|~YuR; hit-dyn-v2=1; theme-avatar-tip-show=SHOWED; LIVE_BUVID=AUTO5117758855687732; PVID=3; CURRENT_QUALITY=64; theme-switch-show=SHOWED; home_feed_column=4; browser_resolution=1359-871; bili_ticket=eyJhbGciOiJIUzI1NiIsImtpZCI6InMwMyIsInR5cCI6IkpXVCJ9.eyJleHAiOjE3NzcyODE5NjAsImlhdCI6MTc3NzAyMjcwMCwicGx0IjotMX0.euCIXefcvPlg1SwKKQh2HLfYStrTdG8dN-qnKCeUBFU; bili_ticket_expires=1777281900; sid=7beimq93; CURRENT_FNVAL=2000; bp_t_offset_440102691=1195139899255160832; b_lsid=52AAA640_19DC3A11696" -RUNTIME_BILIBILI_COOKIE = "" -DEFAULT_USER_AGENT = ( - "Mozilla/5.0 (Windows NT 10.0; Win64; x64) " - "AppleWebKit/537.36 (KHTML, like Gecko) " - "Chrome/124.0.0.0 Safari/537.36" -) -MIXIN_KEY_ENC_TAB = [ - 46, 47, 18, 2, 53, 8, 23, 32, 15, 50, 10, 31, 58, 3, 45, 35, - 27, 43, 5, 49, 33, 9, 42, 19, 29, 28, 14, 39, 12, 38, 41, 13, - 37, 48, 7, 16, 24, 55, 40, 61, 26, 17, 0, 1, 60, 51, 30, 4, - 22, 25, 54, 21, 56, 59, 6, 63, 57, 62, 11, 36, 20, 34, 44, 52, -] - -# 在这里直接填写火山引擎配置。 -VOLCENGINE_API_KEY = "586d443c-5034-4810-9760-50ce77394e8a" -VOLCENGINE_MODEL = "deepseek-v3-1-terminus" -VOLCENGINE_BASE_URL = "https://ark.cn-beijing.volces.com/api/v3" - - -@dataclass -class UpItem: - mid: int - name: str - tag: list[str] - - -def parse_args() -> argparse.Namespace: - parser = argparse.ArgumentParser( - description="抓取 UP 前10个视频标题,并调用火山引擎 API 生成分析报告" - ) - parser.add_argument( - "--input", - default="./source/resources/export_uids.json", - help="输入 JSON 文件路径,默认: ./source/resources/export_uids.json", - ) - parser.add_argument( - "--output", - default="./source/output/reports/up_titles_report.md", - help="输出 Markdown 报告路径,默认: ./source/output/reports/up_titles_report.md", - ) - parser.add_argument( - "--titles-per-up", - type=int, - default=10, - help="每个 UP 抓取的视频标题数量,默认: 10", - ) - parser.add_argument( - "--max-ups", - type=int, - default=0, - help="最多处理多少个 UP,0 表示全部", - ) - parser.add_argument( - "--only-tag", - default="", - help="只处理包含该标签的 UP,例如: 准备取关;留空表示不过滤", - ) - parser.add_argument( - "--sleep-seconds", - type=float, - default=0.8, - help="每个 UP 抓取后的等待秒数,默认: 0.8", - ) - parser.add_argument( - "--retry-times", - type=int, - default=3, - help="抓取重试次数(遇到412/-799时),默认: 3", - ) - parser.add_argument( - "--test-mid", - type=int, - default=0, - help="测试模式:只抓取这个mid,不读取输入文件", - ) - parser.add_argument( - "--test-name", - default="TEST_UP", - help="测试模式下显示名称,默认: TEST_UP", - ) - parser.add_argument( - "--skip-ai", - action="store_true", - help="只测试抓取,不调用AI分析", - ) - parser.add_argument( - "--debug", - action="store_true", - help="输出抓取调试信息", - ) - parser.add_argument( - "--bili-cookie", - default="", - help="可选:运行时传入B站Cookie,优先级高于脚本内BILIBILI_COOKIE", - ) - parser.add_argument( - "--fetch-mode", - choices=["auto", "api", "html"], - default="auto", - help="抓取模式: auto(先API后HTML)/api/html,默认: auto", - ) - parser.add_argument( - "--analyze-from-report", - default="", - help="从已有报告读取标题并仅执行AI分析,例如: source/up_analysis_report.md", - ) - parser.add_argument( - "--batch-size", - type=int, - default=30, - help="分批分析时每批数量,默认: 30", - ) - parser.add_argument( - "--batch-index", - type=int, - default=1, - help="分批分析批次序号(从1开始),默认: 1", - ) - return parser.parse_args() - - -def parse_report_items(report_path: Path) -> list[dict[str, Any]]: - lines = report_path.read_text(encoding="utf-8").splitlines() - items: list[dict[str, Any]] = [] - current: dict[str, Any] | None = None - section = "" - - for line in lines: - m = re.match(r"^##\s+\d+\.\s+(.*?)\s+\(mid:\s*(\d+)\)", line) - if m: - if current is not None: - items.append(current) - current = { - "mid": int(m.group(2)), - "name": m.group(1).strip(), - "tag": [], - "url": f"https://space.bilibili.com/{int(m.group(2))}/video", - "titles": [], - "analysis": "", - "error": "", - } - section = "" - continue - - if current is None: - continue - - if line.startswith("- 主页: "): - current["url"] = line.replace("- 主页: ", "", 1).strip() - continue - if line.startswith("- 标签: "): - raw_tag = line.replace("- 标签: ", "", 1).strip() - current["tag"] = [] if raw_tag in ("", "无") else [x.strip() for x in raw_tag.split(",") if x.strip()] - continue - if line == "### 最近10条标题": - section = "titles" - continue - if line == "### AI分析": - section = "analysis" - continue - if line == "### 异常": - section = "error" - continue - if line.startswith("### "): - section = "" - continue - - if section == "titles" and line.startswith("- "): - t = line[2:].strip() - if t and t != "(未抓取到标题)": - current["titles"].append(t) - elif section == "analysis": - if line.strip(): - if current["analysis"]: - current["analysis"] += "\n" + line.strip() - else: - current["analysis"] = line.strip() - elif section == "error" and line.startswith("- "): - current["error"] = line[2:].strip() - - if current is not None: - items.append(current) - return items - - -def run_batch_analysis_from_report(args: argparse.Namespace, output_path: Path) -> int: - report_path = Path(args.analyze_from_report) - if not report_path.exists(): - print(f"报告文件不存在: {report_path}", file=sys.stderr) - return 1 - - items = parse_report_items(report_path) - if not items: - print("报告中未解析到可分析条目", file=sys.stderr) - return 1 - - pending = [ - it for it in items - if it.get("titles") and (not it.get("analysis") or it.get("analysis") == "测试模式已跳过AI分析") - ] - if not pending: - print("报告中没有待分析条目(可能已全部分析完成)") - output_path.write_text(build_report(items), encoding="utf-8") - return 0 - - batch_size = max(args.batch_size, 1) - batch_index = max(args.batch_index, 1) - start = (batch_index - 1) * batch_size - end = start + batch_size - batch = pending[start:end] - if not batch: - print(f"批次为空: batch-index={batch_index}, batch-size={batch_size}, 待分析总数={len(pending)}") - output_path.write_text(build_report(items), encoding="utf-8") - return 0 - - print( - f"开始分批分析: 第{batch_index}批, 每批{batch_size}条, " - f"本批{len(batch)}条, 待分析总数{len(pending)}" - ) - - key_to_index = {f"{it['mid']}::{it['name']}": idx for idx, it in enumerate(items)} - for idx, it in enumerate(batch, start=1): - print(f"[batch {idx}/{len(batch)}] AI分析: {it['name']} ({it['mid']})") - try: - analysis = analyze_titles(it["name"], it["url"], it["titles"]) - origin_idx = key_to_index.get(f"{it['mid']}::{it['name']}") - if origin_idx is not None: - items[origin_idx]["analysis"] = analysis - items[origin_idx]["error"] = "" - except Exception as exc: # noqa: BLE001 - origin_idx = key_to_index.get(f"{it['mid']}::{it['name']}") - if origin_idx is not None: - items[origin_idx]["error"] = str(exc) - time.sleep(max(args.sleep_seconds, 0.0)) - - output_path.parent.mkdir(parents=True, exist_ok=True) - output_path.write_text(build_report(items), encoding="utf-8") - print(f"分批分析报告已生成: {output_path}") - return 0 - - -def load_up_items(input_path: Path) -> list[UpItem]: - raw = json.loads(input_path.read_text(encoding="utf-8")) - if not isinstance(raw, list): - raise ValueError("输入 JSON 必须是数组") - - items: list[UpItem] = [] - for idx, obj in enumerate(raw): - if not isinstance(obj, dict): - raise ValueError(f"第 {idx + 1} 项不是对象") - mid = obj.get("mid") - name = obj.get("name", "") - tags = obj.get("tag", []) - if mid is None: - continue - try: - mid_int = int(mid) - except (TypeError, ValueError): - continue - if not isinstance(name, str): - name = str(name) - if not isinstance(tags, list): - tags = [] - tags = [str(t) for t in tags] - items.append(UpItem(mid=mid_int, name=name.strip(), tag=tags)) - return items - - -def http_get_json( - url: str, - timeout: float = 20.0, - referer: str = "https://space.bilibili.com/", -) -> dict[str, Any]: - headers = { - "User-Agent": DEFAULT_USER_AGENT, - "Referer": referer, - "Origin": "https://www.bilibili.com", - "Accept": "application/json, text/plain, */*", - "Accept-Language": "zh-CN,zh;q=0.9,en;q=0.8", - } - cookie = RUNTIME_BILIBILI_COOKIE.strip() or BILIBILI_COOKIE.strip() - if cookie: - headers["Cookie"] = cookie - req = request.Request(url, headers=headers, method="GET") - with request.urlopen(req, timeout=timeout) as resp: - body = resp.read().decode("utf-8", errors="replace") - return json.loads(body) - - -def http_get_text( - url: str, - timeout: float = 20.0, - referer: str = "https://space.bilibili.com/", -) -> str: - headers = { - "User-Agent": DEFAULT_USER_AGENT, - "Referer": referer, - "Origin": "https://www.bilibili.com", - "Accept": "text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8", - "Accept-Language": "zh-CN,zh;q=0.9,en;q=0.8", - } - cookie = RUNTIME_BILIBILI_COOKIE.strip() or BILIBILI_COOKIE.strip() - if cookie: - headers["Cookie"] = cookie - req = request.Request(url, headers=headers, method="GET") - with request.urlopen(req, timeout=timeout) as resp: - return resp.read().decode("utf-8", errors="replace") - - -def get_mixin_key(img_key: str, sub_key: str) -> str: - origin = img_key + sub_key - mixed = "".join(origin[i] for i in MIXIN_KEY_ENC_TAB) - return mixed[:32] - - -def build_wbi_params(base_params: dict[str, Any], mixin_key: str) -> dict[str, Any]: - params = {k: str(v) for k, v in base_params.items()} - params["wts"] = str(int(time.time())) - params = dict(sorted(params.items())) - filtered = { - k: re.sub(r"[!'()*]", "", v) - for k, v in params.items() - } - query = parse.urlencode(filtered) - w_rid = hashlib.md5((query + mixin_key).encode("utf-8")).hexdigest() - filtered["w_rid"] = w_rid - return filtered - - -def get_wbi_mixin_key() -> str: - data = http_get_json(BILIBILI_NAV_API, referer="https://www.bilibili.com/") - if data.get("code") != 0: - raise RuntimeError( - f"获取wbi密钥失败 code={data.get('code')}, message={data.get('message')}" - ) - wbi_img = data.get("data", {}).get("wbi_img", {}) - img_url = wbi_img.get("img_url", "") - sub_url = wbi_img.get("sub_url", "") - if not img_url or not sub_url: - raise RuntimeError("获取wbi密钥失败: nav接口缺少img_url/sub_url") - img_key = img_url.rsplit("/", 1)[-1].split(".")[0] - sub_key = sub_url.rsplit("/", 1)[-1].split(".")[0] - return get_mixin_key(img_key, sub_key) - - -def parse_titles_from_data(data: dict[str, Any]) -> list[str]: - vlist = data.get("data", {}).get("list", {}).get("vlist", []) - if not isinstance(vlist, list): - return [] - titles: list[str] = [] - for item in vlist: - if not isinstance(item, dict): - continue - title = item.get("title", "") - if isinstance(title, str) and title.strip(): - titles.append(clean_html(title.strip())) - return titles - - -def fetch_titles_from_space_html(mid: int, titles_per_up: int, debug: bool = False) -> list[str]: - url = f"https://space.bilibili.com/{mid}/video" - html_text = http_get_text(url, referer="https://www.bilibili.com/") - - # 页面中视频封面常携带标题到alt字段,优先从这里提取。 - alt_candidates = re.findall( - r']*class="[^"]*b-img__inner[^"]*"[^>]*alt="([^"]+)"', - html_text, - flags=re.IGNORECASE, - ) - - titles: list[str] = [] - seen: set[str] = set() - for raw in alt_candidates: - t = clean_html(html.unescape(raw)).strip() - if not t or t in seen: - continue - seen.add(t) - titles.append(t) - if len(titles) >= titles_per_up: - break - - if debug: - print(f"[debug] HTML模式提取到 {len(titles)} 条标题") - return titles - - -def fetch_titles( - mid: int, - titles_per_up: int, - retry_times: int = 3, - debug: bool = False, - fetch_mode: str = "auto", -) -> list[str]: - base_params = { - "mid": str(mid), - "pn": "1", - "ps": str(titles_per_up), - "order": "pubdate", - "index": "1", - "jsonp": "json", - } - - errors: list[str] = [] - if fetch_mode in ("auto", "api"): - # 优先使用wbi接口,稳定性通常更好。 - mixin_key = "" - try: - mixin_key = get_wbi_mixin_key() - except Exception as exc: # noqa: BLE001 - if debug: - print(f"[debug] 获取wbi密钥失败: {exc}") - - for attempt in range(1, max(retry_times, 1) + 1): - try: - if mixin_key: - signed = build_wbi_params(base_params, mixin_key) - url = f"{BILIBILI_WBI_API}?{parse.urlencode(signed)}" - else: - url = f"{BILIBILI_API}?{parse.urlencode(base_params)}" - data = http_get_json(url, referer=f"https://space.bilibili.com/{mid}/video") - code = data.get("code", -1) - if code == 0: - titles = parse_titles_from_data(data) - if titles: - return titles - errors.append("接口返回成功但标题为空") - else: - errors.append(f"code={code}, message={data.get('message', 'unknown')} ") - except error.HTTPError as exc: - errors.append(f"HTTP {exc.code} {exc.reason}") - except Exception as exc: # noqa: BLE001 - errors.append(str(exc)) - - sleep_for = min(12.0, (1.8 ** attempt) + random.uniform(0.2, 1.0)) - if debug: - print(f"[debug] mid={mid} API第{attempt}次失败: {errors[-1]},{sleep_for:.1f}s后重试") - time.sleep(sleep_for) - - if fetch_mode in ("auto", "html"): - try: - html_titles = fetch_titles_from_space_html(mid, titles_per_up, debug=debug) - if html_titles: - return html_titles - errors.append("HTML模式未提取到标题") - except Exception as exc: # noqa: BLE001 - errors.append(f"HTML模式失败: {exc}") - - joined = "; ".join(errors[-3:]) - if ("412" in joined) or ("-799" in joined): - hint = "提示: 请在脚本里填写BILIBILI_COOKIE,或运行时加 --bili-cookie \"SESSDATA=...; buvid3=...\"" - raise RuntimeError(f"{joined}; {hint}") - raise RuntimeError(joined) - - -def clean_html(text: str) -> str: - return re.sub(r"<[^>]+>", "", text) - - -def call_volcengine_chat(system_prompt: str, user_prompt: str) -> str: - api_key = VOLCENGINE_API_KEY.strip() - base_url = VOLCENGINE_BASE_URL.strip() - model = VOLCENGINE_MODEL.strip() - - if (not api_key) or ("在这里填" in api_key): - raise RuntimeError("请先在脚本顶部填写 VOLCENGINE_API_KEY") - if (not model) or ("在这里填" in model): - raise RuntimeError("请先在脚本顶部填写 VOLCENGINE_MODEL") - if not base_url: - raise RuntimeError("请先在脚本顶部填写 VOLCENGINE_BASE_URL") - - url = f"{base_url.rstrip('/')}/chat/completions" - payload = { - "model": model, - "messages": [ - {"role": "system", "content": system_prompt}, - {"role": "user", "content": user_prompt}, - ], - "temperature": 0.4, - } - data = json.dumps(payload, ensure_ascii=False).encode("utf-8") - - req = request.Request( - url, - data=data, - headers={ - "Content-Type": "application/json", - "Authorization": f"Bearer {api_key}", - }, - method="POST", - ) - - with request.urlopen(req, timeout=60) as resp: - body = resp.read().decode("utf-8", errors="replace") - result = json.loads(body) - content = result.get("choices", [{}])[0].get("message", {}).get("content", "") - if not isinstance(content, str) or not content.strip(): - raise RuntimeError(f"火山引擎返回结构异常: {body[:500]}") - return content.strip() - - -def analyze_titles(up_name: str, up_url: str, titles: list[str]) -> str: - system_prompt = ( - "你是一个内容分析助手。根据视频标题判断UP主内容方向,并给出是否建议取关。" - "输出必须是简体中文,且严格按照用户给定的Markdown格式。" - ) - joined_titles = "\n".join(f"- {t}" for t in titles) - user_prompt = f""" -请分析以下UP主最近视频标题: - -UP主:{up_name} -主页:{up_url} -标题: -{joined_titles} - -请按以下格式输出(不要增加其它段落): -1) 内容定位:一句话 -2) 受众画像:一句话 -3) 近期内容倾向:2-3点,使用-开头 -4) 质量评价:80-120字 -5) 取关建议:保留关注/可以取关(二选一) -6) 建议理由:50-100字 -""".strip() - return call_volcengine_chat(system_prompt, user_prompt) - - -def build_report(results: list[dict[str, Any]]) -> str: - now = time.strftime("%Y-%m-%d %H:%M:%S") - lines: list[str] = [] - lines.append("# UP主内容分析报告") - lines.append("") - lines.append(f"- 生成时间: {now}") - lines.append(f"- 分析数量: {len(results)}") - lines.append("") - - for idx, item in enumerate(results, start=1): - lines.append(f"## {idx}. {item['name']} (mid: {item['mid']})") - lines.append("") - lines.append(f"- 主页: {item['url']}") - tags = item.get("tag", []) - lines.append(f"- 标签: {', '.join(tags) if tags else '无'}") - lines.append("") - lines.append("### 最近10条标题") - lines.append("") - titles = item.get("titles", []) - if titles: - for t in titles: - lines.append(f"- {t}") - else: - lines.append("- (未抓取到标题)") - lines.append("") - - analysis = item.get("analysis", "") - if analysis: - lines.append("### AI分析") - lines.append("") - lines.append(analysis) - lines.append("") - - error_msg = item.get("error", "") - if error_msg: - lines.append("### 异常") - lines.append("") - lines.append(f"- {error_msg}") - lines.append("") - - return "\n".join(lines).rstrip() + "\n" - - -def main() -> int: - global RUNTIME_BILIBILI_COOKIE - args = parse_args() - RUNTIME_BILIBILI_COOKIE = (args.bili_cookie or "").strip() - input_path = Path(args.input) - output_path = Path(args.output) - - if args.analyze_from_report: - return run_batch_analysis_from_report(args, output_path) - - if args.test_mid > 0: - items = [UpItem(mid=args.test_mid, name=args.test_name, tag=["测试模式"]) ] - print(f"测试模式: 仅处理 mid={args.test_mid}") - else: - if not input_path.exists(): - print(f"输入文件不存在: {input_path}", file=sys.stderr) - return 1 - - try: - items = load_up_items(input_path) - except Exception as exc: - print(f"加载输入文件失败: {exc}", file=sys.stderr) - return 1 - - if args.only_tag: - items = [it for it in items if args.only_tag in it.tag] - - if args.max_ups and args.max_ups > 0: - items = items[: args.max_ups] - - if not items: - print("没有可处理的 UP 数据", file=sys.stderr) - return 1 - - print(f"开始处理 {len(items)} 个 UP...") - if args.skip_ai: - print("已启用 --skip-ai,仅测试抓取标题") - if args.debug: - print(f"[debug] 当前抓取模式: {args.fetch_mode}") - - results: list[dict[str, Any]] = [] - for idx, item in enumerate(items, start=1): - up_url = f"https://space.bilibili.com/{item.mid}/video" - row: dict[str, Any] = { - "mid": item.mid, - "name": item.name or f"mid_{item.mid}", - "tag": item.tag, - "url": up_url, - "titles": [], - "analysis": "", - "error": "", - } - - print(f"[{idx}/{len(items)}] 抓取: {row['name']} ({item.mid})") - try: - titles = fetch_titles( - item.mid, - args.titles_per_up, - retry_times=args.retry_times, - debug=args.debug, - fetch_mode=args.fetch_mode, - ) - row["titles"] = titles - if not titles: - row["error"] = "未抓取到标题,可能是接口限制或UP无公开视频" - elif args.skip_ai: - row["analysis"] = "测试模式已跳过AI分析" - else: - row["analysis"] = analyze_titles(row["name"], up_url, titles) - except error.HTTPError as exc: - row["error"] = f"HTTP错误: {exc.code} {exc.reason}" - except error.URLError as exc: - row["error"] = f"网络错误: {exc.reason}" - except Exception as exc: # noqa: BLE001 - row["error"] = str(exc) - - if args.debug and row["titles"]: - sample = row["titles"][: min(3, len(row["titles"]))] - print(f"[debug] mid={item.mid} 成功抓取 {len(row['titles'])} 条,样例: {sample}") - - results.append(row) - time.sleep(max(args.sleep_seconds, 0)) - - report = build_report(results) - output_path.parent.mkdir(parents=True, exist_ok=True) - output_path.write_text(report, encoding="utf-8") - print(f"报告已生成: {output_path}") - return 0 - - -if __name__ == "__main__": - raise SystemExit(main()) diff --git a/source/scripts/batch_ai_summary_from_report.py b/source/scripts/batch_ai_summary_from_report.py deleted file mode 100644 index 9308608..0000000 --- a/source/scripts/batch_ai_summary_from_report.py +++ /dev/null @@ -1,598 +0,0 @@ -#!/usr/bin/env python3 -"""Batch AI summary from existing UP markdown report. - -Read an existing report (e.g. source/up_analysis_report.md), -extract each UP's title list, and generate AI summaries in batches. -""" - -from __future__ import annotations - -import argparse -from concurrent.futures import ThreadPoolExecutor, as_completed -import json -import math -import re -import sys -import time -from pathlib import Path -from typing import Any -from urllib import request - -# Fill your Volcengine Ark settings here. -VOLCENGINE_API_KEY = "586d443c-5034-4810-9760-50ce77394e8a" -VOLCENGINE_MODEL = "deepseek-v3-1-terminus" -VOLCENGINE_BASE_URL = "https://ark.cn-beijing.volces.com/api/v3" - -SKIP_MARKERS = { - "", - "测试模式已跳过AI分析", - "(待分析)", -} - -# 预设分组及关键词规则(可自行扩展)。 -PRESET_GROUPS: dict[str, list[str]] = { - "AAA_核心每日必读":[ - "编程", "算法", "工程", "干货", "新闻", "趋势", - ], - "AA_编程信息干货必留": [ - "编程", "算法", "工程", "教程", "实战", "课程", "新技术", "开源", "工具", "效率", "技术", "架构", - ], - "A_硬核知识保留": [ - "科普", "数学", "物理", "编程", "算法", "工程", "历史", "新闻", "深度", - ], - "B_技能学习保留": [ - "英语", "四六级", "考研", "面试", "教程", "实战", "学习", "课程", "写作", - ], - "C_资讯快餐观察": [ - "热点", "速览", "信息差", "快报", "盘点", "吐槽", "观点", "趋势", - ], - "D_娱乐消遣可取关": [ - "搞笑", "整活", "抽象", "乐子", "娱乐", "段子", "鬼畜", "日常", "情侣", - ], - "E_营销带货谨慎": [ - "好物", "测评", "种草", "直播", "带货", "优惠", "开箱", "广告", "激活", - ], -} - - -def parse_args() -> argparse.Namespace: - parser = argparse.ArgumentParser(description="基于现有报告分批做AI总结") - parser.add_argument( - "--input-report", - default="source/output/reports/1_up_titles_report.md", - help="已有标题报告路径", - ) - parser.add_argument( - "--output-report", - default="source/output/reports/2_up_analysis_full_auto.md", - help="输出报告路径", - ) - parser.add_argument( - "--batch-size", - type=int, - default=20, - help="每批处理数量,默认: 20", - ) - parser.add_argument( - "--batch-index", - type=int, - default=1, - help="批次序号(从1开始),默认: 1", - ) - parser.add_argument( - "--sleep-seconds", - type=float, - default=0.0, - help="提交任务间隔秒数,默认: 0(并发模式建议0)", - ) - parser.add_argument( - "--workers", - type=int, - default=4, - help="并发请求数,默认: 4", - ) - parser.add_argument( - "--max-retries", - type=int, - default=2, - help="单个UP分析最大重试次数,默认: 2", - ) - parser.add_argument( - "--request-timeout", - type=float, - default=60.0, - help="单次AI请求超时秒数,默认: 60", - ) - parser.add_argument( - "--force", - action="store_true", - help="强制覆盖已有AI分析(默认只处理待分析项)", - ) - parser.add_argument( - "--debug", - action="store_true", - help="输出调试信息", - ) - parser.add_argument( - "--config-from", - default="source/scripts/analyze_up_content.py", - help="自动读取API配置的脚本路径", - ) - parser.add_argument( - "--run-all-batches", - action="store_true", - help="自动连续跑完所有批次(忽略batch-index)", - ) - return parser.parse_args() - - -def load_api_config_from_script(path: Path) -> dict[str, str]: - if not path.exists(): - return {} - text = path.read_text(encoding="utf-8", errors="replace") - result: dict[str, str] = {} - for key in ("VOLCENGINE_API_KEY", "VOLCENGINE_MODEL", "VOLCENGINE_BASE_URL"): - m = re.search(rf"^{key}\s*=\s*\"([^\"]*)\"", text, flags=re.MULTILINE) - if m: - result[key] = m.group(1).strip() - return result - - -def parse_report(path: Path) -> list[dict[str, Any]]: - lines = path.read_text(encoding="utf-8").splitlines() - - items: list[dict[str, Any]] = [] - current: dict[str, Any] | None = None - section = "" - - for line in lines: - m = re.match(r"^##\s+\d+\.\s+(.*?)\s+\(mid:\s*(\d+)\)", line) - if m: - if current is not None: - items.append(current) - mid = int(m.group(2)) - current = { - "mid": mid, - "name": m.group(1).strip(), - "tag": [], - "url": f"https://space.bilibili.com/{mid}/video", - "titles": [], - "analysis": "", - "group": "", - "action": "", - "reason": "", - "error": "", - } - section = "" - continue - - if current is None: - continue - - if line.startswith("- 主页: "): - current["url"] = line.replace("- 主页: ", "", 1).strip() - continue - if line.startswith("- 标签: "): - raw = line.replace("- 标签: ", "", 1).strip() - current["tag"] = [] if raw in ("", "无") else [x.strip() for x in raw.split(",") if x.strip()] - continue - - if line == "### 最近10条标题": - section = "titles" - continue - if line == "### AI分析": - section = "analysis" - continue - if line == "### 分组建议": - section = "group" - continue - if line == "### 异常": - section = "error" - continue - if line.startswith("### "): - section = "" - continue - - if section == "titles" and line.startswith("- "): - text = line[2:].strip() - if text and text != "(未抓取到标题)": - current["titles"].append(text) - elif section == "analysis" and line.strip(): - current["analysis"] = (current["analysis"] + "\n" + line.strip()).strip() - elif section == "group": - if line.startswith("- 预设分组: "): - current["group"] = line.replace("- 预设分组: ", "", 1).strip() - elif line.startswith("- 建议动作: "): - current["action"] = line.replace("- 建议动作: ", "", 1).strip() - elif line.startswith("- 判断依据: "): - current["reason"] = line.replace("- 判断依据: ", "", 1).strip() - elif line.strip() == "(待分组)": - current["group"] = "" - current["action"] = "" - current["reason"] = "" - elif section == "error" and line.startswith("- "): - current["error"] = line[2:].strip() - - if current is not None: - items.append(current) - - return items - - -def call_volcengine_chat( - system_prompt: str, - user_prompt: str, - cfg: dict[str, str], - timeout: float, -) -> str: - api_key = cfg.get("VOLCENGINE_API_KEY", "").strip() - model = cfg.get("VOLCENGINE_MODEL", "").strip() - base_url = cfg.get("VOLCENGINE_BASE_URL", "").strip() - - if (not api_key) or ("在这里填" in api_key): - raise RuntimeError("请先在脚本顶部填写 VOLCENGINE_API_KEY") - if (not model) or ("在这里填" in model): - raise RuntimeError("请先在脚本顶部填写 VOLCENGINE_MODEL") - if not base_url: - raise RuntimeError("请先在脚本顶部填写 VOLCENGINE_BASE_URL") - - payload = { - "model": model, - "messages": [ - {"role": "system", "content": system_prompt}, - {"role": "user", "content": user_prompt}, - ], - "temperature": 0.4, - } - - body = json.dumps(payload, ensure_ascii=False).encode("utf-8") - req = request.Request( - f"{base_url.rstrip('/')}/chat/completions", - data=body, - headers={ - "Content-Type": "application/json", - "Authorization": f"Bearer {api_key}", - }, - method="POST", - ) - - with request.urlopen(req, timeout=timeout) as resp: - text = resp.read().decode("utf-8", errors="replace") - - data = json.loads(text) - content = data.get("choices", [{}])[0].get("message", {}).get("content", "") - if not isinstance(content, str) or not content.strip(): - raise RuntimeError(f"AI响应异常: {text[:500]}") - return content.strip() - - -def summarize_one_up( - name: str, - mid: int, - titles: list[str], - tags: list[str], - cfg: dict[str, str], - timeout: float, -) -> dict[str, str]: - system_prompt = ( - "你是内容定位与订阅决策助手。" - "你必须输出合法JSON,不要输出其它文本。" - ) - joined_titles = "\n".join(f"- {t}" for t in titles) - joined_tags = "、".join(tags) if tags else "无" - rule_hint = heuristic_group_hint(titles, tags) - groups_desc = "\n".join(f"- {k}" for k in PRESET_GROUPS) - - user_prompt = f""" -请基于以下信息完成分组与总结。 - -UP主: {name} -mid: {mid} -标签: {joined_tags} -最近标题: -{joined_titles} - -预设分组: -{groups_desc} - -代码规则初判: -{rule_hint} - -要求: -1) 输出JSON对象,字段严格为: summary, group, action, reason。 -2) summary: 一段中文总结,50-100字。 -3) group: 必须从预设分组里选一个。给出详细的分组类别和命中分组中的规则词。 -4) action: 只能是"保留关注"或"可以取关"。敏感一点,只保留真正核心优质的up,其他都建议取关。 -5) reason: 30-60字,解释为什么分到该组并给出该动作。 -""".strip() - - content = call_volcengine_chat(system_prompt, user_prompt, cfg, timeout=timeout) - return parse_ai_json(content) - - -def parse_ai_json(content: str) -> dict[str, str]: - text = content.strip() - if text.startswith("```"): - text = re.sub(r"^```[a-zA-Z]*\n?", "", text) - text = re.sub(r"\n?```$", "", text).strip() - m = re.search(r"\{.*\}", text, flags=re.DOTALL) - if m: - text = m.group(0) - data = json.loads(text) - summary = str(data.get("summary", "")).strip() - group = str(data.get("group", "")).strip() - action = str(data.get("action", "")).strip() - reason = str(data.get("reason", "")).strip() - if not summary: - raise RuntimeError("AI返回缺少summary") - if group not in PRESET_GROUPS: - raise RuntimeError(f"AI返回未知group: {group}") - if action not in ("保留关注", "可以取关"): - raise RuntimeError(f"AI返回未知action: {action}") - if not reason: - reason = "基于标题内容与更新风格综合判断。" - return { - "summary": summary, - "group": group, - "action": action, - "reason": reason, - } - - -def heuristic_group_hint(titles: list[str], tags: list[str]) -> str: - text = "\n".join(titles) + "\n" + " ".join(tags) - score: dict[str, int] = {k: 0 for k in PRESET_GROUPS} - lower_text = text.lower() - for group, words in PRESET_GROUPS.items(): - for w in words: - w_lower = w.lower() - if w_lower in lower_text: - score[group] += 1 - ranked = sorted(score.items(), key=lambda x: x[1], reverse=True) - best_group, best_score = ranked[0] - if best_score <= 0: - return "未命中关键词,倾向按内容专业度与稳定性判断。" - top3 = ", ".join(f"{g}:{s}" for g, s in ranked[:3]) - return f"关键词命中最高组={best_group}(score={best_score}),参考分布: {top3}" - - -def summarize_one_up_with_retry( - item: dict[str, Any], - cfg: dict[str, str], - max_retries: int, - timeout: float, - debug: bool, -) -> dict[str, str]: - last_exc: Exception | None = None - total_try = max(1, max_retries) - for attempt in range(1, total_try + 1): - try: - return summarize_one_up( - item["name"], - item["mid"], - item.get("titles", []), - item.get("tag", []), - cfg, - timeout=timeout, - ) - except Exception as exc: # noqa: BLE001 - last_exc = exc - if debug: - print(f"[debug] {item['name']} 第{attempt}次失败: {exc}") - if attempt < total_try: - time.sleep(min(2.0, 0.5 * attempt)) - raise RuntimeError(str(last_exc) if last_exc else "未知错误") - - -def build_report(items: list[dict[str, Any]], batch_note: str) -> str: - now = time.strftime("%Y-%m-%d %H:%M:%S") - lines: list[str] = [ - "# UP主内容分析报告(分批AI总结)", - "", - f"- 生成时间: {now}", - f"- 分析数量: {len(items)}", - f"- 处理说明: {batch_note}", - "", - ] - - group_stats: dict[str, int] = {k: 0 for k in PRESET_GROUPS} - action_stats: dict[str, int] = {"保留关注": 0, "可以取关": 0} - for item in items: - g = item.get("group", "") - a = item.get("action", "") - if g in group_stats: - group_stats[g] += 1 - if a in action_stats: - action_stats[a] += 1 - - lines.append("## 分组统计") - lines.append("") - for g, c in group_stats.items(): - lines.append(f"- {g}: {c}") - lines.append(f"- 保留关注: {action_stats['保留关注']}") - lines.append(f"- 可以取关: {action_stats['可以取关']}") - lines.append("") - - for idx, item in enumerate(items, start=1): - lines.append(f"## {idx}. {item['name']} (mid: {item['mid']})") - lines.append("") - lines.append(f"- 主页: {item['url']}") - tags = item.get("tag", []) - lines.append(f"- 标签: {', '.join(tags) if tags else '无'}") - lines.append("") - lines.append("### 最近10条标题") - lines.append("") - titles = item.get("titles", []) - if titles: - for t in titles: - lines.append(f"- {t}") - else: - lines.append("- (未抓取到标题)") - lines.append("") - - lines.append("### AI分析") - lines.append("") - analysis = item.get("analysis", "") - lines.append(analysis if analysis else "(待分析)") - lines.append("") - - lines.append("### 分组建议") - lines.append("") - group = item.get("group", "") - action = item.get("action", "") - reason = item.get("group_reason", "") - if group and action: - lines.append(f"- 预设分组: {group}") - lines.append(f"- 建议动作: {action}") - lines.append(f"- 判断依据: {reason if reason else '基于标题与更新风格综合判断。'}") - else: - lines.append("- (待分组)") - lines.append("") - - error = item.get("error", "") - if error: - lines.append("### 异常") - lines.append("") - lines.append(f"- {error}") - lines.append("") - - return "\n".join(lines).rstrip() + "\n" - - -def main() -> int: - args = parse_args() - input_report = Path(args.input_report) - output_report = Path(args.output_report) - - if not input_report.exists(): - print(f"输入报告不存在: {input_report}", file=sys.stderr) - return 1 - - items = parse_report(input_report) - if not items: - print("输入报告未解析出任何UP条目", file=sys.stderr) - return 1 - - config = { - "VOLCENGINE_API_KEY": VOLCENGINE_API_KEY, - "VOLCENGINE_MODEL": VOLCENGINE_MODEL, - "VOLCENGINE_BASE_URL": VOLCENGINE_BASE_URL, - } - if ("在这里填" in config["VOLCENGINE_API_KEY"]) or ("在这里填" in config["VOLCENGINE_MODEL"]): - inherited = load_api_config_from_script(Path(args.config_from)) - if inherited: - config.update(inherited) - - if args.force: - pending = [it for it in items if it.get("titles")] - # else: - # pending = [ - # it for it in items - # if it.get("titles") and it.get("analysis", "").strip() in SKIP_MARKERS - # ] - else: - pending = [ - it for it in items - if it.get("titles") and ( - it.get("analysis", "").strip() in SKIP_MARKERS - or not it.get("group") # 没有分组也要重跑 - ) - ] - - if not pending: - print("没有待分析条目,直接输出当前报告") - output_report.write_text(build_report(items, "无待分析条目"), encoding="utf-8") - return 0 - - index_map = {f"{it['mid']}::{it['name']}": idx for idx, it in enumerate(items)} - success_total = 0 - failed_total = 0 - - batch_size = max(1, args.batch_size) - if args.run_all_batches: - total_batches = math.ceil(len(pending) / batch_size) - batch_indexes = list(range(1, total_batches + 1)) - print(f"自动连续模式: 共{total_batches}批, 待分析总数{len(pending)}") - else: - batch_indexes = [max(1, args.batch_index)] - - workers = max(1, args.workers) - print(f"并发配置: workers={workers}, retries={max(1, args.max_retries)}, timeout={args.request_timeout}s") - - for batch_index in batch_indexes: - start = (batch_index - 1) * batch_size - end = start + batch_size - batch = pending[start:end] - if not batch: - continue - - print( - f"开始分批AI总结: 第{batch_index}批, 每批{batch_size}条, " - f"本批{len(batch)}条, 待分析总数{len(pending)}" - ) - - success = 0 - failed = 0 - future_to_item: dict[Any, dict[str, Any]] = {} - with ThreadPoolExecutor(max_workers=workers) as executor: - for i, it in enumerate(batch, start=1): - print(f"[submit {i}/{len(batch)}] {it['name']} ({it['mid']})") - future = executor.submit( - summarize_one_up_with_retry, - it, - config, - max(1, args.max_retries), - float(args.request_timeout), - args.debug, - ) - future_to_item[future] = it - if args.sleep_seconds > 0: - time.sleep(args.sleep_seconds) - - done_count = 0 - for future in as_completed(future_to_item): - done_count += 1 - it = future_to_item[future] - idx = index_map.get(f"{it['mid']}::{it['name']}") - try: - ai_res = future.result() - if idx is not None: - items[idx]["analysis"] = ai_res["summary"] - items[idx]["group"] = ai_res["group"] - items[idx]["action"] = ai_res["action"] - items[idx]["group_reason"] = ai_res["reason"] - items[idx]["error"] = "" - success += 1 - print(f"[done {done_count}/{len(batch)}] 成功: {it['name']} ({it['mid']})") - except Exception as exc: # noqa: BLE001 - if idx is not None: - items[idx]["error"] = str(exc) - failed += 1 - print(f"[done {done_count}/{len(batch)}] 失败: {it['name']} ({it['mid']})") - if args.debug: - print(f"[debug] 失败详情: {exc}") - - success_total += success - failed_total += failed - - step_note = ( - f"第{batch_index}批完成: 成功{success}, 失败{failed}, " - f"本批{len(batch)}, 待分析总数{len(pending)}" - ) - output_report.parent.mkdir(parents=True, exist_ok=True) - output_report.write_text(build_report(items, step_note), encoding="utf-8") - print(f"第{batch_index}批写入完成: {output_report}") - - mode_text = "自动连续" if args.run_all_batches else "单批" - note = ( - f"{mode_text}模式完成: 成功{success_total}, 失败{failed_total}, " - f"处理批次数={len(batch_indexes)}, 待分析总数={len(pending)}" - ) - output_report.parent.mkdir(parents=True, exist_ok=True) - output_report.write_text(build_report(items, note), encoding="utf-8") - print(f"输出完成: {output_report}") - return 0 - - -if __name__ == "__main__": - raise SystemExit(main()) diff --git a/source/scripts/extract_group_info.py b/source/scripts/extract_group_info.py deleted file mode 100644 index 9b81fc1..0000000 --- a/source/scripts/extract_group_info.py +++ /dev/null @@ -1,101 +0,0 @@ -import argparse -import re - -def parse_args() -> argparse.Namespace: - parser = argparse.ArgumentParser(description="提取UP分组信息") - parser.add_argument( - "--input", - default="./source/19_53_no_titles.md", - help="输入报告路径", - ) - parser.add_argument( - "--output", - help="输出报告路径(默认覆盖输入)", - ) - return parser.parse_args() - -def main(): - args = parse_args() - input_file = args.input - output_file = args.output or input_file - - with open(input_file, 'r', encoding='utf-8') as f: - content = f.read() - - lines = content.split('\n') - section_starts = [] - for i, line in enumerate(lines): - if line.startswith('## '): - section_starts.append(i) - - if len(section_starts) < 2: - print('No sections found') - return 1 - - header = '\n'.join(lines[:section_starts[0]]) - sections = [] - - for idx in range(len(section_starts)): - start = section_starts[idx] - end = section_starts[idx + 1] if idx + 1 < len(section_starts) else len(lines) - section = '\n'.join(lines[start:end]) - sections.append(section) - - sections = sections[1:] - - parsed = [] - for sec in sections: - match = re.match(r'^## (\d+)\. (.+) \(mid: (\d+)\)', sec) - if match: - num = int(match.group(1)) - name = match.group(2) - mid = match.group(3) - - group_m = re.search(r'- 预设分组: (.+)', sec) - action_m = re.search(r'- 建议动作: (.+)', sec) - reason_m = re.search(r'- 判断依据: (.+)', sec) - error_m = re.search(r'AI返回未知group: (.+)', sec) - - group = group_m.group(1).strip() if group_m else "" - action = action_m.group(1).strip() if action_m else "" - reason = reason_m.group(1).strip() if reason_m else "" - error = error_m.group(1).strip() if error_m else "" - - parsed.append({ - 'num': num, - 'name': name, - 'mid': mid, - 'group': group, - 'action': action, - 'reason': reason, - 'error': error - }) - - parsed.sort(key=lambda x: (x['name'].casefold(), int(x['mid']))) - - lines_out = [header, ""] - - for p in parsed: - lines_out.append(f"## {p['num']}. {p['name']} (mid: {p['mid']})") - lines_out.append("") - if p['group']: - lines_out.append(f"- 预设分组: {p['group']}") - if p['action']: - lines_out.append(f"- 建议动作: {p['action']}") - if p['reason']: - lines_out.append(f"- 判断依据: {p['reason']}") - if p['error']: - lines_out.append(f"- 异常: {p['error']}") - lines_out.append("") - - result = '\n'.join(lines_out) - result = re.sub(r'\n{3,}', '\n\n', result) - - with open(output_file, 'w', encoding='utf-8') as f: - f.write(result) - - print(f'Extracted {len(parsed)} sections') - return 0 - -if __name__ == "__main__": - raise SystemExit(main()) \ No newline at end of file diff --git a/source/scripts/extract_keep_follow_doc.py b/source/scripts/extract_keep_follow_doc.py deleted file mode 100644 index afe96f7..0000000 --- a/source/scripts/extract_keep_follow_doc.py +++ /dev/null @@ -1,104 +0,0 @@ -#!/usr/bin/env python3 -from __future__ import annotations - -import argparse -import re -import time -from pathlib import Path - - -def parse_args() -> argparse.Namespace: - parser = argparse.ArgumentParser(description="提取非取关UP的AI分析与分组建议") - parser.add_argument( - "--input-report", - default="source/output/reports/2_up_analysis_full_auto.md", - help="输入分析报告路径", - ) - parser.add_argument( - "--output-report", - default="source/output/reports/3_up_keep_follow_only.md", - help="输出保留关注报告路径", - ) - return parser.parse_args() - - -def main() -> int: - args = parse_args() - src = Path(args.input_report) - dst = Path(args.output_report) - - if not src.exists(): - print(f"来源文件不存在: {src}") - return 1 - - text = src.read_text(encoding="utf-8") - pattern = r"^##\s+\d+\.\s+(.+?)\s+\(mid:\s*(\d+)\)\s*$" - matches = list(re.finditer(pattern, text, re.MULTILINE)) - - items: list[tuple[str, str, str, str, str, str]] = [] - for i, m in enumerate(matches): - start = m.start() - end = matches[i + 1].start() if i + 1 < len(matches) else len(text) - section = text[start:end] - - name = m.group(1).strip() - mid = m.group(2).strip() - - action_m = re.search(r"-\s*建议动作:\s*(.+)", section) - action = action_m.group(1).strip() if action_m else "" - # 反逻辑:没有"建议动作: 可以取关"就保留 - if action == "可以取关": - continue - - ai_m = re.search(r"###\s*AI分析\s*\n([\s\S]*?)(?=\n###\s|\Z)", section) - ai_text = ai_m.group(1).strip() if ai_m else "" - - group_m = re.search(r"###\s*分组建议\s*\n([\s\S]*?)(?=\n###\s|\Z)", section) - group_text = group_m.group(1).strip() if group_m else "" - - error_m = re.search(r"###\s*异常\s*\n([\s\S]*?)(?=\n###\s|\Z)", section) - error_text = error_m.group(1).strip() if error_m else "" - - items.append((name, mid, ai_text, group_text, action, error_text)) - - # 按昵称首字母A-Z排序(同名时按mid升序) - items.sort(key=lambda x: (x[0].casefold(), int(x[1]))) - - lines = [ - "# 保留关注UP主分析与分组建议", - "", - f"- 生成时间: {time.strftime('%Y-%m-%d %H:%M:%S')}", - f"- 来源文件: {src.name}", - f"- 条目数: {len(items)}", - "", - ] - - for idx, (name, mid, ai_text, group_text, action, error_text) in enumerate(items, 1): - lines.append(f"## {idx}. {name} (mid: {mid})") - lines.append("") - - lines.append("### AI分析") - lines.append("") - lines.append(ai_text if ai_text else "(无)") - lines.append("") - - lines.append("### 分组建议") - lines.append("") - lines.append(group_text if group_text else f"- 建议动作: {action if action else '(无)'}") - lines.append("") - - if error_text: - lines.append("### 异常") - lines.append("") - lines.append(error_text) - lines.append("") - - dst.parent.mkdir(parents=True, exist_ok=True) - dst.write_text("\n".join(lines), encoding="utf-8") - print(f"已生成: {dst}") - print(f"保留条目: {len(items)}") - return 0 - - -if __name__ == "__main__": - raise SystemExit(main()) \ No newline at end of file diff --git a/source/scripts/extract_unfollow_list.py b/source/scripts/extract_unfollow_list.py deleted file mode 100644 index 62fc57e..0000000 --- a/source/scripts/extract_unfollow_list.py +++ /dev/null @@ -1,174 +0,0 @@ -#!/usr/bin/env python3 -"""Extract UPs marked as "可以取关" and output their mids to CSV. - -Read an UP analysis report and extract all UPs with action "可以取关", -then output their mids to a CSV file. -""" - -from __future__ import annotations - -import argparse -import csv -import re -import sys -from pathlib import Path -from typing import Any - - -def parse_report(report_path: Path) -> list[dict[str, Any]]: - """解析Markdown格式的UP分析报告,返回UP列表""" - if not report_path.exists(): - return [] - - text = report_path.read_text(encoding="utf-8") - items = [] - - # 按UP项分割(每个UP项以"## N. 名字 (mid: ...)"开头) - pattern = r"^## \d+\. (.+?)\s+\(mid:\s*(\d+)\)" - matches = list(re.finditer(pattern, text, re.MULTILINE)) - - for i, match in enumerate(matches): - start = match.start() - end = matches[i + 1].start() if i + 1 < len(matches) else len(text) - section = text[start:end] - - name = match.group(1).strip() - mid = int(match.group(2)) - - # 提取建议动作 - action_match = re.search(r"- 建议动作: (.+?)(?:\n|$)", section) - action = action_match.group(1).strip() if action_match else "" - - items.append({ - "mid": mid, - "name": name, - "action": action, - }) - - return items - - -def main() -> int: - parser = argparse.ArgumentParser(description="从UP分析报告中提取可以取关的UP") - parser.add_argument( - "--input-report", - default="source/output/reports/2_up_analysis_full_auto.md", - help="输入报告路径", - ) - parser.add_argument( - "--output-csv", - default="source/output/uids/4_unfollow_mids_list.txt", - help="输出文件路径", - ) - parser.add_argument( - "--format", - choices=["csv", "mid-only", "json"], - default="mid-only", - help="输出格式:csv(mid,name), mid-only(仅mid逗号分隔), json(JSON格式)", - ) - parser.add_argument( - "--with-names", - action="store_true", - help="在mid后添加UP名称(仅mid-only格式生效)", - ) - parser.add_argument( - "--split-size", - type=int, - default=0, - help="可选:将mid-only结果按N个一组拆分多个文件,例如100", - ) - - args = parser.parse_args() - - input_report = Path(args.input_report) - output_csv = Path(args.output_csv) - - if not input_report.exists(): - print(f"错误: 输入报告不存在: {input_report}", file=sys.stderr) - return 1 - - print(f"读取报告: {input_report}") - items = parse_report(input_report) - - if not items: - print("未能从报告中解析任何UP", file=sys.stderr) - return 1 - - # 筛选可以取关的UP - unfollow_items = [it for it in items if it.get("action") == "可以取关"] - - print(f"总 UP 数: {len(items)}") - print(f"可以取关: {len(unfollow_items)}") - - if not unfollow_items: - print("没有可以取关的UP") - return 0 - - # 输出格式 - if args.format == "csv": - # 标准CSV格式:mid, name - output_csv.parent.mkdir(parents=True, exist_ok=True) - with open(output_csv, "w", newline="", encoding="utf-8") as f: - writer = csv.DictWriter(f, fieldnames=["mid", "name"]) - writer.writeheader() - for item in unfollow_items: - writer.writerow({"mid": item["mid"], "name": item["name"]}) - - print(f"\n✓ 已输出CSV格式到: {output_csv}") - print(f" 格式: mid,name") - print(f" 行数: {len(unfollow_items)}") - - elif args.format == "mid-only": - # 仅mid,逗号分隔 - mids = [str(it["mid"]) for it in unfollow_items] - - if args.with_names: - # mid:name 格式 - content = ",".join([f"{it['mid']}:{it['name']}" for it in unfollow_items]) - print(f"\n✓ 已输出mid:name列表到: {output_csv}") - print(f" 格式: mid1:name1,mid2:name2,...") - else: - # 仅mid - content = ",".join(mids) - print(f"\n✓ 已输出mid列表到: {output_csv}") - print(f" 格式: mid1,mid2,mid3,...") - - output_csv.parent.mkdir(parents=True, exist_ok=True) - output_csv.write_text(content, encoding="utf-8") - print(f" 数量: {len(mids)}") - - split_size = max(0, int(args.split_size)) - if split_size > 0: - groups = [mids[i:i + split_size] for i in range(0, len(mids), split_size)] - stem = output_csv.stem - suffix = output_csv.suffix or ".txt" - for i, group in enumerate(groups, start=1): - part_path = output_csv.with_name(f"{stem}_{i}{suffix}") - part_path.write_text(",".join(group), encoding="utf-8") - print(f" 已按每组{split_size}个拆分为{len(groups)}个文件") - - elif args.format == "json": - # JSON格式 - import json - - data = [{"mid": it["mid"], "name": it["name"]} for it in unfollow_items] - output_csv.parent.mkdir(parents=True, exist_ok=True) - output_csv.write_text(json.dumps(data, ensure_ascii=False, indent=2), encoding="utf-8") - - print(f"\n✓ 已输出JSON格式到: {output_csv}") - print(f" 数量: {len(data)}") - - # 显示前10个示例 - if len(unfollow_items) > 0: - print(f"\n📋 示例(前10个):") - for item in unfollow_items[:10]: - print(f" - {item['mid']}: {item['name']}") - - if len(unfollow_items) > 10: - print(f" ... 还有 {len(unfollow_items) - 10} 个") - - return 0 - - -if __name__ == "__main__": - sys.exit(main()) diff --git a/source/scripts/remove_10content.py b/source/scripts/remove_10content.py deleted file mode 100644 index aae1058..0000000 --- a/source/scripts/remove_10content.py +++ /dev/null @@ -1,67 +0,0 @@ -import argparse -import re - -def parse_args() -> argparse.Namespace: - parser = argparse.ArgumentParser(description="删除最近10条标题内容") - parser.add_argument( - "--input", - default="source/output/reports/2_up_analysis_full_auto.md", - help="输入报告路径", - ) - parser.add_argument( - "--output", - help="输出报告路径(默认覆盖输入)", - ) - return parser.parse_args() - -def main(): - args = parse_args() - input_file = args.input - output_file = args.output or input_file - - with open(input_file, 'r', encoding='utf-8') as f: - content = f.read() - - lines = content.split('\n') - new_lines = [] - i = 0 - while i < len(lines): - line = lines[i] - new_lines.append(line) - - if line.startswith('## '): - i += 1 - while i < len(lines): - curr = lines[i] - if curr.startswith('## '): - break - if curr.startswith('### '): - if '最近10条标题' in curr: - i += 1 - while i < len(lines) and lines[i].startswith(' - '): - i += 1 - continue - else: - break - if curr.startswith('- ') and not curr.startswith(' - '): - i += 1 - continue - if curr.startswith(' - '): - i += 1 - continue - new_lines.append(curr) - i += 1 - else: - i += 1 - - result = '\n'.join(new_lines) - result = re.sub(r'\n{3,}', '\n\n', result) - - with open(output_file, 'w', encoding='utf-8') as f: - f.write(result) - - print(f'Done: {output_file}') - return 0 - -if __name__ == "__main__": - raise SystemExit(main()) \ No newline at end of file diff --git a/source/scripts/run_pipeline.py b/source/scripts/run_pipeline.py deleted file mode 100644 index 688bff5..0000000 --- a/source/scripts/run_pipeline.py +++ /dev/null @@ -1,208 +0,0 @@ -#!/usr/bin/env python3 -"""One-command pipeline: fetch titles -> batch analyze -> outputs. - -Pipeline outputs: -1) source/output/reports/1_up_titles_report.md -2) source/output/reports/2_up_analysis_full_auto.md -3) source/output/reports/3_up_keep_follow_only.md -4) source/output/uids/4_unfollow_mids_list.txt (+ split files) - -Pipeline steps: -1) 抓取视频标题 (analyze_up_content.py) -2) 分批AI分析 (batch_ai_summary_from_report.py) -3) 生成保留关注报告 (extract_keep_follow_doc.py) -4) 生成取关UID列表 (extract_unfollow_list.py) -5) 按首字母排序 (sort_up_main.py) -6) 提取分组信息 (extract_group_info.py) -""" - -from __future__ import annotations - -import argparse -import subprocess -import sys -from pathlib import Path - - -def parse_args() -> argparse.Namespace: - parser = argparse.ArgumentParser(description="一键运行完整功能链") - parser.add_argument( - "--input-json", - default="source/resources/export_uids.json", - help="UP资源文件路径,默认: source/resources/export_uids.json", - ) - parser.add_argument( - "--titles-report", - default="source/output/reports/1_up_titles_report.md", - help="标题抓取报告输出路径", - ) - parser.add_argument( - "--analysis-report", - default="source/output/reports/2_up_analysis_full_auto.md", - help="分批分析报告输出路径", - ) - parser.add_argument( - "--keep-report", - default="source/output/reports/3_up_keep_follow_only.md", - help="保留关注报告输出路径", - ) - parser.add_argument( - "--unfollow-uids", - default="source/output/uids/4_unfollow_mids_list.txt", - help="取关UID输出路径", - ) - parser.add_argument( - "--group_info", - default="source/output/uids/only_group_info.md", - help="分组信息输出路径", - ) - parser.add_argument("--titles-per-up", type=int, default=10, help="每个UP抓取标题数量") - parser.add_argument("--batch-size", type=int, default=20, help="分批分析每批条数") - parser.add_argument("--workers", type=int, default=6, help="并发请求数") - parser.add_argument("--max-retries", type=int, default=2, help="单条分析重试次数") - parser.add_argument("--request-timeout", type=float, default=60.0, help="单次请求超时") - parser.add_argument("--split-size", type=int, default=100, help="取关UID拆分分组大小") - parser.add_argument("--sleep-seconds", type=float, default=0.0, help="任务间隔秒数") - parser.add_argument("--retry-times", type=int, default=3, help="抓取重试次数") - parser.add_argument("--fetch-mode", choices=["auto", "api", "html"], default="auto", help="标题抓取模式") - parser.add_argument("--only-tag", default="", help="可选:仅处理包含该标签的UP") - parser.add_argument("--max-ups", type=int, default=0, help="可选:限制处理UP数量") - parser.add_argument("--bili-cookie", default="", help="可选:运行时传入B站Cookie") - parser.add_argument("--skip-fetch", action="store_true", help="跳过抓取阶段,直接使用已有标题报告") - parser.add_argument("--skip-analyze", action="store_true", help="跳过分析阶段,直接做产物提取") - parser.add_argument("--skip-sort", action="store_true", help="跳过排序阶段") - parser.add_argument("--skip-group", action="store_true", help="跳过提取分组阶段") - parser.add_argument("--python", default=sys.executable, help="指定Python解释器") - return parser.parse_args() - - -def run_cmd(cmd: list[str], title: str) -> None: - print(f"\n=== {title} ===") - print("$", " ".join(cmd)) - subprocess.run(cmd, check=True) - - -def main() -> int: - args = parse_args() - - for p in [ - Path(args.titles_report).parent, - Path(args.analysis_report).parent, - Path(args.keep_report).parent, - Path(args.unfollow_uids).parent, - ]: - p.mkdir(parents=True, exist_ok=True) - - if not args.skip_fetch: - fetch_cmd = [ - args.python, - "source/scripts/analyze_up_content.py", - "--input", - args.input_json, - "--output", - args.titles_report, - "--titles-per-up", - str(max(1, args.titles_per_up)), - "--retry-times", - str(max(1, args.retry_times)), - "--fetch-mode", - args.fetch_mode, - "--sleep-seconds", - str(max(0.0, args.sleep_seconds)), - "--skip-ai", - ] - if args.only_tag: - fetch_cmd += ["--only-tag", args.only_tag] - if args.max_ups > 0: - fetch_cmd += ["--max-ups", str(args.max_ups)] - if args.bili_cookie: - fetch_cmd += ["--bili-cookie", args.bili_cookie] - - run_cmd(fetch_cmd, "步骤1/6 抓取视频标题") - - if not args.skip_analyze: - analyze_cmd = [ - args.python, - "source/scripts/batch_ai_summary_from_report.py", - "--input-report", - args.titles_report, - "--output-report", - args.analysis_report, - "--batch-size", - str(max(1, args.batch_size)), - "--run-all-batches", - "--workers", - str(max(1, args.workers)), - "--max-retries", - str(max(1, args.max_retries)), - "--request-timeout", - str(max(1.0, args.request_timeout)), - "--sleep-seconds", - str(max(0.0, args.sleep_seconds)), - ] - run_cmd(analyze_cmd, "步骤2/6 分批AI分析") - - keep_cmd = [ - args.python, - "source/scripts/extract_keep_follow_doc.py", - "--input-report", - args.analysis_report, - "--output-report", - args.keep_report, - ] - run_cmd(keep_cmd, "步骤3/6 生成保留关注报告") - - uid_cmd = [ - args.python, - "source/scripts/extract_unfollow_list.py", - "--input-report", - args.analysis_report, - "--output-csv", - args.unfollow_uids, - "--format", - "mid-only", - "--split-size", - str(max(0, args.split_size)), - ] - run_cmd(uid_cmd, "步骤4/6 生成取关UID列表") - - sorted_report = "source/output/reports/5_sorted_up_analysis.md" - group_report = "source/output/reports/6_group_info.md" - - if not args.skip_sort: - sort_cmd = [ - args.python, - "source/scripts/sort_up_main.py", - "--input", - args.analysis_report, - "--output", - sorted_report, - ] - run_cmd(sort_cmd, "步骤5/6 按首字母排序") - - if not args.skip_group: - input_for_group = sorted_report if not args.skip_sort else args.analysis_report - group_cmd = [ - args.python, - "source/scripts/extract_group_info.py", - "--input", - input_for_group, - "--output", - group_report, - ] - run_cmd(group_cmd, "步骤6/6 提取分组信息") - - print("\n流水线完成。") - print(f"- 1 标题报告: {args.titles_report}") - print(f"- 2 分析报告: {args.analysis_report}") - print(f"- 3 保留报告: {args.keep_report}") - print(f"- 4 取关UID: {args.unfollow_uids}") - if not args.skip_sort: - print(f"- 5 排序报告: {sorted_report}") - if not args.skip_group: - print(f"- 6 分组报告: {group_report}") - return 0 - - -if __name__ == "__main__": - raise SystemExit(main()) diff --git a/source/scripts/sort_up_main.py b/source/scripts/sort_up_main.py deleted file mode 100644 index d3ecc4e..0000000 --- a/source/scripts/sort_up_main.py +++ /dev/null @@ -1,93 +0,0 @@ -import argparse -import re - -def parse_args() -> argparse.Namespace: - parser = argparse.ArgumentParser(description="对UP主按首字母排序") - parser.add_argument( - "--input", - default="source/output/reports/2_up_analysis_full_auto.md", - help="输入报告路径", - ) - parser.add_argument( - "--output", - help="输出报告路径(默认覆盖输入)", - ) - return parser.parse_args() - -def main(): - args = parse_args() - input_file = args.input - output_file = args.output or input_file - - with open(input_file, 'r', encoding='utf-8') as f: - content = f.read() - - lines = content.split('\n') - - header_lines = [] - section_starts = [] - for i, line in enumerate(lines): - if line.startswith('## '): - section_starts.append(i) - - if len(section_starts) < 2: - print('No sections found') - return 1 - - header = '\n'.join(lines[:section_starts[0]]) - sections_data = [] - - for idx in range(len(section_starts)): - start = section_starts[idx] - if idx + 1 < len(section_starts): - end = section_starts[idx + 1] - else: - end = len(lines) - - section_lines = lines[start:end] - section_text = '\n'.join(section_lines) - sections_data.append(section_text) - - sections_data = sections_data[1:] - - parsed = [] - for sec in sections_data: - match = re.match(r'^## (\d+)\. (.+) \(mid: (\d+)\)', sec) - if match: - num = int(match.group(1)) - name = match.group(2) - mid = match.group(3) - parsed.append({ - 'num': num, - 'name': name, - 'mid': mid, - 'content': sec - }) - - def sort_key(item): - name = item['name'] - first_char = name[0].lower() if name else '' - if first_char.isdigit(): - return '0' + first_char - elif first_char.isalpha(): - return '1' + first_char - else: - return '2' + first_char - - parsed.sort(key=sort_key) - - new_content = header + '\n' - for i, sec in enumerate(parsed): - new_content += sec['content'] + '\n' - - with open(output_file, 'w', encoding='utf-8') as f: - f.write(new_content) - - print(f'Sorted {len(parsed)} sections') - print('First 10:') - for s in parsed[:10]: - print(f' {s["name"]}') - return 0 - -if __name__ == "__main__": - raise SystemExit(main()) \ No newline at end of file