您的位置: 网站首页> SEO工具> 当前文章
selenium贴吧批量发帖(多账号多吧)
老董-我爱我家房产SEO 2020-11-13 160围观,139赞
一堆账号一堆吧,挨个发帖累趴下,不宜手动,需要脚本。selenium多账号对贴吧发帖脚本如下:
注意:
1、发帖按钮用的js提交,如果发布过程出现输入验证码,会提示发布成功但实际上未发布上去。
功能:多账号多吧多条内容,每个账号在每个吧发第一条内容,第二条内容。默认发帖间隔60-70秒
用法:
1、要准备cookie_zh.txt, 一行一个cookie
2、准备一个test文件夹,里面放一堆txt文件,每个txt文件是一个帖子(帖子标题是文件名,内容是文件内容)
3、准备好tiebas.txt,一行一个要发的贴吧网址(https://tieba.baidu.com/f?kw=百度&ie=utf-8)
# -*- coding: utf-8 -*-
"""Batch-post threads to Baidu Tieba with several accounts through Selenium.

Note:
    The post is submitted through JavaScript. If a captcha is shown while
    publishing, the script still reports success although nothing was posted.

Behaviour:
    Multiple accounts, multiple forums, multiple posts. Every account picks a
    post at random and publishes it to every forum, then picks the next one.
    The default pause between posts is 60-70 seconds.

Usage:
    * cookie_zh.txt - one account cookie string per line.
    * test/         - folder of UTF-8 .txt files, one post per file (the file
                      name is the title, the file content is the body).
    * tiebas.txt    - one forum URL per line.
"""
import time
from selenium import webdriver
from selenium.webdriver.common.by import By
from selenium.webdriver.support.ui import WebDriverWait
from selenium.webdriver.support import expected_conditions as EC
from selenium.webdriver.chrome.options import Options
import random
from selenium.webdriver.common.action_chains import ActionChains
import os


def get_driver(chromedriver_path, chrome_path, ua):
    """Create the Chrome WebDriver used by the whole script.

    Args:
        chromedriver_path: Path to the chromedriver executable.
        chrome_path: Path to the Chrome browser binary.
        ua: User-Agent string the browser should send.

    Returns:
        A started ``webdriver.Chrome`` instance.
    """
    option = Options()
    option.binary_location = chrome_path
    option.add_argument("user-agent=" + ua)
    option.add_argument("--no-sandbox")
    option.add_argument("--disable-dev-shm-usage")
    option.add_argument("--disable-gpu")
    option.add_argument("--disable-features=NetworkService")
    option.add_argument("--disable-features=VizDisplayCompositor")
    # option.add_argument('headless')
    option.add_argument('log-level=3')  # silence browser logging
    option.add_argument('--ignore-certificate-errors-spki-list')  # hide SSL errors
    # The original passed the mangled flag '-ignore -ssl-errors'.
    option.add_argument('--ignore-ssl-errors')  # hide SSL errors
    option.add_experimental_option("excludeSwitches", ["enable-automation"])
    option.add_experimental_option('useAutomationExtension', False)
    # NOTE(review): this preference was stored in a variable called
    # No_Image_loading, yet 1 is presumably the "allow images" setting
    # (2 would block them) - confirm the intent before changing the value.
    image_prefs = {"profile.managed_default_content_settings.images": 1}
    option.add_experimental_option("prefs", image_prefs)
    # Hide the usual webdriver fingerprints.
    option.add_argument("--disable-blink-features")
    option.add_argument("--disable-blink-features=AutomationControlled")
    # Only ``options`` is passed; the original also passed the same object as
    # the deprecated duplicate ``chrome_options``.
    # NOTE(review): ``executable_path`` is the Selenium 3 style call; newer
    # Selenium releases expect a Service object instead - confirm the pinned
    # Selenium version.
    return webdriver.Chrome(options=option, executable_path=chromedriver_path)


def _read_lines(filepath):
    """Return the stripped, non-empty lines of a UTF-8 text file."""
    # utf-8-sig also accepts plain UTF-8 and drops a leading BOM, which would
    # otherwise end up inside the first cookie name / forum URL.
    with open(filepath, 'r', encoding='utf-8-sig') as handle:
        stripped = (line.strip() for line in handle)
        return [line for line in stripped if line]


def get_files(filepath):
    """Return the path of every entry inside the directory *filepath*."""
    # os.path.join works with or without a trailing separator on filepath.
    return [os.path.join(filepath, name) for name in os.listdir(filepath)]


def get_cookie(filepath):
    """Load all account cookies: one cookie string per non-empty line."""
    return _read_lines(filepath)


def to_dict(cookie_str):
    """Convert a ``name=value; name2=value2`` cookie string into a dict.

    Only the first ``=`` of each fragment separates name from value, so values
    that themselves contain ``=`` are kept intact. Empty fragments (for
    example after a trailing ``;``) and fragments without ``=`` are skipped.
    """
    cookie = {}
    for fragment in cookie_str.split(';'):
        name, sep, value = fragment.strip().partition('=')
        if not sep or not name:
            continue
        cookie[name] = value
    return cookie


def get_tiebas(filepath):
    """Load all forum URLs: one URL per non-empty line."""
    return _read_lines(filepath)


def auto_login(cookie_dict):
    """Log in by injecting the account cookies into the global ``driver``.

    Args:
        cookie_dict: Mapping of cookie name to cookie value.

    Returns:
        ``(num, user_name)``. ``num`` is 1 when the user bar contains an
        ``u_username`` entry and 0 otherwise; ``user_name`` is the displayed
        user name, or 0 when it could not be read.
    """
    num = user_name = 0
    teiba_index = 'https://tieba.baidu.com/'
    # The site has to be open before cookies can be set for it.
    driver.get(teiba_index)
    driver.delete_all_cookies()
    for k, v in cookie_dict.items():
        driver.add_cookie({'name': k, 'value': v})
    try:
        driver.get(teiba_index)  # reload, this time with the cookies
        # Wait until the user bar has been rendered.
        WebDriverWait(driver, 30).until(
            EC.visibility_of_element_located((By.ID, "com_userbar"))
        )
        li_list = driver.find_elements(By.CSS_SELECTOR, '#com_userbar > ul >li')
        li_classnames = [li.get_attribute('class') for li in li_list]
        if 'u_username' in li_classnames:
            num = 1
            user = WebDriverWait(driver, 30).until(
                EC.visibility_of_element_located(
                    (By.CSS_SELECTOR, "#j_u_username > div.u_menu_item.u_menu_username > a > span"))
            )
            user_name = user.text
    except Exception as e:
        print('登陆过程异常',e)
    # Returning after the try (not from a ``finally``) keeps Ctrl-C and other
    # non-Exception errors from being silently discarded.
    return num, user_name


def _pick_some(elements):
    """Return three random elements, or all of them when fewer than three."""
    return random.sample(elements, 3) if len(elements) > 2 else elements


def _hover_each(elements, low, high):
    """Move the mouse over each element, pausing low..high seconds after each."""
    for element in elements:
        ActionChains(driver).move_to_element(element).perform()
        time.sleep(random.randint(low, high))


def fa_tie(title, content, url):
    """Publish one thread to the forum at *url*.

    Relies on the module globals ``driver`` (the WebDriver) and ``js`` (the
    scroll script), both set up in the ``__main__`` section.

    Args:
        title: Thread title.
        content: Thread body; typed into the editor character by character.
        url: Forum URL to open.

    Returns:
        1 when the submit button was clicked without an exception, else 0.
        A captcha can still prevent the post from actually being published.
    """
    num = 0
    try:
        driver.get(url)
        # Wait for the follow button.
        guanzhu = WebDriverWait(driver, 30).until(
            EC.visibility_of_element_located((By.ID, "j_head_focus_btn"))
        )
        # Wait for the sign-in button.
        qiandao = WebDriverWait(driver, 20).until(
            EC.visibility_of_element_located((By.XPATH, '//*[@id="signstar_wrapper"]/a'))
        )
        # Wait for the title input.
        input_title = WebDriverWait(driver, 20).until(
            EC.visibility_of_element_located((By.XPATH, '//*[@id="tb_rich_poster"]/div[3]/div[1]/div[2]/input'))
        )
        # Wait for the content editor.
        input_content = WebDriverWait(driver, 30).until(
            EC.visibility_of_element_located((By.ID, "ueditor_replace"))
        )
        # Hover over the follow and sign-in buttons.
        ActionChains(driver).move_to_element(guanzhu).perform()
        ActionChains(driver).move_to_element(qiandao).perform()

        posts_author = driver.find_elements(By.CLASS_NAME, 'frs-author-name-wrap')
        posts = driver.find_elements(By.CLASS_NAME, 'j_th_tit')
        if len(posts_author) > 0 and len(posts) > 0:
            # Hover over a few random authors, then a few random threads.
            _hover_each(_pick_some(posts_author), 1, 3)
            _hover_each(_pick_some(posts), 1, 3)

        # Scroll down to the posting form.
        driver.execute_script(js)
        time.sleep(2)
        ActionChains(driver).move_to_element(input_title).click().perform()
        time.sleep(1)

        # Set the title through JavaScript. The title is handed over as a
        # script argument instead of being formatted into the source, so
        # quotes or backslashes in it cannot break the script.
        title_js = 'document.querySelector("#tb_rich_poster > div.poster_body.editor_wrapper > div.poster_component.title_container > div.j_title_wrap > input").value = arguments[0]'
        driver.execute_script(title_js, title)

        # Click into the content editor.
        js_content_position = "document.getElementById('ueditor_replace').click();"
        driver.execute_script(js_content_position)
        time.sleep(0.5)

        # Type the body one character at a time.
        for wd in content:
            time.sleep(0.04)
            input_content.send_keys(wd)
        time.sleep(random.random())

        # Submit through JavaScript so that a popup does not block the click.
        button_js = 'document.querySelector("#tb_rich_poster > div.poster_body.editor_wrapper > div.poster_component.editor_bottom_panel.clearfix > div > button.btn_default.btn_middle.j_submit.poster_submit").click()'
        driver.execute_script(button_js)
        num = 1
    except Exception as e:
        print(e,'发帖异常..')
    # See auto_login: no ``return`` inside ``finally``.
    return num


def main(tiebas, my_files, cookie_list, time1, time2, fail_log=None,
         posts_per_account=2):
    """Log in with every account and publish random posts to every forum.

    Args:
        tiebas: Forum URLs.
        my_files: Paths of the post files (file name = title, content = body).
        cookie_list: Cookie strings, one per account.
        time1: Minimum pause in seconds between posts / accounts.
        time2: Maximum pause in seconds between posts / accounts.
        fail_log: Optional writable text file; every failed post is appended
            as ``<forum url>\\t<post file>``. Nothing is written when None.
        posts_per_account: How many randomly chosen posts each account
            publishes to every forum.

    Raises:
        ValueError: If *my_files* is empty (there is nothing to post).
    """
    if not my_files:
        # Fail before logging in; otherwise random.choice would raise
        # IndexError only after the first account had already logged in.
        raise ValueError('my_files is empty: no post files to publish')

    for cookie in cookie_list:
        try:
            cookie_dict = to_dict(cookie)
            num_auto, user_name = auto_login(cookie_dict)
            if num_auto == 1:
                print(user_name,'自动登录成功')
            else:
                print('自动登录失败')
                continue
        except Exception as e:
            print(e, '未顺利登录')
        else:
            for _ in range(posts_per_account):
                my_file = random.choice(my_files)
                my_title = os.path.splitext(os.path.basename(my_file))[0]
                with open(my_file, 'r', encoding='utf-8') as handle:
                    my_content = handle.read()
                for tieba in tiebas:
                    num = fa_tie(my_title, my_content, tieba)
                    if num == 1:
                        print(tieba,my_file,'--发布成功')
                    else:
                        print(tieba,my_file,'--发布失败')
                        if fail_log is not None:
                            fail_log.write('{0}\t{1}\n'.format(tieba, my_file))
                            fail_log.flush()
                    time.sleep(random.randint(time1, time2))
        finally:
            # Runs for every account, including failed logins: pause, then
            # clear the session so the next account starts clean.
            time.sleep(random.randint(time1, time2))
            driver.delete_all_cookies()


if __name__ == "__main__":
    # Script that scrolls the page down by its full height (used by fa_tie).
    js = 'window.scrollBy(0,{0})'.format('document.body.scrollHeight')
    chromedriver_path = 'D:/python3/install/chromedriver.exe'
    chrome_path = 'C:/Program Files (x86)/Google/Chrome/Application/chrome.exe'
    ua = 'Mozilla/5.0 (Windows NT 6.1; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/84.0.4147.125 Safari/537.36'

    # Read the inputs first so a missing file fails before Chrome is started.
    cookie_path = './cookie_zh.txt'
    cookie_list = get_cookie(cookie_path)
    my_files = get_files('./test/')
    tiebas = get_tiebas('./tiebas.txt')
    # Minimum and maximum pause in seconds.
    sleep_min, sleep_max = 60, 70

    # Global WebDriver used by auto_login, fa_tie and main.
    driver = get_driver(chromedriver_path, chrome_path, ua)
    try:
        # Failed posts are appended to this file.
        with open('tieba_fabu_fail.txt', 'a', encoding='utf-8') as f:
            main(tiebas, my_files, cookie_list, sleep_min, sleep_max, fail_log=f)
    finally:
        # Always close the browser, even when main() raises.
        driver.quit()
很赞哦!
python编程网提示:转载请注明来源www.python66.com。
有宝贵意见可添加站长微信(底部),获取技术资料请到公众号(底部)。同行交流请加群
相关文章
文章评论
-
selenium贴吧批量发帖(多账号多吧)文章写得不错,值得赞赏
站点信息
- 网站程序:Laravel
- 客服微信:a772483200