# scrapy-taobao
使用 Scrapy 模拟淘宝登录,尚未加入代理 IP 的处理。如果你有好的代理处理方法,欢迎分享出来。
# 确保安装了scrapy。
self.http_user = 'xxxxxxxx' # taobao username
self.http_pass = 'xxxxxxxx' # taobao password
记得修改 taobao_spider.py 中的用户名 username 和密码 password。
# 运行命令
scrapy crawl taobao
如果用户登录时需要输入验证码,则会自动打开验证码的图片链接让用户手动输入;输入错误会重新打开验证码的图片链接供用户再次输入。
# 登录成功的提示
login-success, get user nick: ["user nick"]
用户看到这句输出即代表登录成功,可以继续进行其他数据的提取。
Raw data
{
"_id": null,
"home_page": "https://github.com/yanjlee/scrapy-taobao",
"name": "scrapy-taobao",
"maintainer": null,
"docs_url": null,
"requires_python": null,
"maintainer_email": null,
"keywords": null,
"author": "yanjlee",
"author_email": "yanjlee@163.com",
"download_url": "https://files.pythonhosted.org/packages/5b/5c/93efef48e76b908119b138b339dcdc852ca75c61d046f1f1f4cf26881734/scrapy_taobao-1.1.5.tar.gz",
"platform": null,
"description": "# scrapy-taobao\r\nscrapy\u6a21\u62df\u6dd8\u5b9d\u767b\u9646\uff0c\u672a\u52a0\u4ee3\u7406ip\u7684\u5904\u7406\u3002\u5e0c\u671b\u6709\u597d\u7684\u4ee3\u7406\u5904\u7406\u65b9\u6cd5\u5206\u4eab\u51fa\u6765\u3002\r\n\r\n# \u786e\u4fdd\u5b89\u88c5\u4e86scrapy\u3002\r\n self.http_user = 'xxxxxxxx' # taobao username\r\n self.http_pass = 'xxxxxxxx' # taobao password\r\n\u8bb0\u5f97\u4fee\u6539taobao_spider.py\u4e2d\u7684\u7528\u6237\u540dusername\u548c\u5bc6\u7801password\u3002\\<br>\r\n\r\n# \u8fd0\u884c\u547d\u4ee4\r\n scrapy crawl taobao\r\n \u5982\u679c\u7528\u6237\u767b\u9646\u9700\u8981\u8f93\u5165\u9a8c\u8bc1\u7801\uff0c\u5219\u4f1a\u81ea\u52a8\u6253\u5f00\u9a8c\u8bc1\u7801\u7684\u56fe\u7247\u94fe\u63a5\u8ba9\u5ba2\u6237\u624b\u52a8\u8f93\u5165\uff0c\u8f93\u5165\u9519\u8bef\u4f1a\u91cd\u65b0\u6253\u5f00\u9a8c\u8bc1\u7801\u7684\u56fe\u7247\u94fe\u63a5\u4f9b\u7528\u6237\u518d\u6b21\u8f93\u5165\u3002\r\n\r\n# \u767b\u9646\u6210\u529f\u7684\u63d0\u793a\r\n login-success, get user nick: [\"user nick\"]\r\n\u7528\u6237\u770b\u5230\u8fd9\u53e5\u4ee3\u8868\u767b\u9646\u6210\u529f\uff0c\u53ef\u4ee5\u8fdb\u884c\u4e00\u4e9b\u5176\u4ed6\u6570\u636e\u7684\u63d0\u53d6\u3002\r\n \r\n",
"bugtrack_url": null,
"license": null,
"summary": "scrapy\u6a21\u62df\u6dd8\u5b9d\u767b\u9646\uff0c\u672a\u52a0\u4ee3\u7406ip\u7684\u5904\u7406\u3002\u5e0c\u671b\u6709\u597d\u7684\u4ee3\u7406\u5904\u7406\u65b9\u6cd5\u5206\u4eab\u51fa\u6765\u3002.",
"version": "1.1.5",
"project_urls": {
"Homepage": "https://github.com/yanjlee/scrapy-taobao"
},
"split_keywords": [],
"urls": [
{
"comment_text": "",
"digests": {
"blake2b_256": "19f6266e4732b2f3abba733aa58ae54fcd1c9dd26a16fc2ce7984103700e6dac",
"md5": "c9a0e42332b9a60b0d51915f94a8a38e",
"sha256": "6d9c5d1c6199ee8971168c063a9abf6c5d401ad0fce0deeaa00965d3b496080c"
},
"downloads": -1,
"filename": "scrapy_taobao-1.1.5-py3-none-any.whl",
"has_sig": false,
"md5_digest": "c9a0e42332b9a60b0d51915f94a8a38e",
"packagetype": "bdist_wheel",
"python_version": "py3",
"requires_python": null,
"size": 7415,
"upload_time": "2024-06-01T08:22:49",
"upload_time_iso_8601": "2024-06-01T08:22:49.485855Z",
"url": "https://files.pythonhosted.org/packages/19/f6/266e4732b2f3abba733aa58ae54fcd1c9dd26a16fc2ce7984103700e6dac/scrapy_taobao-1.1.5-py3-none-any.whl",
"yanked": false,
"yanked_reason": null
},
{
"comment_text": "",
"digests": {
"blake2b_256": "5b5c93efef48e76b908119b138b339dcdc852ca75c61d046f1f1f4cf26881734",
"md5": "d05c0408d0e1c5f9e0f17d1fa44109f6",
"sha256": "39fdcebb580c4f89999eb2ced9f09ebb31b8e0cd8d2b37374d3c3ce088420ae0"
},
"downloads": -1,
"filename": "scrapy_taobao-1.1.5.tar.gz",
"has_sig": false,
"md5_digest": "d05c0408d0e1c5f9e0f17d1fa44109f6",
"packagetype": "sdist",
"python_version": "source",
"requires_python": null,
"size": 6563,
"upload_time": "2024-06-01T08:22:51",
"upload_time_iso_8601": "2024-06-01T08:22:51.398156Z",
"url": "https://files.pythonhosted.org/packages/5b/5c/93efef48e76b908119b138b339dcdc852ca75c61d046f1f1f4cf26881734/scrapy_taobao-1.1.5.tar.gz",
"yanked": false,
"yanked_reason": null
}
],
"upload_time": "2024-06-01 08:22:51",
"github": true,
"gitlab": false,
"bitbucket": false,
"codeberg": false,
"github_user": "yanjlee",
"github_project": "scrapy-taobao",
"travis_ci": false,
"coveralls": false,
"github_actions": false,
"lcname": "scrapy-taobao"
}