"""Seed a Redis list with JD search-page request tasks.

Each task is a JSON document with ``url``, ``body``, ``method`` and ``meta``
fields, pushed with LPUSH onto the list named by ``DEFAULT_QUEUE_KEY``.
NOTE(review): the consumer of this list is not visible in this file --
confirm it accepts percent-encoded URLs before deploying.
"""
import json
import time
from urllib.parse import urlencode

import redis

SEARCH_URL = "https://search.jd.com/Search"
DEFAULT_KEYWORDS = ("鼠标", "键盘", "显卡", "耳机")
DEFAULT_MAX_PAGE = 10
DEFAULT_QUEUE_KEY = "jd_search:start_urls"

# Shared client used by search_producer(); targets the local Redis, db 5.
redis_con = redis.Redis(host='localhost', port=6379, db=5)


def search_producer(keywords=DEFAULT_KEYWORDS, max_page=DEFAULT_MAX_PAGE,
                    queue_key=DEFAULT_QUEUE_KEY):
    """Push one search task per (keyword, page) pair onto a Redis list.

    Called with no arguments this enqueues pages 1..10 for each of the four
    default keywords, i.e. 40 tasks, onto ``jd_search:start_urls``.

    Args:
        keywords: Iterable of search keywords. Pass a list/tuple, not a bare
            string (a string would be iterated character by character).
        max_page: Highest page number to enqueue; pages start at 1. A value
            below 1 enqueues nothing.
        queue_key: Name of the Redis list that receives the tasks.

    Returns:
        None.
    """
    # Compute the date once so every task of a run carries the same stamp,
    # even if the run happens to cross midnight.
    sta_date = time.strftime("%Y-%m-%d")

    tasks = []
    for keyword in keywords:
        for page_num in range(1, max_page + 1):
            # urlencode percent-encodes the (non-ASCII) keyword and escapes
            # characters such as '&' that would otherwise break the query.
            query = urlencode({"keyword": keyword, "page": page_num})
            tasks.append(json.dumps({
                "url": f"{SEARCH_URL}?{query}",
                "body": '',
                "method": "GET",
                "meta": {
                    "sta_date": sta_date,
                    "keyword": keyword,
                    "page_num": page_num,
                },
            }))

    # LPUSH with no values is an error, so skip the call for an empty batch.
    # A single variadic LPUSH inserts the values left to right at the head,
    # giving the same final list order as one LPUSH per task.
    if tasks:
        redis_con.lpush(queue_key, *tasks)


if __name__ == "__main__":
    search_producer()