
The existing cafe info scraper does not work because of Naver's laziness: only the first 100 pages are relevant, and the rest are just repeats. This is a rework of that scraper.
@3ac64686feb4e872ab6bfc69beaaf1b8eafaea87
--- cafe_scarapping_executor.py
+++ cafe_scrapping_executor.py
... | ... | @@ -1,7 +1,7 @@ |
1 |
-from naver_blog_url_gatherer import blog_url_scrapper |
|
1 |
+from DEPRECIATED_naver_cafe_info_gatherer import naver_cafe_scrapper |
|
2 | 2 |
|
3 | 3 |
if __name__ == "__main__": |
4 |
- # blog_url_scrapper("선산읍", "2022-01-01", "2023-10-31") |
|
4 |
+ naver_cafe_scrapper("선산읍", 100, 101) |
|
5 | 5 |
# blog_url_scrapper("고아읍", "2022-01-01", "2023-10-31") |
6 | 6 |
# blog_url_scrapper("산동읍", "2022-01-01", "2023-10-31") |
7 | 7 |
# blog_url_scrapper("무을면", "2022-01-01", "2023-10-31") |
... | ... | @@ -25,4 +25,4 @@ |
25 | 25 |
# blog_url_scrapper("인동동", "2022-01-01", "2023-10-31") |
26 | 26 |
# blog_url_scrapper("진미동", "2022-01-01", "2023-10-31") |
27 | 27 |
# blog_url_scrapper("양포동", "2022-01-01", "2023-10-31") |
28 |
- blog_url_scrapper("구미", "2022-01-01", "2023-10-31")(파일 끝에 줄바꿈 문자 없음) |
|
28 |
+ # blog_url_scrapper("구미", "2022-01-01", "2023-10-31")(파일 끝에 줄바꿈 문자 없음) |
Add a comment
Delete comment
Once you delete this comment, you won't be able to recover it. Are you sure you want to delete this comment?