保存的状态一段时间后会失效，需要定期重新获取
This commit is contained in:
@@ -44,6 +44,18 @@ def index_data_scraper(index_code: str, data_file_path: str):
|
||||
time.sleep(10)
|
||||
|
||||
|
||||
def get_state(browser_state_file_path: str = "./em_browser_state.json") -> None:
    """Open the Eastmoney index list in a visible browser and save its storage state.

    A headed Chromium window is launched, the index grid page is loaded and
    the script then pauses (Playwright Inspector) so the operator can interact
    with the page by hand. Once execution is resumed, the browser context's
    storage state is written to ``browser_state_file_path``.

    Args:
        browser_state_file_path: Destination JSON file for the storage state.
            Defaults to the path the original implementation hard-coded.
    """
    url = "https://quote.eastmoney.com/center/gridlist.html#index_sh"

    with sync_playwright() as p:
        browser = p.chromium.launch(args=["--start-maximized"], headless=False)
        try:
            # Hold an explicit context instead of reaching for
            # ``browser.contexts[0]``: the context implicitly created by
            # ``browser.new_page()`` is closed together with its page, which
            # would make the later lookup fail if the page is closed by hand.
            context = browser.new_context()
            page = context.new_page()
            page.goto(url)
            # Blocks until the operator resumes from the Inspector.
            # NOTE(review): presumably used to complete a manual
            # login/verification step before the state is captured -- confirm.
            page.pause()
            context.storage_state(path=browser_state_file_path)
        finally:
            # Always release the browser, even if navigation or saving fails.
            browser.close()
|
||||
|
||||
|
||||
|
||||
def parse_data(data_file_path: str):
|
||||
df_list = []
|
||||
with open(data_file_path, "r", encoding="utf-8") as f:
|
||||
@@ -102,7 +114,8 @@ def get_index_latest_data():
|
||||
|
||||
|
||||
# Script entry point: runs only when the module is executed directly.
if __name__ == "__main__":
|
||||
# Fetch the latest index data, keep the rows whose "代码" column equals
# `code`, and print them.
df = get_index_latest_data()
|
||||
code = "000001"
|
||||
df = df[df["代码"] == code]
|
||||
print(df)
|
||||
# NOTE(review): the same four statements appear again below, commented out.
# This looks like the before/after sides of a diff hunk rendered without
# +/- markers -- confirm which version is actually live in the file.
# df = get_index_latest_data()
|
||||
# code = "000001"
|
||||
# df = df[df["代码"] == code]
|
||||
# print(df)
|
||||
# Launch the interactive browser session that saves the storage state to disk.
get_state()
|
||||
|
||||
Reference in New Issue
Block a user