From 94ca383b82a6dc22f686ee36d376b66b8202e88d Mon Sep 17 00:00:00 2001 From: "tv0924@icloud.com" Date: Mon, 9 Jun 2025 10:33:08 +0900 Subject: [PATCH] =?UTF-8?q?[Fix]=20=EC=97=90=EB=9F=AC=20=EB=B0=9C=EC=83=9D?= =?UTF-8?q?=20=EC=8B=9C,=20=EC=9E=AC=EC=8B=9C=EB=8F=84=20=ED=9B=84=20retur?= =?UTF-8?q?n=20=EB=90=98=EC=A7=80=20=EC=95=8A=EB=8A=94=20=EB=AC=B8?= =?UTF-8?q?=EC=A0=9C=20=ED=95=B4=EA=B2=B0?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- lib/prompt.py | 4 ++-- main.py | 9 +++++---- 2 files changed, 7 insertions(+), 6 deletions(-) diff --git a/lib/prompt.py b/lib/prompt.py index 26ab2b4..9bb58e7 100644 --- a/lib/prompt.py +++ b/lib/prompt.py @@ -2,7 +2,7 @@ extend_planner_system_message = """ 🎯 Mission: Collect Initial SSO Redirect URLs (For Browser Automation) -※ **절대로 구글 검색, Bing 검색 등 어떤 외부 검색 기능도 사용하지 말고, 주어진 로그인 페이지 URL을 직접 방문하여 탐색하세요.** +※ **모든 STEP에서 구글 검색, Bing 검색 등 어떤 외부 검색 기능도 절대 사용하지 않고, 초기에 주어진 URL에서 탐색하세요.** 0. **초기 블록(Block) 체크** - 브라우저가 로그인 페이지에 접근하려 할 때, **페이지가 차단(blocked)** 되거나 **방화벽, CAPTCHA, 접근 제한** 등으로 인해 정상적으로 로드되지 않으면 즉시 프로세스를 종료하고 아래 JSON만 반환해야 합니다. @@ -17,7 +17,7 @@ extend_planner_system_message = """ - 이후 단계로 절대 넘어가지 않도록 합니다. 1. **로그인 페이지 탐색** - - **클라이언트(비엔터프라이즈) 로그인 페이지**로 직접 이동합니다. (검색 엔진을 사용하여 찾아서는 안 됩니다.) + - **클라이언트(비엔터프라이즈) 로그인 페이지**로 직접 이동합니다. **검색 엔진을 사용하여 찾아서는 안 됩니다.** - 접근 후 **개인정보/쿠키/동의 팝업**이 뜨면, 이를 반드시 **닫거나(Dismiss)** 처리하고 계속 진행합니다. 
- (이미 0단계에서 블록 여부를 확인했으므로, 이 단계에서는 페이지가 정상 로드되었다고 가정합니다.) diff --git a/main.py b/main.py index 92c0c00..bb22a49 100644 --- a/main.py +++ b/main.py @@ -151,17 +151,18 @@ async def scan_one_url(url: str, skip_html_check: bool = False): break except Exception as e: - if try_cnt >= 3: + await clean_resources(agent, context, browser) + + if try_cnt >= 1: print(f"❌ {url} 스캔에 실패했습니다. 에러: {e}") logger(f"❌ {url} 스캔에 실패했습니다. 에러: {e}") - break + return try_cnt += 1 print(f"⚠️ 에러 발생: {e}. {try_cnt}번째 재시도 중...") - await clean_resources(agent, context, browser) # 1분 대기 - await asyncio.sleep(60) + await asyncio.sleep(5) # 반복문을 통해 재시도 continue