Hi Sheri,

> I tried to get that page with wget, but despite trying all the wget
> options to send cookie and login info, I never managed to sign in
> via wget. Therefore I never got anything better than the page you
> see when trying to load the page as Guest. This was my first
> attempt to use wget, maybe Detlef can do better.

Sorry for answering so late - but because I am definitely not a
wget expert, it took me a while to get the hang of how to download
web pages which require a logon.
In the end, the solution I found (there may be others) wasn't so
difficult. You have to log on to such a page with a browser (I used IE
in that case) and then export the browser cookie files containing
the login values to a text file.

This text file is usually called "cookies.txt" and can be activated in
wget with the --load-cookies option. I completed the template script
with those wget options, including a regex to extract the requested
values. (As I am also not a regex expert, I guess there are better
regular expressions for doing that.)

Best regards Detlef

---------------------------------------------------------------

;---------------------------------------------------------------
; Purpose: download a login-protected web page with wget, using
; cookies exported from a browser, then extract values from the
; saved HTML with the regex plugin and print them via win.debug.
;
; Steps: 1) build file paths  2) delete old temporary files
;        3) run wget          4) stop on a non-zero exit code
;        5) read saved page   6) run the regex  7) show results
;
; NOTE(review): "scriptfolder" is not defined in this script;
; presumably it is PowerPro's built-in for the folder of the
; running script - confirm. cookies.txt must already exist there.
; NOTE(review): the URL assignment below is split over two lines
; (likely e-mail line wrapping) - confirm it parses as one
; statement before running.
;---------------------------------------------------------------
local l_wget_path = "C:/program files/wget/wget.exe"
local l_cookies   = scriptfolder ++ ?"\cookies.txt"
local l_wget_log  = scriptfolder ++ ?"\wget.log"
local l_webp_file = scriptfolder ++ ?"\webp_file.htm"
local l_webp_url  = 
"http://www.classiccinemazone.com/index.php?page=users&order=lastconnect&by=DESC&\pages=1";

;delete temporary files
; (the output page and the wget log left over from a previous run)
file.deletenorecycle(l_webp_file)
file.deletenorecycle(l_wget_log)

;download webpage
; The wget command line is built up piece by piece:
;   -d              debug output
;   -t 2            number of tries
;   -a <file>       append log messages to <file>
;   -O <file>       write the downloaded document to <file>
;   --load-cookies  read cookies from <file> before the request
; NOTE(review): the paths and the URL are appended unquoted; if
; scriptfolder contains spaces wget may see split arguments -
; verify.
local l_wget_params = "-d -t 2"
local l_wget_params = l_wget_params ++ " -a " ++ l_wget_log
local l_wget_params = l_wget_params ++ " -O " ++ l_webp_file
local l_wget_params = l_wget_params ++ " --load-cookies " ++ l_cookies
local l_wget_params = l_wget_params ++ " " ++ l_webp_url
local l_exitcode    = ""

; Run wget and keep its result in l_exitcode.
; NOTE(review): presumably 99999999 is the maximum wait time and
; "hide" the window state - confirm against the file plugin docs.
l_exitcode = file.runwait(99999999,l_wget_path,l_wget_params,"","hide")   

win.debugshow("WGET-Exitcode",l_exitcode,l_wget_path,l_wget_params)

; Stop the script when the exit code is non-zero.
; NOTE(review): assumes a non-zero exit code evaluates as true
; here - TODO confirm.
if(l_exitcode)do
   quit
endif

;read web-page-content from file
local l_webp_cont    = file.readall(l_webp_file)

;extract information with regex-plugin
; l_format references the five capture groups ($1..$5) of the
; pattern; each match is followed by the "\\n" escape in the
; format (presumably one output line per match - confirm).
; l_MaxMatch and l_StrtOffs are passed as empty strings.
; l_word is assigned here but never used in this script.
; NOTE(review): the pattern literal (?~ ... ~) spans three lines,
; and the call to regex.pcreMatchall is split from its assignment;
; both look like e-mail line wrapping - confirm the line breaks
; are intended before running.
; NOTE(review): regex_count and regex_status are initialised here
; and never assigned again in this script; unless the plugin sets
; them, the debug output below shows only these initial values.
local l_format      = "$1 $2 $3 $4 $5 \\n"
local l_soptions    = "m"
local l_StrtOffs    = ""
local l_MaxMatch    = ""
local l_word        = ""
local l_regexpat    = ?~(?s)id=\d+?(?:"><span 
style='color:#000000'|")?>(\w+)(?:</span>)?</a></td>+.*?;">([\w+\.]+)+.*?;">([\w+\.\d/
 :]+).*?alt='(\w+)'.*?;">(.*?)</td>~
local regex_count   = 0
local regex_status  = ""
local l_result      = 
regex.pcreMatchall(l_regexpat,l_webp_cont,l_format,l_soptions,l_MaxMatch,"",l_StrtOffs)

;display information with win.debug
win.debugshow("regex_count="++regex_count)
win.debugshow("regex_status"++regex_status)

; Print each line of the formatted match result.
for each line l_line in l_result
    win.debug(l_line)
endfor


Reply via email to