#--*--*--*--*--*--*--*--*--*--*--*--*--*--*--*--*--*--*--*
#-- FILE:
#--   getYMail2.txt
#-- DESCRIPTION:
#--   This script logs onto a particular Yahoo! Mail
#--   account and extracts the summarised list of mail
#--   (called the 'inbox')
#--
#--   A description of the process of the script is as
#--   follows:
#--    1) Get the Yahoo! Mail Login Form from http://mail.yahoo.com
#--    2) Put the user account information into the form
#--       (user-name & password)
#--    3) Reformat the 'input' fields in the form so that
#--       they can be used by the curl -d switch
#--       (i.e. strip html tags, url encode fields, remove
#--        newline characters etc)
#--    4) Post (submit) this information to the Form's target
#--       and save any cookies and headers which the server
#--       sends. Also follow any redirects which the server
#--       specifies.
#--    5) Get the final Yahoo! Mail home-page location by looking at
#--       the final redirection instruction sent by the server
#--    6) Get the Yahoo! Mail home-page hostname. 
#--    7) Get the url of the Yahoo! Mail 'Inbox' from the mail
#--       home-page html.
#--    8) Go to the Yahoo! Mail Inbox. FINISHED 
#--
#--
#-- NOTES:
#--
#--   The script needs to overcome several devices used
#--   by yahoo.
#--     a) The use of cookies
#--     b) The use of automatic redirects of the web-client
#--        (using the LOCATION http header field)
#--     c) The use of ssl to encrypt the logon process
#--     d) The use of hidden fields with random numbers within
#--        the Yahoo! Mail Log-in Form to discourage automatic logins
#--
#--   These things can all be overcome because of the
#--   capabilities of the 'curl' non-interactive web client.
#--
#--   This script has only been used within the 'cygwin'
#--   unix emulating bash shell running on WinMe.
#--
#-- NOTE TO YAHOO ENGINEERS:
#--   This script was not written out of malicious-ness
#--   towards yahoo but because I am not able to get
#--   a credit card since I dont have a job currently
#--   and therefor I am not able to pay for a 'premium'
#--   package which includes pop forwarding of mail.
#--   
#-- DATE:
#--   may 02
#-- AUTHOR: mj bishop (matth3wbishop@yahoo.com)
#--
#--*--*--*--*--*--*--*--*--*--*--*--*--*--*--*--*--*--*--*

sTargetUrl=""              #-- The initial target of the login form                                                           
sYahooMailHomeUrl=""       #-- The final url of the Yahoo! Mail home page
sYahooMailHostName=""      #-- Just the host-name of the above.


#-- Extract the form fields from the html
#--

echo '<html><body>' > mailForm.html

#-- A user progress message
#--
echo "
  --------------------------------------------------
  Extracting the HTML login form from the Yahoo! Mail
  site [http://mail.yahoo.com]

  a) Putting account (user-name & password) into the login form
  b) Retrieving the target url of the login form
  c)
  --------------------------------------------------
     "

curl mail.yahoo.com | sed -n '/<form /,/<\/form>/p' \
  | grep -P '(<form|<input|<\/form>)' > t001.txt

#--
#-- Place the particular account details (user-name & password)
#-- within the Yahoo! Mail login form
#--

sed '/name="login"/s/value=""/value="matth3wbishop"/g' t001.txt > t000.txt
sed '/name="passwd"/s/type="password"/& value="bacibaci"/g' t000.txt >> mailForm.html
echo '</body></html>' >> mailForm.html

sTargetUrl=$(sed -n '/<form /s/.*action="\([^"]*\)".*/\1/p' mailForm.html)
echo "sTargetUrl = $sTargetUrl"

#--
#-- Reformat the HTML form fields into a format which
#-- is usable by the curl -d switch. i.e Name=Value
#-- Ensure that each field is 'url encoded'.
#--
cat mailForm.html | grep '<input' \
  | sed 's/.*name="\([.a-zA-Z0-9 ]*\)".*value="\([.a-zA-Z0-9 ]*\)".*/\1=\2/g' \
  | sed 's/.*name="\([.a-zA-Z0-9 ]*\)".*value=\([0-9]*\).*/\1=\2/g' \
  | expand | sed -e 's/ *$//g' -e 's/^ *//g' | sed 's/ /+/g' \
  | sed 's/$/\&/g' | tr -d '\012' > formData.txt


#--
#--
echo "
  --------------------------------------------------
  Submitting (post method) the Yahoo! Mail Login form
    -- Saving cookies and other header into 'headers.txt'
    -- Automatically following any redirects
  --------------------------------------------------
     "
curl -D headers.txt -d @formData.txt -L $sTargetUrl > ymail.html

sYahooMailHomeUrl=$(sed -n '/Location:/s/Location: *//p' headers.txt)
echo "sYahooMailHomeUrl = $sYahooMailHomeUrl"

sYahooMailHostName=$(echo $sYahooMailHomeUrl | sed 's/\.com\/.*/\.com/g')
echo "sYahooMailHostName = $sYahooMailHostName"

sInboxUrl=$( grep -i 'check mail' ymail.html | sed 's/.*href="\([^"]*\)".*/\1/g')
echo "sInboxUrl = $sInboxUrl"


#--
#-- Go to the Yahoo! Mail Inbox
#--
echo "
  --------------------------------------------------
  Following the link to the Yahoo! Mail inbox
  using previously set cookies
  --------------------------------------------------
     "
  
curl -b headers.txt ${sYahooMailHostName}${sInboxUrl} > ymail.html

# links -dump ymail.html | tr -s ' ' | less

#-- It is not working to manually redirect as the lines below
#-- attempt to do. Maybe have to redirect twice.
# sYahooMailHomeUrl=$(sed -n '/Location:/s/Location: *//gp' headers.txt)
# echo "sYahooMailHomeUrl = $sYahooMailHomeUrl"
# curl -i -b headers.txt -d @formData.txt $sYahooMailHomeUrl | less

# ---------------------------------------------
#  511  (echo '<html><body>'; curl mail.yahoo.com | sed -n '/<form /,/<\/form>/p' | grep -P '(<form|<input|<\/form>)' | sed -e '/name="login"/s/value=""/value="matth3wbishop"/g' -e '/name="passwd"/s/type="password"/& value="bacibaci"/g'; echo '</body></html>') > mailForm.html
#  543  cat mailForm.html | grep '<input' | sed 's/.*name="\([.a-zA-Z0-9 ]*\)".*value="\([.a-zA-Z0-9 ]*\)".*/\1=\2/g' | sed 's/.*name="\([.a-zA-Z0-9 ]*\)".*value=\([0-9]*\).*/\1=\2/g'
#  556  cat mailForm.html | grep '<input' | sed 's/.*name="\([.a-zA-Z0-9 ]*\)".*value="\([.a-zA-Z0-9 ]*\)".*/\1=\2/g' | sed 's/.*name="\([.a-zA-Z0-9 ]*\)".*value=\([0-9]*\).*/\1=\2/g' | expand | sed -e 's/ *$//g' -e 's/^ *//g' | sed 's/ /+/g' | sed 's/$/\&/g' | tr -d '\012'
#  557  history 2 >> getYMail.txt
#  580  curl -D - -d @qsy.txt -L https://login.yahoo.com/config/login?90ep5ie0i4i3q | less
#  581  history 2 >> getYMail.txt