######################################################################
# WWW::Myspace.pm
# Sccsid: %Z% %M% %I% Delta: %G%
# $Id: Myspace.pm 496 2007-10-11 08:17:05Z grantg $
######################################################################
# Copyright (c) 2005 Grant Grueninger, Commercial Systems Corp.
#
# Description:
# Module to log into myspace.com

######################################################################
# Setup

# Declare our package.
package WWW::Myspace;
use WWW::Myspace::MyBase -Base;
use Data::Dumper;
use warnings;
use strict;

# *** If you're not familiar with Spiffy, read its docs. To save you
# confusion, one of its features is to add "my $self = shift;" to
# each method definition, so when you see that missing, that's why. ***

# Debugging? (Yes=1, No=0)
our $DEBUG = 0;

######################################################################
# Libraries we use

use Carp;
use Contextual::Return;
#use Locale::SubCountry; # moved to cool_new_people to stop warnings
use WWW::Mechanize;
use File::Spec::Functions;
#use Time::Local;
use Time::ParseDate;

=head1 NAME

WWW::Myspace - Access MySpace.com profile information from Perl

=head1 VERSION

Version 0.72

=cut

our $VERSION = '0.72';

=head1 WARNING

March 2007: Using WWW::Myspace for commenting, messaging, or adding
friends will probably get your Myspace account deleted or disabled.

=head1 SYNOPSIS

WWW::Myspace.pm provides methods to access your myspace.com
account and functions automatically. It provides a simple interface
for scripts to log in, access lists of friends, scan users' profiles,
retrieve profile data, send messages, and post comments.

    use WWW::Myspace;
    my $myspace = WWW::Myspace->new ($account, $password);
        OR
    my $myspace = new WWW::Myspace; # Prompts for email and password
    unless ( $myspace->logged_in ) { die "Login failed: " . $myspace->error }

    my ( @friends ) = $myspace->get_friends();

This module is designed to help you automate and
centralize redundant tasks so that you can better handle keeping in
personal touch with numerous friends or fans, or coordinate fan
communications among multiple band members. This module operates well
within MySpace's security measures. If you're looking for a spambot,
this ain't it.

WWW::Myspace works by interacting with the site through a UserAgent
object, using HTTP::Request::Form to process forms. Since by nature
web sites are dynamic, if you find that some interaction with the
site breaks, check for a new version of this module (or if you
go source diving, submit a patch). You can run "cpan -i WWW::Myspace"
as a cron job or before running your scripts, if appropriate, to
make sure you have the latest version.

=cut

# Since WWW::Myspace reads and reacts to a web site which by nature
# may change, we define much of the basics up here where it's
# easy to see and change.

# Base URL for the site.
our $BASE_URL = 'http://www.myspace.com/';

# Where should we store files? (cookies, cache dir). We use, and untaint,
# the user's home dir for the default. It stays empty when $ENV{HOME}
# is not defined.
our $HOME_DIR = "";
if ( defined $ENV{'HOME'} ) {
    $HOME_DIR = "$ENV{'HOME'}";

    # Only a conservative set of path characters is accepted; anything
    # else aborts loading of the module.
    croak "Invalid characters in $ENV{HOME}."
        unless $HOME_DIR =~ /^([\-A-Za-z0-9_ \/\.@\+\\:]*)$/;

    # Re-assigning from the capture is what untaints the value.
    $HOME_DIR = $1;
}

# URL for the user's Home page.
our $HOME_PAGE = 'http://home.myspace.com/index.cfm?fuseaction=user';

# URL to the Browse page.
our $BROWSE_PAGE = 'http://browseusers.myspace.com/browse/Browse.aspx';

# What should we look for to see if there's a link to a friend's page?
our $FRIEND_REGEXP = qr/fuseaction=user\.viewprofile\&(amp;)?friendID=/io;

# What string should we look for if we're trying to post a comment to
# someone who isn't our friend?
our $NOT_FRIEND_ERROR='Error: You must be someone\'s friend to make '.
'comments about them\.'; # What should we look for to see if we are being asked for a CAPTCHA code? # We'll extract the URL to return from the area in parenthesis. our $CAPTCHA='
This error has been '. 'forwarded to MySpace\'s technical group\.', 'This user\'s profile has been temporarily '. 'disabled for special maintenance\.', 'This profile is undergoing routine maintenance. '. 'We apologize for the inconvenience', # Removed: Conflicts with "exceeded usage" message # 'An Error has occurred!!.*'. # 'An error has occurred (while )?trying to send this message.', 'We\'re doing some maintenance on the mail for certain users\. '. 'You can take this opportunity to leave your friend a swell comment '. 'while we work on it\. :\)', '

Error Occurred While Processing Request<\/H3>', ); @ERROR_REGEXPS = map qr/$_/i, @ERROR_REGEXPS; # What's the URL for a friend request button (to send a friend request)? our $ADD_FRIEND_URL = 'http://collect.myspace.com/index.cfm?'. 'fuseaction=invite.addfriend_verify&'. 'friendID='; # let's use this to keep track of various regexes that can be used elsewhere my %regex = ( friend_id => qr/fuseaction=mail\.message&friendID=([0-9]+)/o, friend_url => qr/www.myspace.com\/(\w*)\W+<\/title>/oixsm, is_band => qr/fuseaction=bandprofile/ioxsm, is_logged_in => qr/fuseaction=signout/io, is_private => qr/(This profile is set to private\. This user must add you as a friend to see his\/her profile\.)/io, is_invalid => qr/(Invalid Friend ID.
This user has either cancelled their membership, or their account has been deleted.)/io, is_comedy => qr/http\:\/\/.*?myspace\.com\/images\/comedy\/mscomedy\.gif/io, is_film => qr/http\:\/\/.*?myspace\.com\/images\/film_logo\.gif/io, is_music => qr/http\:\/\/.*?myspace\.com\/images\/music_logo\.gif/io, last_login => qr/Last Login:/io, basic_info => qr/Table2".*?>(.*Last Login:.*?)
/smo, basic_info_sub => qr/align="left">(.*)/smo, basic_info_band => qr/Arial, Helvetic, sans-serif">(.*Last Login:.*?)
/smo, comment_posted => qr/Your Comment has been posted/io, not_logged_in => qr/You Must Be Logged-In to do That\!/io, verify_message_sent => qr/Your Message Has Been Sent\!/o, comment_p1 => qr/ctl00\$(cp)?Main\$postComment\$commentTextBox.*<\/form|$NOT_FRIEND_ERROR|($CAPTCHA)|($INVALID_ID)/smio, comment_p2 => qr/ctl00\$(cp)?Main\$postComment\$Button1.*<\/form/smo, comment_approval_msg => qr/This user requires all comments to be approved before being posted/o, not_friend => qr/$NOT_FRIEND_ERROR/smo, bulletin_url => qr/fuseaction=bulletin\.edit/io, bulletin_post_action => qr/<\s*input .*?value\s*=\s*"Post".*?submitPage\s*\(\s*'\s*(.*?)\s*'/ismo, bulletin_p1 => qr/ctl00\$cpMain\$Subject_Textbox/io, bulletin_p2 => qr/Confirm\s+Bulletin/o, bulletin_confirm_action => qr/function postBulletin\(\).*?submitPage\('(.*?)'/ismo, bulletin_posted => qr/Bulletin Has Been Posted/io, verify_get_profile => qr/fuseaction=invite\.addfriend/io, exceed_usage => qr/User has exceeded their daily use?age/io, ); ###################################################################### # Methods # (These "sub" lines make section dividers in BBedit's function menu. # I'm sure there's a better way, so don't go "learning" anything from me # here. :) sub ____SET_OPTIONS__LOG_IN____ {} =head1 SET OPTIONS / LOG IN The new method takes the following options, all of which are optional. See the accessor methods below for defaults. Any option can be passed in a hash or hashref to the "new" method, and retreived or set using the appropriate accessor method below. account_name => 'myaccount', password => 'mypass', cache_dir => '/path/to/dir', cache_file => 'filename', # $cache_dir/$cache_file auto_login => 1 # 1 or 0, default is 1. human => 1 # Go slow. Saves bandwidth. =cut # Options they can pass via hash or hashref. 
const default_options => {
    # Options accepted by "new" as a hash or hashref. Where an option
    # has a default, it is set by its "field" declaration below.
    account_name           => 0,
    password               => 0,
    cache_dir              => 0,
    cache_file             => 0,
    auto_login             => 0,
    human                  => 0,
    max_get_attempts       => 0,
    max_post_attempts      => 0,
    captcha_killer_api_key => 0,
    captcha_tries          => 0,
};

# Options they can pass by position.
# Just "new( 'joe@myspace.com', 'mypass' )".
const positional_parameters => [ 'account_name', 'password' ];

=head1 OPTION ACCESSORS

These methods can be used to set/retrieve the respective option's value.
They're also up top here to document the option, which can be passed
directly to the "new" method.

=head2 account_name

Sets or returns the account name (email address) under which you're logged in.
Note that the account name is retrieved from the user or from your program
depending on how you called the "new" method. You'll probably only use this
accessor method to get account_name.

EXAMPLE

The following would prompt the user for their login information, then print
out the account name:

    use WWW::Myspace;
    my $myspace = new WWW::Myspace;

    print $myspace->account_name;

    $myspace->account_name( 'other_account@myspace.com' );
    $myspace->password( 'other_accounts_password' );
    $myspace->site_login;

WARNING: If you do change account_name, make sure you change password and
call site_login.  Changing account_name doesn't (currently) log you
out, nor does it clear "password".  If you change this and don't log in
under the new account, it'll just have the wrong value, which will probably
be ignored, but who knows.

=cut

field 'account_name';

=head2 password

Sets or returns the password you used, or will use, to log in. See the
warning under "account_name" above - same applies here.

=cut

field 'password';

=head2 cache_dir

WWW::Myspace stores the last account/password used in a cache file
for convenience if the user's entering it. Other modules store other
cache data as well.

cache_dir sets or returns the directory in which we should store cache
data. Defaults to $ENV{'HOME'}/.www-myspace.

If using this from a CGI script, you will need to provide the
account and password in the "new" method call, or call "new" with
"auto_login => 0" so cache_dir will not be used.

=cut

field cache_dir => catfile( $HOME_DIR, '.www-myspace' );

=head2 cache_file

Sets or returns the name of the file into which the login
cache data is stored. Defaults to login_cache.

If using this from a CGI script, you will need to provide the
account and password in the "new" method call, so cache_file will
not be used.

=cut

field cache_file => 'login_cache';

=head2 auto_login

Really only useful as an option passed to the "new" method when
creating a new WWW::Myspace object.

    # Don't log in, just create a new object
    my $myspace = new WWW::Myspace( auto_login => 0 );

Defaults to 1 for backwards compatibility.

=cut

field auto_login => 1;

=head2 human

When set to a true value (which is the default), adds delays to make
the module act more like a human. This is both to offset
"faux security" measures, and to conserve bandwidth. If you're dumb
enough to try to use multiple accounts to spam users who don't want to
hear what you have to say, you should turn this off
because it'll make your spamming go faster.

=cut

field human => 1;

=head2 max_get_attempts

This is only here by request and should probably be left alone.
Setting max_get_attempts controls the number of times the module
will attempt to get a page.  You can make your script really
robust by setting this to a really high number.  For example setting
it to about 17280 would make the module try to get a given page for about
24 hours before giving up.  Default is 20.
You could also set this to a lower number if you wanted to be "nice" to
Myspace, although since get_page mostly retries on errors, this is a bit
pointless.  Note though that on some occasions if a regular
expression on the page being requested doesn't match (possibly due to a
change in the site), get_page will keep trying a page that will never
load up to max_get_attempts times.

=cut

field max_get_attempts => 20;

=head2 max_post_attempts

This is the form version of max_get_attempts. This controls the number
of times the submit_form function will attempt to submit a form before
giving up. This defaults to 5.  This should probably be kept at 5 since
posting a form means you're usually sending some data (i.e. a comment),
so in the event of a problem (such as the regular expression
matching issue mentioned in max_get_attempts above), you could in
theory be posting a successful form up to max_post_attempts times.
In normal operation, however, submit_form will attempt to post until the
post is successful, no matter what the outcome, so it will only retry
if it gets an error page or the page doesn't match an expected regular
expression.  That is, when you're using myspace and have to keep
trying things, submit_form does the same thing, but only up to
max_post_attempts times.  Change at your own risk.

=cut

field max_post_attempts => 5;

=head2 captcha_killer_api_key

If you have an API key for captchakiller.com, you can set it using this
method, or pass it to the "new" method when creating the myspace object.
Methods that support it will use captchakiller to process captchas.

    use WWW::Myspace;

    my $myspace = new WWW::Myspace( captcha_killer_api_key => 'asdfjhasdfe' );

=cut

field captcha_killer_api_key => "";

=head2 captcha_tries

Sets or returns the number of attempts that should be made to retrieve the
captcha code (basically, how long it should wait before it gives up - each
try takes about 5 seconds).

Defaults to 20.

=cut

field captcha_tries => 20;

#---------------------------------------------------------------------
# new method
# If we're passed an account and possibly a password, we store them.
# Otherwise, we check the login cache file, and if we still
# don't have them, we ask the user.

=head2 new( $account, $password )

=head2 new( )

If called without the optional account and password, the new method
looks in a user-specific preferences file in the user's home
directory for the last-used account and password. It prompts
for the username and password with which to log in, providing
the last-used data (from the preferences file) as defaults.

Once the account and password have been retrieved, the new method
automatically invokes the "site_login" method and returns a new
WWW::Myspace object reference. The new object already contains the
content of the user's "home" page, the user's friend ID, and
a UserAgent object used internally as the "browser" that is used
by all methods in the WWW::Myspace class.

Myspace.pm is now a subclass of WWW::Myspace::MyBase (I couldn't resist,
sorry), which basically just means you can call new in many ways:

    EXAMPLES
        use WWW::Myspace;

        # Prompt for username and password
        my $myspace = new WWW::Myspace;

        # Pass just username and password
        my $myspace = new WWW::Myspace( 'my@email.com', 'mypass' );

        # Pass options as a hashref
        my $myspace = new WWW::Myspace( {
            account_name => 'my@email.com',
            password => 'mypass',
            cache_file => 'passcache',
        } );

        # Hash
        my $myspace = new WWW::Myspace(
            account_name => 'my@email.com',
            password => 'mypass',
            cache_file => 'passcache',
            auto_login => 0,
        );

        # Print my friend ID
        print $myspace->my_friend_id;

        # Print the contents of the home page
        print $myspace->current_page->decoded_content;

        # Print all my friends with a link to their profile.
        @friend_ids = $myspace->get_friends;
        foreach $id ( @friend_ids ) {
            print 'http://profile.myspace.com/index.cfm?'.
                'fuseaction=user.viewprofile&friendID='.
${id}."\n";
        }

        # How many friends do we have? (Note: we don't include Tom
        # because he's everybody's friend and we don't want to be
        # bugging him with comments and such).
        print @friend_ids . " friends (not incl Tom)\n";

=cut

# _old_new
# Legacy constructor: blesses an empty hash, takes the account name and
# password positionally, asks the user for them if no account name was
# given, then logs in.
# (The empty parens tell Spiffy not to insert "my $self = shift;".)
sub _old_new() {
    my $proto = shift;
    my $class = ref($proto) || $proto;
    my $self  = bless {}, $class;

    $self->{account_name} = shift if @_;
    $self->{password}     = shift if @_;

    # Get account/password from the user
    $self->_get_acct() unless $self->{account_name};

    # And for convenience, log in
    $self->_site_login();

    return $self;
}

# new
# Builds the object via the parent constructor, then either logs in
# (auto_login true) or just resets the login state.
# (The empty parens tell Spiffy not to insert "my $self = shift;".)
sub new() {
    # Call the MyBase new method (it's ok to feel special about it).
    my $self = super;

    unless ( $self->auto_login ) {
        # Not logging in. We still call logout because it resets
        # variables and gets the Mech object.
        $self->logout;
        return $self;
    }

    # Prompt for username/password if we don't have them yet.
    # (should this be moved to site_login?)
    $self->_get_acct unless $self->account_name;
    $self->site_login;

    return $self;
}

#---------------------------------------------------------------------
# site_login()
# Log into myspace with the stored account login name, password, and
# URL (probably "http://www.myspace.com/")

=head2 site_login

Logs into the myspace account identified by the "account_name" and
"password" options.  You don't need to call this right now,
because "new" does it for you.  BUT I PLAN TO CHANGE THAT.  You don't
need to be logged in to access certain functions, so it's semi-silly
to make you log in the second you call "new".  Plus, it's not good
practice to have "new" require stuff. Bad me.

If you call the new method with "auto_login => 0", you'll need to
call this method if you want to log in.

It's also called automatically if the _check_login method finds that
you've been mysteriously logged out, for example if Myspace.com were
written in Cold Fusion running on Windows.

If the login gets a "you must be logged-in" page when you first try to
log in, $myspace->error will be set to an error message that says to
check the username and password.

Once login is successful for a given username/password combination,
the object "remembers" that the username/password
is valid, and if it encounters a "you must be logged-in" page, it will
try up to 20 times to re-login.  Clever, huh?

=cut

sub site_login {

    # Reset everything (oddly, this also happens to create a new browser
    # object).
    $self->logout;

    # Both credentials are required before we try anything.
    $self->account_name
        or croak "site_login called but account_name isn't set";
    $self->password
        or croak "site_login called but password isn't set";

    # Now log in
    $self->_try_login;
    return if $self->error;

    # We probably have an ad or somesuch (started 1/7/2006)
    # so explicitly request our Home.
    # We can't click "home", because as of 10/10/07 Myspace sets the Home
    # link using Javascript if you're logged in.  Why do the work on the
    # server when you can just add extra code and do it on the browser instead?
    # In fact, why not just make all of Myspace run in the browser?
    $self->follow_to( $HOME_PAGE, '' )
        or warn "Couldn't go to user's home page";
#    ( $DEBUG ) && warn $self->current_page->content;

    # Verify we're logged in; bail out with an error message if not.
    unless ( $self->_apply_regex( regex => 'is_logged_in' ) ) {
        $self->logged_in( 0 );
        $self->error( "Login Failed. Couldn't verify load of home page." )
            unless $self->error;
        warn $self->current_page->decoded_content if $DEBUG;
        return;
    }

    $self->logged_in( 1 );
    warn "Logged in\n" if $DEBUG;

    # Initialize basic account/login-specific settings after login
    $self->_init_account;

}

# _try_login
# You call this as $self->_try_login. Attempts to log in using
# the set account_name and password. It gets and submits the login form,
# then checks for a valid submission and for a "you must be logged-in"
# page.
# If called with a number as an argument, tries that many times to
# submit the form. It calls itself recursively.
sub _try_login {

    # Set the recursive tries counter. A true count is decremented and
    # we give up once it drops below 1; when called without an argument
    # we start with 20 tries.
    my ( $tries_left ) = @_;
    if ( $tries_left ) { $tries_left--; return if ( $tries_left ) < 1; }
    $tries_left = 20 unless defined $tries_left;

    # Submit the login form.  They have two different ones, so if we see
    # indication of the ASP form (new as of late Jun 2007), use it,
    # otherwise use the CFM version.
    # 9/17/07 - they changed from "ctl01" to "ctl00", so we check for both
    # in case they go back and forth ("ctl00" is checked first).
    my $submitted = "";
    my $found_asp_form = 0;

    $self->get_page( 'http://www.myspace.com/' );
    my $content = $self->current_page->decoded_content;

    for my $ctl ( 'ctl00', 'ctl01' ) {
        my $prefix      = 'ctl00$Main$SplashDisplay$' . $ctl . '$';
        my $email_field = $prefix . 'Email_Textbox';
        next unless $content =~ /\Q$email_field\E/i;

        # (Earlier revisions also experimented with passing "page",
        # "__EVENTTARGET"/"__EVENTARGUMENT" and "no_click" here.)
        $submitted = $self->submit_form( {
            form_name => 'aspnetForm',
            fields_ref => {
                $email_field                 => $self->account_name,
                $prefix . 'Password_Textbox' => $self->password,
            },
            action => 'http://secure.myspace.com/index.cfm?fuseaction=login.process',
        } );
        $found_asp_form = 1;
        last;
    }

    unless ( $found_asp_form ) {
        # CFM version of the form: pick whichever login button is present.
        my $btn_name =
            $content =~ /ctl00\$Main\$SplashDisplay\$ctl00\$loginbutton/
                ? 'ctl00$Main$SplashDisplay$ctl00$loginbutton'
                : 'ctl00$Main$SplashDisplay$ctl01$loginbutton';

        $submitted = $self->submit_form( {
            form_name => 'theForm',
            fields_ref => {
                email    => $self->account_name,
                password => $self->password,
            },
            button => $btn_name
        } );
    }

    # Check for success
    if ( $submitted ) {
#        ( $DEBUG ) && print $self->current_page->decoded_content;

        # Check for invalid login page, which means we either have
        # an invalid login/password, or myspace is messing up again.
        unless ( $self->_check_login ) {
            # Fail unless we already know this account/password is good, in
            # which case we'll just beat the door down until we can get in
            # or the maximum number of attempts has been reached.
            if ( $self->_account_verified ) {
                $self->_try_login( $tries_left );
            } else {
                $self->error( "Login Failed. Got 'You Must Be Logged-In' page ".
                    "when logging in.\nCheck username and password." );
                return;
            }
        }
    } else {
        return;
#        croak $self->error;
    }

}

# _account_verified
# Returns true if we've verified that the current account and password
# are valid (by successfully logging in with them): _init_account
# remembers the password that worked for each account name, and we
# compare the current password against it.
sub _account_verified {

    my $verified_password =
        $self->{_account_verified}->{ $self->account_name };

    # String comparison. (This used to be "=", which tried to assign to
    # the result of the password accessor instead of comparing.)
    return ( $verified_password
          && ( $self->password eq $verified_password ) );

}

# _init_account
# Initialize basic account/login-specific settings after login
sub _init_account {

    # Get our friend ID from our home page (which happens to
    # be the page we go to after logging in).
    $self->_get_friend_id( $self->current_page );

    # If for some reason we couldn't set this, fail login.
    unless ( $self->my_friend_id ) { $self->logged_in(0) ; return }

    # Set the user_name and friend_count fields.
    $self->user_name( $self->current_page );
    $self->friend_count( $self->current_page );

    # Cache whether or not we're a band.
    $self->is_band;

    # Note that we've verified this account/password
    $self->{_account_verified}->{ $self->account_name } = $self->password;

}

=head2 mech_params

Pass this method the parameters you wish the WWW::Mechanize object to
use, inside a hash reference. They are merged over the built-in
defaults the next time the browser object is created. For example:

    $myspace->mech_params({
        onerror => undef,
        agent => 'Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1)',
        stack_depth => 1,
        quiet => 1,
    });

See the docs for WWW::Mechanize for more information.  You should really
know what you are doing before using this feature.

=cut

field mech_params => undef;

# _new_mech
# Creates a fresh WWW::Mechanize object from the default parameters,
# overridden by anything set through mech_params, and stores it in the
# "mech" field. A non-hashref mech_params value is ignored with a warning.
sub _new_mech {

    my %mech_args = (
        onerror     => undef,
        agent       => 'Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1)',
        stack_depth => 1,
        quiet       => 1,
    );

    my $overrides = $self->mech_params();
    if ( defined $overrides ) {
        if ( ref($overrides) eq "HASH" ) {
            # Later keys win, so the caller's values replace the defaults.
            %mech_args = ( %mech_args, %$overrides );
        } else {
            warn "Please pass mech_params() a HASH reference. Thanks!\n";
        }
    }

    # Set up our web browser (WWW::Mechanize object)
    $self->mech( WWW::Mechanize->new( %mech_args ) );

    # We need to follow redirects for POST too.
    push @{ $self->mech->requests_redirectable }, 'POST';

}

=head2 logout

Clears the current web browsing object and resets any login-specific
internal values.  Currently this drops and creates a new WWW::Mechanize
object.  This may change in the future to actually clicking "logout"
or something.

=cut

sub logout {

    # If you change this to just log out instead of making a new Mech
    # object, be sure you change site_login too.
    $self->_new_mech;

    # Clear anything login-specific
    $self->{user_name}    = undef;
    $self->{is_band}      = undef;
    $self->{my_friend_id} = undef;
    $self->logged_in(0);
    $self->error(0);
    $self->{page_cache}   = undef;

    # Do NOT clear options that are set by the user!
#    $self->{account_name} = undef;
#    $self->{password} = undef;

}

=head2 get_login_form

This handy little convenience method returns a string of HTML code
that is a login form pre-filled with the account_name and password.
I use it in a little "Dashboard" script I wrote that displays the notifications and a Login button. use WWW::Myspace; use CGI qw/:standard/;; my $myspace = new WWW::Myspace; # Display a login form print header, start_html('Is it worth logging in?'), $myspace->get_login_form, end_html; =cut sub get_login_form { my $x = '
' . '' . '' . ''. '
';
    return $x;
}

#---------------------------------------------------------------------
# Value return methods
# These methods return internal data that is of use to outsiders

sub ____CHECK_STATUS____ {}

=head1 CHECK STATUS

=head2 logged_in

Returns true if login was successful. When you call the new method
of WWW::Myspace, the class logs in using the username and password you
provided (or that it prompted for).  It then retrieves your "home"
page (the one you see when you click the "Home" button on myspace.com),
and checks it against an RE.  If the page matches the RE, logged_in is
set to a true value. Otherwise it's set to a false value.

 Notes:
 - This method is only set on login. If you're logged out somehow,
   this method won't tell you that (yet - I may add that later).
 - The internal login method calls this method to set the value.
   You can (currently) call logged_in with a value, and it'll set
   it, but that would be stupid, and it might not work later
   anyway, so don't.

 Examples:

 my $myspace = new WWW::Myspace;
 unless ( $myspace->logged_in ) {
    die "Login failed\n";
 }

 # This will try forever to log in
 my $myspace;

 do {
    $myspace = new WWW::Myspace( $username, $password );
 } until ( $myspace->logged_in );

=cut

field logged_in => 0;

=head2 error

This value is set by some methods to return an error message.
If there's no error, it returns a false value, so you can do this:

 $myspace->get_profile( 12345 );
 if ( $myspace->error ) {
     warn $myspace->error . "\n";
 } else {
     # Do stuff
 }

=cut

field 'error' => 0;

=head2 current_page

Returns a reference to an HTTP::Response object that contains the last page
retrieved by the WWW::Myspace object. All methods (i.e. get_page, post_comment,
get_profile, etc) set this value.

EXAMPLE

The following will print the content of the user's profile page:

    use WWW::Myspace;
    my $myspace = new WWW::Myspace;

    print $myspace->current_page->decoded_content;

=cut

sub current_page {

    # Plain getter: hands back whatever is stored under {current_page};
    # any arguments are ignored.
    return $self->{current_page};

}

=head2 mech

The internal WWW::Mechanize object.  Use at your own risk: I don't
promise this method will stay here or work the same in the future.
The internal methods used to access Myspace are subject to change at
any time, including using something different than WWW::Mechanize.

=cut

field 'mech';

sub ____GET_INFO____ {}

=head1 GET INFO

=head2 get_notifications

Returns a hash of status codes and printable indicators for
"New" indicators ("New Messages!", "New Comments!", etc). Note that you
probably want to call this right after logging in, as if you use any
of the "read" methods, Myspace will reset that indicator. For example,
if you use "get_inbox", Myspace will think you looked at your mail.

Codes returned are:

 NC  => New Comments!
 NM  => New Messages!
 NFR => New Friend Requests!
 NIC => New Image Comments!
 EV  => New Event Invitation!
 BC  => New Blog Comments!
 BP  => New Blog Posts!

    # Print all notifications
    use WWW::Myspace;

    my $myspace = new WWW::Myspace( $account, $password );

    my ( %notifiers ) = $myspace->get_notifications;

    foreach $code ( keys( %notifiers ) ) {
        print $notifiers{ $code };
    }

    # CGI script to display notifications and a Login button
    # to click if it's worth logging in (be sure you provide the
    # account and password ;-):
    use CGI qw/:standard/;
    use WWW::Myspace;

    my $myspace = new WWW::Myspace( $account, $password );

    print header, start_html('Is it worth logging in?');

    my ( %notifiers ) = $myspace->get_notifications;

    foreach $code ( keys( %notifiers ) ) {
        print $notifiers{ $code }, br;
    }

    print p, $myspace->get_login_form, p, end_html;

=cut

my $stats_ref = {
    'NC' => {
        'search' => {
            css => '
', db => 'New Comments!', }, 'display' => 'New Comments!' }, 'NM' => { 'search' => { css => '
', db => 'New Messages!' }, 'display' => 'New Messages!' }, 'NFR' => { 'search' => { css => '
', db => 'New Friend Requests!', }, 'display' => 'New Friend Requests!' }, 'NIC' => { 'search' => { css => '
', db => 'New Photo Comments!', }, 'display' => 'New Image Comments!' }, 'EV' => { 'search' => { css => '
', db => 'New Event Invitation!', }, 'display' => 'New Event Invitation!' }, 'BC' => { 'search' => { css => '
', db => 'New Blog Comments!', }, 'display' => 'New Blog Comments!' }, 'BP' => { 'search' => { css => '
', db => 'New Blog Posts!', }, 'display' => 'New Blog Posts!' } }; sub get_notifications { $self->_go_home; my %data = (); my $page = $self->current_page->decoded_content; $page =~ s/[ \t\n\r]+/ /g; # (Eliminate extra whitespace) # Myspace uses two techniques for displaying this data, and they # keep switching back and forth. Figure out which one they're doing # this week... my $dt; if ( $page =~ /
{"$stat_type"}->{'search'}->{"$dt"}; if ( $page =~ /$re/i ) { $data{"$stat_type"} = $stats_ref->{"$stat_type"}->{'display'} } } # Number of friends $data{"friends"} = "You have " . $self->friend_count . " friends"; # Return the data return %data; } =head2 my_friend_id Returns the friendID of the user you're logged in as. Croaks if you're not logged in. EXAMPLE print $myspace->my_friend_id; =cut sub my_friend_id { $self->_die_unless_logged_in( 'my_friend_id' ); return $self->{my_friend_id}; } =head2 is_band( [friend_id] ) Returns true if friend_id is a band profile. If friend_id isn't passed, returns true if the account you're logged in under is a band account. If it can't get the profile page it returns -1 and you can check $myspace->error for the reason (returns a printable message). This is used by send_friend_request to not send friend requests to people who don't accept them from bands, as myspace passively accepts the friend request without displaying an error, but doesn't add the friend request. EXAMPLE $myspace->is_band( $friend_id ); if ( $myspace->error ) { die $myspace->error . "\n"; } else { print "They're a band, go listen to them!\n"; } IMPORTANT: You can NOT assume that a profile is a personal profile if is_band is false. It could be a film profile or some future type of profile. There is currently no test for a personal or film profile. =cut sub is_band { my ( $friend_id ) = @_; # If they gave a friend_id, we load the profile and look at it. # If not, we return, or set, our internal is_band variable. if ( defined $friend_id ) { # Get the profile page my $res = $self->get_profile( $friend_id ); unless ( $self->error ) { # Scan the page for band-specific RE if ( $res->decoded_content =~ $regex{'is_band'} ) { return 1; } else { return 0; } } else { return -1; } } else { # Check for the "upcoming shows" header. This might very well # appear on other types of profiles (i.e. comedy), but it # distinguishes performers from personal profiles pretty well. 
# Note that this requires is_band to be called for the first time # just after loading the login profile page. site_login calls # this method to take care of that problem. unless ( defined $self->{is_band} ) { if ( $self->current_page->decoded_content =~ /\s*Upcoming Shows\s*<\/h/io ) { $self->{is_band} = 1; } else { $self->{is_band} = 0; } } return $self->{is_band}; } } =head2 is_comedy( [ $friend_id | friend_id => $friend_id ] [ page => $page ] ); Returns true if the specified profile is a comedy page. The method checks for the existence of the "Myspace Comedy" graphic on the page. =cut sub is_comedy { my $page = $self->_validate_page_request( @_ ); if ( $page ) { if ( $self->_apply_regex( regex=> 'is_comedy' ) ) { return 1; } else { return 0; } } return; } =head2 is_private( friend_id => $friend_id || page => $page ) Returns true if we think the profile has been set to private. You should note that you will get the most accurate results if you use this method while *not* logged in. If you *are* logged in and you check the profile of someone who is your friend, you will never get a true response returned you, even if this person has their profile set to private. There will be no warnings or errors if you call this method while logged in. We trust you'll "do the right thing". You can choose to pass either a friend_id OR a Myspace profile page in the form of a response object. You may use the get_profile method or just fetch the page on your own use WWW::Mechanize or an object which provides a $obj->decoded_content method. Returns true (1) if profile is private. Otherwise returns false (0). Returns undef and sets $myspace->error if there is an error. 
The following is a thorough privacy check with error checking:

    if ( $myspace->is_private( friend_id => $friend_id ) ) {
        print "Ooh, it's private...\n";
    } elsif ( $myspace->error ) {
        print $myspace->error;
    } else {
        print "It's so not private.\n";
    }

=cut

sub is_private {

    my $page = $self->_validate_page_request( @_ );

    # Nothing to inspect.
    return unless defined $page;

    # The dedicated 'is_private' pattern is the primary test.
    return 1 if $self->_apply_regex( page => $page, regex => 'is_private' );

    # The fallback heuristics below are only trusted when no error is
    # pending; with an error set we report "not private".
    return 0 if $self->error();

    # Inspect the page we validated above rather than whatever the
    # browser's current page happens to be, so that a caller-supplied
    # "page => $page" is the page the heuristics are applied to.
    my $content = $page->decoded_content;

    # An invite link on the page means the profile is not private.
    return 0 if $content =~ /fuseaction=user\.invite/;

    # No reference to friends.myspace.com at all: treat it as private.
    return 1 if $content !~ /friends\.myspace\.com/;

    return 0;

}

=head2 is_invalid( friend_id => $friend_id || page => $page )

Returns true if we think the profile is invalid or disabled.

You can choose to pass either a friend_id OR a Myspace profile page in the
form of a response object.  You may use the get_profile method or just
fetch the page on your own using WWW::Mechanize or an object which
provides a $obj->decoded_content method.

Returns true (1) if profile is invalid/disabled.  Otherwise returns
false (0).  Returns undef and sets $myspace->error if there is an error.

    # Thorough invalid profile check with error checking
    if ( $myspace->is_invalid( friend_id => $friend_id ) ) {
        print "Profile is invalid or disabled.\n";
    } elsif ( $myspace->error ) {
        print $myspace->error;
    } else {
        print "Profile seems fine to me.\n";
    }

=cut

sub is_invalid {

    # no_validation is passed through so the page request is not
    # rejected before we get a chance to look at it.
    my $page = $self->_validate_page_request( @_, no_validation => 1 );

    return unless defined $page;

    print "page defined" if $DEBUG;

    my $invalid = $self->_apply_regex(
        page  => $page,
        regex => 'is_invalid',
    );

    print $page->decoded_content if $DEBUG;

    return $invalid ? 1 : 0;

}

=head2 user_name

Returns the profile name of the logged in account. This is the
name that shows up at the top of your profile page above your picture.
This is NOT the account name.

Normally you'll only retrieve the value with this method.
When logging in, the internal login method calls this routine with the contents of the profile page and this method extracts the user_name from the page code. You can, if you really need to, call user_name with the contents of a page to have it extract the user_name from it. This may not be supported in the future, so it's not recommended. =cut sub user_name { # Otherwise if they gave us a home page, get user's name. if ( @_ ) { my ( $homepage ) = @_; my $page_source = $homepage->decoded_content; if ( $page_source =~ /

\s*Hello,(\s| )+(.*)\!\s*<\/h4>/o ) { # my $line = $1; # $line =~ s/\+/ /g; # $line =~ s/%([a-fA-F0-9][a-fA-F0-9])/pack("C", hex($1))/eg; $self->{user_name} = $2; } } return $self->{user_name}; } =head2 friend_user_name( [friend_id] ) Returns the profile name of the friend specified by friend_id. This is the name that shows up at the top of their profile page above their picture. If no friend_id is specified, this method scans the current page so you can do: $myspace->get_profile( $friend_id ); print $myspace->friend_user_name; (Note, DON'T go using this to sign comments because most users use funky names and it'll just look cheesy. If you really want to personalize things, write a table mapping friend IDs to first names - you'll have to enter them yourself). =cut sub friend_user_name { my $page; if ( @_ ) { $page = $self->get_profile( @_ ); } else { $page = $self->current_page; } if ( $page->decoded_content =~ /(.*?)<\/span>/o ) { my $line = $1; # $line =~ s/\+/ /g; # $line =~ s/%([a-fA-F0-9][a-fA-F0-9])/pack("C", hex($1))/eg; return $line; } else { return ""; } } =head2 friend_url( [friend_id] ) Returns the custom URL of friend_id's profile page. If they haven't specified one, it returns an empty string. Example: foreach my $friend_id ( $myspace->get_friends ) { my $url = $myspace->friend_url( $friend_id ); if ( $url ) { print 'Friend's custom URL: http://www.myspace.com/' . $myspace->friend_url( $friend_id ); } else { print 'Friend doesn't have a custom URL. Use: '. 'http://www.myspace.com/' . $friend_id; } } If no friend_id is specified, this method scans the current page so you can do: $myspace->get_profile( $friend_id ); print $myspace->friend_url; =cut sub friend_url { my $page; if ( @_ ) { $page = $self->get_profile( @_ ); } else { $page = $self->current_page; } return $self->_apply_regex( regex => 'friend_url', page => $page ); } =head2 friend_id ( friend_url ) Returns the friend_id corresponding to a given custom URL. 
(This is basically the reverse of friend_url).

    # Print the friendID of Amber G: myspace.com/iamamberg
    print $myspace->friend_id("iamamberg");

    > 37033247

If no friend_url is specified, this method scans the current page
so you can do:

    $myspace->get_profile( "iamamberg" );
    print $myspace->friend_id;

Returns nothing (undef / empty list) if no friendID could be found.

=cut

sub friend_id {

    my ( $friend_url ) = @_;

    my $page;
    if ( $friend_url ) {

        # Drop trailing slashes first so that a full URL such as
        # "http://www.myspace.com/iamamberg/" still yields "iamamberg"
        # instead of an empty name.
        $friend_url =~ s{/+\z}{};

        # If they gave a full URL chop off all but the last part.
        $friend_url =~ s/^.*\///;

        # Get page corresponding to the given custom URL
        $page = $self->get_page( $BASE_URL . $friend_url );
    }
    else {
        $page = $self->current_page;
    }

    # Look for a RE that's near the top of the page that contains friendid
    if ( defined $page
        && $page->decoded_content =~ $self->_regex('friend_id') )
    {
        return $1;
    }

    return;

}

=head2 C<get_real_name( [ friend_id => $friend_id | page => $page ] )>

Tries to determine the real name of the person whose profile is
specified. It does this by looking for "my name is ____" or
"my real name is _____" on their profile page. The regex used
takes several common myspace grammar/spelling errors into account.

If passed no arguments, get_real_name parses the current page.
If passed a friend_id, it calls get_profile to retrieve the friend's
profile page.
If passed a page (an HTTP::Response object), it parses
$page->decoded_content.

Returns the name with only its first letter capitalized, or nothing
(undef / empty list) if no name was found or no page was available.

=cut

sub get_real_name {

    my ( $page ) = $self->_validate_page_request( @_ );

    # Without a page there is nothing to parse, and calling
    # decoded_content on an undefined value would die.
    return unless defined $page;

    # Matches: "my name is ___", "my real name is ___", "my name's ___",
    # "my namez ___", "my name'z ___", etc. Makes sure it's before the
    # top friends section (because someone could have a profile named
    # "my name's joe", or leave a similar comment).
    if ( $page->decoded_content =~ /my (real )?(name i[sz]|name'?[sz])\s+(\w+).*class="friendSpace"/ismo ) {
        return ucfirst( lc( $3 ) );
    }

    return;

}

=head2 friend_count

Returns the logged in user's friend count as displayed on the
profile page ("You have NN friends").
Note that due to one of WWW::Myspace's many bugs, this count may not be equal to the count of friends returned by get_friends. Like the user_name method, friend_count is called by the internal login method with the contents of the user's profile page, from which it extracts the friend count using a regexp on the "You have NN friends" string. If you need to, you can do so also, but again this might not be supported in the future so do so at your own risk. =cut sub friend_count { # If they gave us a page, set friend_count. if ( @_ ) { my ( $homepage ) = @_; my $page_source = $homepage->decoded_content; if ( $page_source =~ /You have(\s| |)*(]+>)?([0-9]+)(<\/a>)?(<\/span>|\s| )*friends/o ) { $self->{friend_count} = $3; } # has someone else's friend count been requested? in this case, # return the value and don't stuff it into self elsif ( $page_source =~ /has (\d{1,})<\/span> friends\./ ){ return $1; } } return $self->{friend_count}; } =head2 last_login( [friend_id] ) Returns the last login date from the specified profile in Perl "time" format. As of WWW::Myspace 0.70, uses the Time::ParseDate module's "parsedate" method to parse the date according to your system's locale settings. This was done to allow for UK-style dates, which myspace seems to display based either on your profile settings, if you're logged in, or based on your IP address if not logged in. If no friend_id is specified, this method scans the current page so you can do: $myspace->get_profile( $friend_id ); ($sec,$min,$hour,$mday,$mon,$year,$wday,$yday,$isdst) = localtime( $myspace->last_login ); # or if ( $myspace->last_login( $friend_id ) < today - 3600 * 60 ) { print "They haven't logged in in 60 days!" } =cut sub last_login { my ( $page, $time ); if ( @_ ) { $page = $self->get_profile( @_ ) or return; } else { $page = $self->current_page; } if ( $page && $page->decoded_content =~ /Last Login:(\s| )+([0-9]+\/[0-9]+\/[0-9]+)\s*
/o ) { # Convert to Perl's time format. my $time = parsedate( "$2", DATE_REQUIRED => 1); # From Time::ParseDate $self->error( "Unable to parse date: $1" ) unless $time; # eval { $time = timelocal( 0, 0, 0, $3, $2 - 1, $4 ); }; # From Time::Local # $self->error( $@ . "\nDate found was $2/$3/$4" ); # Need to report to the caller if we got an error. # Return it. return $time; } else { $self->error("Last Login regex not found on profile page"); return; } } =head2 last_login_ymd ( $friend_id || friend_id => $friend_id || page => $page ) Returns the "Last Login" date for a given friend_id in YMD format. Behaves the same as profile_views. See profile_views for documentation on passing parameters to this function. =cut sub last_login_ymd { my $page = $self->_validate_page_request( @_ ); if ( defined $page ) { my $content = $page->decoded_content; $content =~ s/\n//g; # Band pages. if ( $content =~ /Last\sLogin: \s*(\d{1,})\/(\d{1,})\/(\d{4})/igmsoxc ) { return join("-", $3, $1, $2); } # Personal pages elsif ( $content =~ /Last\sLogin:\s*(\d{1,})\/(\d{1,})\/(\d{4})/igmsoxc ) { return join("-", $3, $1, $2); } } return; } #--------------------------------------------------------------------- # get_profile( $friend_id ) # Return the friend's profile page as an HTTP::Response object =head2 get_profile( $friend_id || $friend_url ) Gets the profile identified by $friend_id or $friend_url. That means both of these will work: $myspace->get_profile( "12345" ); $myspace->get_profile( "hilaryduff" ); Returns a reference to a HTTP::Response object that contains the profile page for $friend_id. The following displays the HTML source code of the friend's profile identified by "$friend_id": my $res = $myspace->get_profile( $friend_id ); print $res->decoded_content; =cut sub get_profile { # $no_validate is used by the internal _validate_page_request method # in case a method needs to specifically check for an invalid # profile or somesuch. 
my ( $friend_id, $no_validate ) = @_; my $re = 'verify_get_profile'; $re = undef if ( $no_validate ); return $self->get_page( "${BASE_URL}${friend_id}", $re ); } =head2 profile_views( $friend_id || friend_id => $friend_id || page => $page ) Returns the listed number of Profile Views for a given friend_id. This has only been tested on band profiles. You can choose to pass either a friend_id OR a Myspace profile page in the form of a response object. You may use the get_profile method or just fetch the page on your own use WWW::Mechanize or an object which provides a $obj->decoded_content method. EXAMPLE my $views = $myspace->profile_views( friend_id => $friend_id ); OR my $page = $myspace->get_profile( $friend_id ); $myspace->profile_views( page => $page ); =cut sub profile_views { my $page = $self->_validate_page_request( @_ ); if ( defined $page ) { my $content = $page->decoded_content; $content =~ s/\n//g; # Scan the page for band-specific RE (the music player plug-in). if ( $content =~ /Profile\sViews: \s*(\d{1,})/igmsoxc ) { return $1; } } return; } =head2 comment_count( $friend_id || friend_id => $friend_id || page => $page ) Returns the listed number comments posted a given friend_id. Behaves the same way as profile_views. See profile_views for documentation on passing parameters to this function. 
=cut

sub comment_count {

    my $page = $self->_validate_page_request( @_ );

    # No page: nothing to count.
    unless ( defined $page ) {
        print "page undefined" if $DEBUG;
        return;
    }

    # Work on a copy of the page source with all newlines removed.
    my $source = $page->decoded_content;
    $source =~ s/\n//g;

    # "Displaying N of M comments": M is the total we want.
    return $1
        if $source =~ /Displaying \d{1,} <\/span>of (\d{1,}) <\/span>comments/;

    # check whether there are zero comments on profile
    return 0 if $source =~ /.*?Friends Comments/;

    print "can't find comment count" if $DEBUG;

    return;

}

=head2 get_basic_info( $friend_id || friend_id => $friend_id || page => $page );

This routine takes either a friend_id or a page response object and
returns a hash of information containing:

  country    - country in profile (names of countries are as
               standardized on MySpace)
  cityregion - the line with city and region information (this is
               free text)
  headline   - whatever it says next to the picture (including quotes)
  lastlogin  - date of last login
  city       - city*
  region     - region*

In addition, for profiles of individuals it returns:

  age    - as number
  gender - as text, either male or female

while for band/music profiles it returns:

  profileviews - number of people that checked the profile

EXAMPLE:

    my ( %info ) = $myspace->get_basic_info( $friend_id );
    print "Your friend is $info{'age'} years old and is a $info{'gender'}.\n";
    # sample output: Your friend is 25 years old and is a female.

* Note: MySpace joins the profile data from city and region to one line
(such as Berlin, Germany). However, both city and region are free text so
people can write whatever they want. What is more, region and city are
optional. This function tries to extract the city and the region by
splitting cityregion at the last comma and does some other guesswork if
there is only one value. However, it might not work (depending on the
profile information) so both city and region can either be undefined or
empty.

See profile_views for documentation on passing parameters to this function.
=cut sub get_basic_info { # Get and decode the page into HTML source my $page = $self->_validate_page_request( @_ ); my %info = (); #first find out what kind of profile this is #as band profiles work a bit different from #personal, film and comedy profiles my $type=$self->get_profile_type(page => $page); return undef if($self->error); #if it is not a band profile unless($type == 2){ $page = $self->_apply_regex( regex => 'basic_info', page => $page ); $page = $self->_apply_regex( regex => 'basic_info_sub', source => $page ); #assign values and trim leading and trailing white spaces ( $info{'headline'},undef,$info{'gender'}, $info{'age'},$info{'cityregion'},$info{'country'}, undef,undef,$info{'lastlogin'} )=map {s/^\s+//;s/\s+$//;$_} split('
',$page); #return age as number only $info{'age'} =~ s/^(\d+).*/$1/; #return last login as date only $info{'lastlogin'} =~ s/Last Login:\s+([\d\/]*)/$1/; } #separately for band profiles else{ $page = $self->_apply_regex( regex => 'basic_info_band', page => $page ); $page =~ s/<\/strong><\/font>//; #assign values and trim leading and trailing white spaces ( $info{'headline'},undef,$info{'cityregion'}, $info{'country'},undef,$info{'profileviews'}, undef,undef,undef,$info{'lastlogin'} )=map {s/^\s+//;s/\s+$//;$_} split('
',$page); #make sure profile views returns only the number $info{'profileviews'}=~ s/[^\d]*([\d]+)/$1/sm; #return last login as date only $info{'lastlogin'} =~ s/Last Login:[^\d]*([\d\/]+)/$1/sm; } ( $DEBUG ) && print %info,"\n"; #let's guess what is the city and what the region if ($info{'cityregion'} =~ /(.*),\s*(.*)/){ $info{'city'} = $1; $info{'region'} = $2; }elsif($info{'cityregion'} =~ /(.+)/){ $info{'region'} = $1; } return (%info); } =head2 get_comments( $friend_id ) Returns a list of hashrefs, like "get_inbox", of comments left for the profile indicated by $friend_id. get_comments returns a maximum of 50 pages of comments (about 2500). This limit was added in version 0.66 to prevent the method from "running away" if myspace changes the code for which the method looks when gathering the comments. Each list element contains: { sender => $friend_id, # friendID of the person who sent the comment date => $date_time, # As formatted on MySpace comment => $string # HTML of the comment. } Comments are returned in the order in which they appear on myspace (currently most recent first). Dies if called when not logged in. =cut sub get_comments { my ( $friend_id ) = @_; my @comments = (); my $url="http://comment.myspace.com/index.cfm?fuseaction=user.viewComments&friendID=". 
$friend_id; my $eventtarget='ctl00$Main$PagedComments$pagingNavigation1$NextLinkButton'; my $eventvalidation; my $viewstate; my $page=""; my $commentcount; $self->_die_unless_logged_in( 'get_comments' ); # only get a maximum of 50 comment pages # this should translate to 2500 comments # and also serves as a safety measure in case # the method breaks again ( $DEBUG ) && print "Getting $url\n"; $page = $self->get_page( $url ); #raise an error if its private #if($self->is_private(page => $page)) { #$self->error("cannot get comments from private profile"); #return undef; #} # find out how many comments in total if ($page->decoded_content =~ /.*Listing [\d-]+ of (\d+).*/smo){ $commentcount=$1; } else { $self->error("Could not find how many comments are on profile"); return undef; } for (my $i=1;$i<=50;$i++) { $page=$self->{current_page}; push @comments, $self->_get_comments_from_page( $page->decoded_content ); #make sure we did not get an error return undef if ($self->error); last unless ( $self->_next_button( $page->decoded_content ) ); #get value of form field eventvalidation if ($page->decoded_content =~ /id=\"__EVENTVALIDATION\" value=\"(.*?)\"/o){ $eventvalidation=$1; } else { $self->error("get_comments could not determine eventvalidation in form"); return undef; } #get value of form field viewstate if ($page->decoded_content =~ /id=\"__VIEWSTATE\" value=\"(.*?)\"/o){ $viewstate=$1; } else{ $self->error("get_comments could not determine viewstate in form"); return undef; } #create a form using these values my $htmlform=qq{
}. qq{}. qq{}. qq{}. qq{}. qq{
}; my $form=HTML::Form->parse($htmlform,"http://comment.myspace.com/index.cfm"); ( $DEBUG ) && print "try to submit form to access comments page #",$i+1,"\n"; #submit it and hope for the best $self->submit_form({form => $form,no_click=> 1,follow=>0}); # submit the form to get to next page #$self->submit_form({ # follow => 0, # form_name => "aspnetForm", # no_click => 1, # fields_ref => { __EVENTTARGET => $eventtarget, __EVENTARGUMENT => '' } # #re1 => 'something unique.?about this[ \t\n]+page', # }); # sleep ( int( rand( 2 ) ) + 1 ); } # unless(scalar (@comments) == $commentcount){ # $self->error("Could not collect all comments. Have " . @comments .", should have $commentcount"); # return undef; # } return \@comments; } sub _get_comments_from_page { # Take a page, return a list of comment data my ( $page ) = @_; my @comments = (); # Get to the comments section to avoid mis-reads if ( $page !~ m/Add Comment<\/a>/gs ) { $self->error("Comment section not found on page"); return undef; } # Read the comment data and push it into our array. while ( $page =~ s/.*?UserID=([0-9]+).*?

(.*?)<\/h4>\s*(.*?)\s*<\/textarea>//smo ) { push @comments, { sender => $1, date => $2, comment => $3 }; #print "found 1:$1\nfound 2:$2\nfound 3:$3\n"; } return @comments; } =head2 get_profile_type( $friend_id || friend_id => $friend_id || page => $page ) Can take either a friend id or a page response object and returns an integer that indicates the type of MySpace profile. The codes are as follows 1 individual profile 2 band profile (detected by looking for the MySpace Music logo) 3 film profile (detected by looking for the MySpace Film logo) 4 comedy profile (detected by looking for the MySpace Comedy logo) First we try to look for all the non-individual profiles. If these do not match, we try to make sure that we have at least a "Last Login" date on the profile to make sure that this is really an individual's profile. returns undef and sets an error if nothing of the above matches. =cut #more error checking needed sub get_profile_type { # Get and decode the page into HTML source my $page = $self->_validate_page_request( @_ ); #band profile #return 2 if ( $page->decoded_content =~ qr/x\.myspace\.com\/images\/music_logo\.gif/o ); return 2 if($self->_apply_regex( regex => 'is_music', page => $page )); #film profile #return 3 if ( $page->decoded_content =~ qr/x\.myspace\.com\/images\/film_logo\.gif/o ); return 3 if($self->_apply_regex( regex => 'is_film', page => $page )); #comedy profile #return 4 if ( $page->decoded_content =~ qr/x\.myspace\.com\/images\/comedy\/mscomedy\.gif/o ); return 4 if($self->_apply_regex( regex => 'is_comedy', page => $page )); #should be a personal profile if we have a mention of a last login date somehwhere #return 1 if ($page->decoded_content =~ qr/Last Login:/o ); return 1 if($self->_apply_regex( regex => 'last_login', page => $page )); #if non of the above applies, return an error $self->error("Could not determine type of profile"); return undef; } sub get_birthdays { =head2 get_birthdays Returns a hash of the birthdays from View 
Upcoming Birthdays as friendID => birthday, friend_id => birthday, ... Croaks if called when not logged in. Example: my ( %birthays ) = $myspace->get_birthdays; foreach my $friend ( keys( %birthdays ) ) { print "Friend ${friend}'s birthday is on ". $birthdays{"$friend"} . "\n"; } =cut $self->_die_unless_logged_in( 'get_birthdays' ); $self->_go_home or return; $self->follow_link( url_regex => qr/fuseaction\=user\.birthdays/io ) or return; my %bd=(); my $page = 1; do { my $page_source = $self->current_page->decoded_content; while ( $page_source =~ s/^.*?friendid=([0-9]+).*?birthday_icon\.gif.*?>\s*(.*?)\s* 5 ); # To prevent endless loop if below doesn't work. $self->submit_form( { form_name=>'aspnetForm', fields_ref=>{ '__EVENTTARGET' => 'ctl00$cpMain$BirthdayList$PagerTop', '__EVENTARGUMENT' => $page }, no_click => 1, } ); } while ( $self->_next_button ); return ( %bd ); } sub ____EDIT_ACCOUNT____ {} =head1 EDIT ACCOUNT =head2 get_photo_ids( %options ) Each of your profile's photos is stored using a unique ID number. This method returns a list of the IDS of the photos in your profile's photo section. The only valid option at this time is: friend_id => $friend_id Defaults to your friendID. Croaks if called when not logged in. =cut sub get_photo_ids { my ( %options ) = @_; $self->_die_unless_logged_in( 'get_photo_ids' ); my $friend_id = $options{'friend_id'} || $self->my_friend_id; $self->get_profile( $friend_id ) or return; $self->follow_link( url_regex => qr/fuseaction\=user\.viewAlbums/io ) or return; # If there's a "View All Pictures" link, click it. Otherwise it means # they only have one album (or myspace changed something again). $self->follow_link( url_regex => qr/fuseaction\=user\.viewPicture/io ); $self->error(undef); # Ignore any error we got. 
my $last_id = -1; my @photo_ids = (); my $page = $self->current_page->decoded_content; while ( $page =~ s/^.*?imageID=([0-9]+)[^0-9]//iso ) { unless ( $1 == $last_id ) { push( @photo_ids, $1 ); $last_id = $1; } } return ( @photo_ids ); } =head2 set_default_photo( photo_id => $photo_id ) Sets your profile's default photo to the photo_id specified. Example: Set your default photo to a random photo. use WWW::Myspace 0.60; my $myspace = new WWW::Myspace; my @ids = $myspace->get_photo_ids; $myspace->set_default_photo( $ids[ int( rand( @ids ) ) ] ); =cut sub set_default_photo { my ( %options ) = @_; $self->_die_unless_logged_in( 'set_default_photo' ); $self->_go_home or return; # warn "Going to Edit photos page\n"; $self->follow_link( text_regex => qr/Edit Photos/io ) or return; # Click "View All Photos". $self->follow_link( url_regex => qr/fuseaction=user\.editAlbumPhotos/io ) or return; # Click on the picture $self->follow_link( url_regex => qr/imageID=$options{'photo_id'}/i ) or return; # Click the "Set a default" button $self->submit_form( { form_name => 'aspnetForm', fields_ref => { '__EVENTTARGET' => 'ctl00$cpMain$contentHolder$editPhoto$PhotoHeader1$lbtnSetAsDefault', '__EVENTARGUMENT' => '' }, no_click => 1, } ); } # Myspace now (July 2007) numbers the submit buttons sequentially on the page. # The RE here searches for the imageID in the URL and returns the sequence number # from the "set as default" button that follows it. sub _get_photo_button_no { my ( $photo_id ) = @_; my $page = $self->current_page->decoded_content; my $re = 'imageID=' . $photo_id . 
'.*?ctl00\$Main\$ViewAndEditPhotos1\$ImageListings1\$dtImageList\$ctl([0-9]+)\$SetAsDefault'; if ( $page =~ /$re/sm ) { return $1 } $self->error( "No button for photo ID $photo_id found on page" ); return; } sub _get_photo_form_no { my ( $photo_id ) = @_; my ( @forms ) = $self->mech->forms; my $form_no = 0; foreach my $f ( @forms ) { if ( $f->find_input( 'imageID' ) ) { return $form_no if ( $f->value( 'imageID' ) == $photo_id ); } $form_no++; } $self->error( "No photo with ID $photo_id found on Edit Photos page" ); return; } sub ____FIND_PEOPLE____ {} =head1 FIND PEOPLE =head2 C Takes an email address and returns a list of the friend_ids of the owner. It does so by clicking "Search" and filling in the "Find a Friend" form with "email" selected. Example: use WWW::Myspace; my $myspace=new WWW::Myspace( auto_login=>0 ); my $email = shift; my ( @friend_ids ) = $myspace->find_friend( $email ); if ( $myspace->error ) { die $myspace->error; } elsif ( @friend_ids ) { print "${email}'s friendID is @friend_ids\n"; } else { print "Don't think $email is on myspace, sorry\n"; } =cut sub find_friend { my ( $email ) = @_; $self->error( "Must provide an email address in find_friend") unless ( $email ); $self->_go_home or return; $self->follow_to( 'http://search.myspace.com/index.cfm?fuseaction=find', '' ) or return; return unless $self->submit_form( { form_no => 2, fields_ref=>{ searchBy => 'Email', f_first_name => "$email", }, re2=>qr/find a friend/io, } ); # We'll either get: We weren't able to find a "your@email.com" on Myspace.com # or : "Results for your@email.com" if ( $self->current_page->decoded_content =~ qr/results for /io ) { return ( $self->get_friends_on_page ); } else { return; } } =head2 browse Call browse with a hashref of your search criteria and it returns a list of friendIDs that match your criteria. This is a complex form. Don't trust the defaults you see in your web browser. Easiest thing to do is paste this into your script and change the values you want. 
(This example script looks up the specified criteria and dumps a list of friendIDs in YAML). use WWW::Myspace; use YAML; my $myspace = new WWW::Myspace( human => 0, auto_login => 0 ); my @friends = $myspace->browse( { 'ctl00$Main$ctl00$Scope' => 'scopeFullNetwork', # or 'scopeMyFriends' 'ctl00$Main$ctl00$Gender' => 'genderWomen', # or 'genderMen', 'genderBoth' 'ctl00$Main$ctl00$minAge' => 18, 'ctl00$Main$ctl00$maxAge' => 35, # Marital Status 'ctl00$Main$ctl00$statusSingle' => 'on', 'ctl00$Main$ctl00$statusInRelationship' => 'off', 'ctl00$Main$ctl00$statusSwinger' => 'off', 'ctl00$Main$ctl00$statusMarried' => 'off', 'ctl00$Main$ctl00$statusDivorced' => 'off', # Here for 'ctl00$Main$ctl00$motiveDating' => 'on', 'ctl00$Main$ctl00$motiveNetworking' => 'off', 'ctl00$Main$ctl00$motiveRelationships' => 'on', # Location (there are MANY country values. Check the browse page # source (see below)). 'ctl00$Main$ctl00$country' => 'US', 'ctl00$Main$ctl00$zipRadius' => 20, 'ctl00$Main$ctl00$zipCode' => 91604, 'ctl00$Main$ctl00$region' => 'Any', # Photos 'ctl00$Main$ctl00$showHasPhotoOnly' => 'on', 'ctl00$Main$ctl00$showNamePhotoOnly' => 'on', # Leave this on for speed. 
# Ethnicity 'ctl00$Main$ctl00$asian' => 'on', 'ctl00$Main$ctl00$white' => 'on', 'ctl00$Main$ctl00$black' => 'off', 'ctl00$Main$ctl00$eastIndian' => 'off', 'ctl00$Main$ctl00$latino' => 'off', 'ctl00$Main$ctl00$midEastern' => 'off', 'ctl00$Main$ctl00$nativeAmer' => 'off', 'ctl00$Main$ctl00$ethnOther' => 'off', 'ctl00$Main$ctl00$pacIslander' => 'off', # Body Type 'ctl00$Main$ctl00$slimSlender' => 'on', 'ctl00$Main$ctl00$average' => 'off', 'ctl00$Main$ctl00$moreToLove' => 'off', 'ctl00$Main$ctl00$athletic' => 'on', 'ctl00$Main$ctl00$littleExtra' => 'off', 'ctl00$Main$ctl00$bodyBuilder' => 'off', # Height 'ctl00$Main$ctl00$Height' => 'heightBetween', # or 'heightNoPreference' 'ctl00$Main$ctl00$minFoot' => 5, 'ctl00$Main$ctl00$minInch' => 0, 'ctl00$Main$ctl00$maxFoot' => 6, 'ctl00$Main$ctl00$maxInch' => 0, # Background & Lifestyle 'ctl00$Main$ctl00$Smoker' => 'smokerBoth', # or 'smokerNo', 'smokerYes' 'ctl00$Main$ctl00$Drinker' => 'drinkerBoth', # or 'drinkerNo', 'drinkerYes' 'ctl00$Main$ctl00$straight' => 'on', 'ctl00$Main$ctl00$bi' => 'on', 'ctl00$Main$ctl00$gay' => 'off', 'ctl00$Main$ctl00$notSure' => 'off', # Education (note: all off means no preference) 'ctl00$Main$ctl00$highSchool' => 'off', 'ctl00$Main$ctl00$inCollege' => 'off', 'ctl00$Main$ctl00$gradSchool' => 'off', 'ctl00$Main$ctl00$someCollege' => 'off', 'ctl00$Main$ctl00$collegeGrad' => 'off', 'ctl00$Main$ctl00$postGrad' => 'off', # Religion 'ctl00$Main$ctl00$religion' => 'NoPreference', # Possible Values Are: # NoPreference # Agnostic # Atheist # Buddhist # Catholic # ChristianOther # Hindu # Jewish # Mormon # Muslim # Other # Protestant # Scientologist # Taoist # Wiccan # Income 'ctl00$Main$ctl00$income' => 'NoPreference', # Possible Values Are: # NoPreference # LessThan30000 # From30000To45000 # From45000To60000 # From60000To75000 # From75000To100000 # From100000To150000 # From150000To250000 # From250000ToHigher # Children 'ctl00$Main$ctl00$children' => 'NoPreference', # Possible Values Are: # NoPreference 
# IDontWantKids # Someday # Undecided # LoveKidsButNotForMe # Proud parent # Sort By (last login is good to weed out dead accounts) 'ctl00$Main$ctl00$SortBy' => 'sortByLastLogin', # Possible Values Are: # sortByLastLogin # sortByNewToMySpace # sortByDistance } ); print Dump( @friends ); I'm not sure how I'm going to make the criteria passing easier. I'm also concerned about your script breaking if they change the browse form variable names. So maybe I'll add a mapping later. The values above are current, and you can copy/paste that code, change the values, and browse away. If you need to look at values (i.e. something's not working or you need to change "Location" fields): Go to the browse page: http://browseusers.myspace.com/browse/Browse.aspx Switch to Advanced mode and enter your search criteria. View Source in your web browser and find "submit_form( { page => $BROWSE_PAGE, form_name => 'aspnetForm', no_click => 1, fields_ref => { '__EVENTTARGET' => 'ctl00$Main$advancedView', }, re1 => $re, re2 => $re, } ) or return; # Enter the search criteria and click Update $self->submit_form( { form_name => 'aspnetForm', action => $self->_browse_action( 'Update' ), fields_ref => { %{$criteria}, '__EVENTTARGET' => 'ctl00$Main$update' }, re1 => $re, re2 => $re, } ) or return; # $self->mech->form_name( "aspnetForm" )->dump; # Loop through the resulting pages getting friendIDs. my $page = 1; until ( ( $self->error ) || ( ! $self->_next_button ) ) { # Get the friends from the current page push @friends, $self->get_friends_on_page( $self->current_page->decoded_content ); # Click "Next" $page++; $self->_browse_next( $page, $re ); warn "Page: $page, friends: " . @friends . "\n"; } # Sort and remove duplicates my %friends = (); foreach my $id ( @friends ) { $friends{ $id } = 1; } return ( sort( keys( %friends ) ) ); } =head2 _browse_next( $page ) The browse form's Next button calls a JavaScript function that sets "action" and "page" in the browse form and "clicks" submit. 
So we do the same here. Called by browse to simulate clicking "next".

Takes the page number to go to and the regular expression that
submit_form should use (as both re1 and re2) to verify the pages.
Returns 0 if the form action can't be determined, otherwise whatever
submit_form returns.

=cut

sub _browse_next {

    my ( $page, $re ) = @_;

    # Get the javascript-set action for the next button post
    my $action = $self->_browse_action( "GotoPage" );
    return 0 unless $action;

    # Submit the form.
    my $submitted = $self->submit_form( {
        'form_name' => "aspnetForm",
        'action' => $action,
        'no_click' => 1,
        'fields_ref' => { page => $page },
        're1' => $re,
        're2' => $re,
#       'base' => "http://browseusers.myspace.com/",
    } );

    return $submitted;

}

=head2 _browse_action( $function_name )

Gets the action set by the specified JavaScript function on the Browse
page (the current page). Returns the full action URL, or an empty string
(and sets $myspace->error) if the function's action can't be found.

=cut

sub _browse_action {

    my ( $function ) = @_;

    # Look for the action (we need MyToken).
    # Take the capture from the match's own return list instead of
    # reading $1 afterwards: when a match fails, $1 still holds the
    # capture from some earlier successful match, which would hand back
    # a stale token.
    my ( $args ) = $self->current_page->decoded_content =~
        /function ${function}.*?theForm\.action = "Browse\.aspx(\?MyToken=[^"]+)"/is;

    unless ( $args ) {
        # Name the function we were actually asked to look for.
        $self->error("Couldn't find Javascript $function function to set action");
        return "";
    }

    return "http://browseusers.myspace.com/browse/Browse.aspx" . $args;

}

=head2 cool_new_people( $country_code )

NOTE: Myspace appears to have abandoned this method of posting
"cool new people" sometime around August of 2006. However, the .js
pages are still posted, so this method will return a list of people.
However, they are not new and maybe not even cool.
This method should be considered deprecated.

This method provides you with a list of "cool new people".
Currently Myspace saves the "cool new people" data
to a JavaScript file which is named something like this:

http://viewmorepics.myspace.com/js/coolNewPeople_us.js

Since these files are named using country codes, you'll need to provide
the ISO 3166-1 two-letter country code for the list you'd like to get.
For example, $myspace->cool_new_people( 'US' )

When called in a list context, this function returns the friend ids of the
cool folks:

    my @friend_ids = $myspace->cool_new_people( 'US' );

If you treat the return value as a hash reference, you'll get a hash keyed on
friend ids.  The values consist of hash references containing the urls of the
friend thumbnails (thumb_url) as well as their display names
(friend_user_name).  There will probably be about 200 keys returned in the
hash.

    my $cool = $myspace->cool_new_people('US');
    my %cool_new_people = %{$cool};

    %cool_new_people = {

        ...

        'friend_id' => {
            'thumb_url'         => 'url_to_jpg_here',
            'friend_user_name'  => 'friend display name here'
        },

        ...

    }

So far, we know of 4 country-specific cool new people lists: AU, CA, UK/GB and US
Submitting any of these values to the function should return valid friend ids.
If you want to check for other countries for which cool people lists may exist,
you can do something like this:

    use Locale::SubCountry;

    my $world           = new Locale::SubCountry::World;
    my %countries       = $world->code_full_name_hash();
    my @country_codes   = sort keys %countries;

    foreach my $country_code ( @country_codes ) {
        my %cool_people = $myspace->cool_new_people($country_code);
        if (%cool_people) {
            print "$country_code $countries{$country_code} has cool folks\n";
        }
        else {
            print "****** $country_code\n";
        }
    }

On failure the method sets error and returns nothing.  Locale::SubCountry
must be installed, because it is used to validate the country code.

=cut

sub cool_new_people {
    my $country_code = shift;

    # Treat a missing code like an empty one so it is rejected below with
    # the usual message instead of raising "uninitialized" warnings.
    $country_code = '' unless defined $country_code;

    my $country_code_uc = "\U$country_code";
    my %cool_people = ();

    $self->error(0); # Lets the calling script check for error being true.

    # special case for UK
    $country_code_uc = 'GB' if ( $country_code_uc eq 'UK' );

    # Get a list of valid country codes.  The module is loaded lazily, and
    # a load failure is reported as such rather than being mistaken for an
    # invalid country code.
    my %countries;
    my $loaded = eval {
        require Locale::SubCountry;
        my $world = Locale::SubCountry::World->new;
        %countries = $world->code_full_name_hash();
        1;
    };
    unless ( $loaded ) {
        $self->error(
            "Unable to load Locale::SubCountry to validate country code: $@"
        );
        return;
    }

    unless ( exists $countries{$country_code_uc} ) {
        $self->error( qq[You supplied: $country_code You must supply a valid 2 character country code. For example cool_new_people('US')] );
        return;
    }

    # The file name is built from the code as supplied (lower-cased), not
    # from the validated one, so 'UK' requests coolNewPeople_uk.js.
    my $country_code_lc = "\L$country_code";
    my $javascript_url =
        'http://viewmorepics.myspace.com/js/coolNewPeople_'.
        $country_code_lc.'.js';

    # get_page helps circumvent myspace errors by checking for
    # errors and trying many times. We might not want to do that here
    # (since we could have a country code that's not working, etc),
    # so fetch the file directly.
    my $res = $self->mech->get( $javascript_url );

    unless ( $res->is_success ) {
        if ( $res->code == 404 ) {
            # Reported through error only; execution falls through and
            # the response body is still scanned below.
            $self->error("Unable to find cool new friends for $country_code_uc ($countries{$country_code_uc})");
        }
        else {
            # don't die in modules, scripters will be mad. :)
            $self->error( $res->status_line . " $javascript_url\n" );
            return;
        }
    }

    # One coolNewPerson(...) constructor call per person.
    my $html = $res->decoded_content;
    foreach my $line ( split( /\n/, $html ) ) {
        if ( $line =~ /new coolNewPerson\('(.*?)', '(\d*?)', '(http.*?)'/ ) {
            $cool_people{$2} = { friend_user_name => $1, thumb_url => $3 };
        }
    }

    return
        LIST        { keys %cool_people }
        HASHREF     { \%cool_people }
    ;
}

=head2 get_friends( %options )

NOTE: As of version 0.59, "source => inbox" has been removed
due to a formatting change in Myspace.com.  Use the "friends_who_emailed"
method instead.

This method is a complete re-write as of version 0.62.  Please see the
Changes file.

Returns, as a list of friendIDs, all of your friends. It does not include
Tom, because he's everybody's friend and when you're debugging your band
central CGI page it's probably best to limit your mistakes to actual friends.

    # Simplest form - gets your friends.
    @friends = $myspace->get_friends;

    # Advanced form
    @friends = $myspace->get_friends(
        source => 'group',  # 'profile', 'group', 'inbox', or ''
        id => $group_id,    # friendID or groupID as appropriate
        start_page => $start_page # Start on this page.
Starts on page 1 if not included.
        end_page => $end_page,  # Stop on this page. Goes to last page if not included.
        max_count => 300,  # Number of friends to return
    );

Accepts the following options:

    source:    "profile" or "group"
               If not specified, gets your friends.
               profile: Get friends from the profile specified by
                   the "id" option.
               group: Get the friends from the group specified by
                   the "id" option.
    id:        The friendID or groupID (depending on "source").
               "id" is only needed for "profile" or "group".
               (See the "friends_in_group" method for more info).
    start_page: Start on this page.
    end_page:  Stop on this page.
               $myspace->get_friends( end_page => 5 );
               If not specified, gets all pages.
               See note below about interaction with other options.
    max_count: Return this many friendIDs.
               $myspace->get_friends( max_count => 300 );
               Stops searching and returns when max_count is reached.
               (See note below).
    exclude:   Ignored as of version 0.62. Previous versions took this as
               a list of friends to exclude.

If you specify max_count and end_page, get_friends will stop when it
hits the earliest condition that matches.

max_count may return up to 40 more friends than you specify. This is
because it reads each friend page, and returns when it's gathered
max_count or more friends (and there are 40 per page).

Myspace trivia: The friends on friends lists are sorted by friendID.

Croaks if called with no arguments (i.e. to get your friends)
and you're not logged in.

=cut

# This re-write of get_friends "correctly"
# handles paging through the friends pages the same way a browser does.
# Current issues are:
# - "source" handling is sloppy. This should really be separate methods.
# - Doesn't handle exclusions.
# - No real error checking.
#
sub get_friends {
    my ( %options ) = @_;

    my @friends = ();
    my $exclude = "";
    my $page_no = 1;

    # This should be split into "get_my_friends", "get_profile_friends",
    # and "get_group_friends".
    if ( ! defined $options{'source'} ) {
        # Our own friends: home page, then the "view friends" link.
        $self->_go_home;
        $self->follow_link(
            url_regex => qr/fuseaction=user\.viewfriends/io,
            re => 'View All Friends',
        );
    }
    elsif ( $options{'source'} eq 'group' ) {
        # Group listing is disabled until it gets its own method (the
        # members form is different).  The page to start from was
        # http://groups.myspace.com/index.cfm?fuseaction=groups.viewMembers&groupID=<id>
        # with zero-based page numbers.
        warn "Can't get friends from group due to change in myspace until method is updated.";
        # Bare return: an empty list in list context, undef in scalar.
        return;
    }
    elsif ( $options{'source'} eq 'profile' ) {
        $self->get_profile( $options{id} );

        # Check first whether there are friends at all;
        # if not, return zero friends.
        if ( $self->current_page->decoded_content =~
                qr/Invite Your Friends Here/o ) {
            return ( @friends );
        }
        else {
            $self->follow_link(
                url_regex => qr/fuseaction=user\.viewfriends/io
            );
            $exclude = $options{id}; # Exclude the owner's ID (bit of a hack).
        }
    }

    return if $self->error;

    #TODO: This should be "_get_friends", called by the above methods.
    while (1) {
        # Collect this page unless we're still before start_page.
        push ( @friends, $self->get_friends_on_page( '', $exclude ) )
            unless ( $options{start_page} &&
                     ( $page_no < $options{start_page} ) );

        #TODO: This needs to try harder - maybe check the number of pages
        # and if we're not on the last one, keep trying a certain number
        # of times.  Currently, it's likely we'll only get part of the
        # friend list.
        last unless $self->_next_button;

        # end_page is inclusive: stop once that page has been read.
        last if ( $options{'end_page'} &&
                  ( $page_no >= $options{'end_page'} ) );

        # Compare the number of friends gathered (not the last index).
        last if ( $options{'max_count'} &&
                  ( scalar( @friends ) >= $options{'max_count'} ) );

        $page_no++;

        # If the pager post fails we would keep re-reading the same page,
        # so stop and return what we have.
        $self->submit_form( {
            form_name => 'aspnetForm',
            no_click => 1,
            re2 => 'View All Friends',
            fields_ref => {
                '__EVENTTARGET' => 'ctl00$cpMain$pagerTop',
                '__EVENTARGUMENT' => $page_no
            },
        } ) or last;
    }

    return ( @friends );
}

#---------------------------------------------------------------------
# friends_from_profile( friend_id );

=head2 friends_from_profile( %options )

Returns a list of the friends of the profile(s) specified by the "id" option.
id can be a friendID or a reference to an array of friendIDs.
If passed a list of friend IDs, scans each profile and returns a sorted,
unique list of friendIDs. Yes, that means if you pass 5 friendIDs and they
have friends in common, you'll only get each friendID once.
You're welcome.

Also accepts the same options as the get_friends method
(end_page, max_count, etc).
Examples:

    # Band 12345 and 54366 sound like us, get their friends list
    @similar_bands_friends=
        $myspace->friends_from_profile( id => [ 12345, 54366 ] );

    # Get the first 500 friends from profile 12345
    @friends = $myspace->friends_from_profile(
        id => 12345,
        max_count => 500
    );

    # A further example:
    # Before you do anything with these ids, make sure you don't already
    # have them as friends (uses the "exclude" option in get_friends,
    # which is very efficient as friends are excluded as they're read
    # instead of afterwards):
    # NOTE: get_friends documents "exclude" as ignored as of version 0.62,
    # so filter the returned list yourself if you need this.
    my @current_friends = $myspace->get_friends;
    die $myspace->error if $myspace->error;

    my @potential_friends = $myspace->friends_from_profile(
        id => [ 12345, 54366 ],
        exclude => \@current_friends
    );

=cut

sub friends_from_profile {
    my ( @args ) = @_;

    # Nothing to scan.
    return () unless @args;

    # Check for old format ( @friend_ids ) or new ( id => \@friend_ids ).
    my %options;
    if ( defined $args[0] && $args[0] =~ /^[0-9]+$/ ) {
        %options = ( id => [ @args ] );
    }
    else {
        %options = @args;
    }

    # "id" is an arrayref or a single number.  Both it and "source" are
    # ours to set, so remove them from what is passed through; deleting
    # "source" unconditionally keeps a false value from overriding
    # 'profile' below.
    my $id_option = delete $options{'id'};
    delete $options{'source'};

    my @profiles = grep { defined }
        ( ref $id_option ? @{ $id_option } : ( $id_option ) );

    # Get the friendIDs, stopping at the first profile that fails.
    my %friend_ids;
    foreach my $id ( @profiles ) {
        my @found = $self->get_friends(
            %options,
            source => 'profile',
            id     => $id,
        );

        # Skip the undef get_friends can hand back on failure.
        $friend_ids{"$_"} = 1 foreach grep { defined } @found;

        last if ( $self->error );
    }

    # Sort and return (the hash also removes duplicates from multiple
    # profiles).
    return ( sort( keys( %friend_ids ) ) );
}

#---------------------------------------------------------------------

=head2 friends_in_group( group_id );

Convenience method: Same as calling
"get_friends( source => 'group', id => $group_id )".

Returns a list of the friend IDs of all people in the
group identified by group_id. Tom is disincluded as in get_friends
(because the same routine is used to get the friendIDs).
Example:

    my @hilary_fans = $myspace->friends_in_group( 100011592 );

@hilary_fans now contains the friendID of everyone in the Hilary Duff
Fan Club group (group ID 100011592 ).

To get the group ID, go to the group page in WWW::Myspace and look at the URL:
http://groups.myspace.com/index.cfm?fuseaction=groups.viewMembers&GroupID=100011592&adTopicId=&page=3

The group ID is the number after "GroupID=".

=cut

sub friends_in_group {
    # With no group ID there is nothing to look up, so hand back an
    # empty list.  (Could be argued that we should croak here.)
    if ( ! @_ ) {
        return ();
    }

    my ( $group_id ) = @_;

    # get_friends does the real work.
    return $self->get_friends( id => $group_id, source => 'group' );
}

#---------------------------------------------------------------------
# friends_who_emailed();
# Return a list of friends with mail in the inbox.

=head2 friends_who_emailed

Convenience method. Reads messages from "inbox" method and
returns a list of senders.  This used to be the same as calling
"get_friends( source => 'inbox' )", but Myspace changed the way
the inbox paging worked and it was more practical to read from the inbox
method.  Changed in 0.59.

Returns, as a list of friend IDs, all friends with messages
in your inbox (mail). Note that this only tells you who you have mail from,
not how many messages, nor does it contain any method to link to those
messages. Use "inbox" for that.
This method is primarily designed to aid in auto-responding programs
that want to not contact (comment or email) people who have sent
messages so someone can attend to them personally.  Frankly, it was
written before "inbox" and may be deprecated in the future.

Croaks if you're not logged in.

    @friends = $myspace->friends_who_emailed;

=cut

sub friends_who_emailed {
    $self->_die_unless_logged_in( 'friends_who_emailed' );

    my $inbox = $self->inbox;

    # Tally messages per sender; only the keys (the sender friendIDs)
    # are returned.
    my %count_for;
    foreach my $mail ( @{ $inbox } ) {
        $count_for{ $mail->{sender} } += 1;
    }

    return ( sort( keys( %count_for ) ) );
}

=head2 search_music

Search for bands using the search music form.
Takes a hashref containing field => value pairs that are passed directly
to submit_form to set the search criteria.

 http://musicsearch.myspace.com/index.cfm?fuseaction=music.search

The easiest way I've found to get your values is to fill them in on the
search form, click "Update", then look at the page source.  Scroll to the
bottom where "PageForm" is and you'll see the values you selected. Put the
pertinent ones (i.e. things you changed) into your script. Note that
the field *names* are different, so just take the values, and use the
names as described below.

Any value the form can take (present or future) can be passed, so in theory
you could write a CGI front-end also that just had the form, posted the values
to itself, then used those values to call this method (i.e. do what I suggested
above automatically).

Here are the currently available form labels/values (looking at the form
helps):

 genreID: See the form for values

 search_term:
    0: Band Name
    1: Band Bio
    2: Band Members
    3: Influences
    4: Sounds like

 keywords: text field. Use it if you're searching by band name, etc.

 Country: Labeled "Location" in the form. See the form source for values.

 localType: The radio buttons. Set to:
    countryState: To search by Country / State
    distanceZip: To search by distance and zip code.

 if localType is "countryState", set this:
    state: State code (like the post office uses, thankfully. See form code
           if you have any questions).

 If localType is "distanceZip", set these:
    zip: The 5-digit zip code.
    distance: Distance from zip code [0|5|10|20|50|100|500]. 0="Any" and is the
              default.

 OrderBy: [ 5 = Plays | 4 = Friends |3 = New | 2 = Alphabetical ]
          Default is 2.

IMPORTANT: Results are currently sorted by friendID regardless of the OrderBy
setting.
For those who care about details, here's how the Search Music page works:

There are three forms on the page, the generic "search" form in the nav bar, a
second form called "myForm" that is the user-modified update form, and
a third form called "PageForm" that is actually used to pass the values.
PageForm is updated with the values after "update" is clicked in myForm.
Clicking "Next" just sets (using JavaScript in Myspace) the page value in
PageForm and submits PageForm. Oddly enough, PageForm ends up being a
"GET", so you could theoretically just loop through using URLs.
But we don't, we fill in the form like a browser would.

In list context search_music returns the sorted friendIDs found; as a hash
reference it returns a hash keyed on friendID whose values hold the
"page_no" the friend was found on.  Returns nothing if the search form could
not be submitted.

=cut

# And now this is compiled only once, not potentially 4 times.  This would be
# a good candidate to put at the top?
our $page_verify_re = qr/Music.*?».*?Search Results.*<\/html>/o;

sub search_music {
    my ( $sc ) = @_;

    # Page verification RE
    my $re = $page_verify_re;

    # First fill in the search form with their criteria.
    $self->submit_form( {
        page => 'http://musicsearch.myspace.com/index.cfm?fuseaction=music.search',
        form_no => 1,
        fields_ref => $sc,
        re1 => $re,
        re2 => $re,
#        base => 'http://musicsearch.myspace.com/'
    } );

    # Bare return: empty list in list context, undef in scalar context.
    return if $self->error;

    # Get the friends
    my $page_no = 0;
    my %friends = ();
    do {
        # Get the friends on this page
        foreach my $id ( $self->get_friends_on_page ) {
            $friends{ "$id" } = { 'page_no' => $page_no+1 };
        }

        # Click "Next".
        $page_no++;

        # Progress output is debugging aid only; keep a library quiet on
        # STDOUT unless debugging is switched on.
        ( $DEBUG ) && print "Getting page " . $page_no . "\n";

        $self->submit_form( {
            'form_name' => 'PageForm',
            no_click => 1,
            'fields_ref' => { page => $page_no },
            're1' => $re,
            're2' => $re,
#            base => 'http://musicsearch.myspace.com/',
        } );

    } until ( ( $self->error ) || ( ! $self->_next_button ) );

    # Clean up and return
    return
        LIST { sort( keys( %friends ) ) }
        HASHREF { \%friends }
    ;
}

sub ____CONTACT_PEOPLE____ {}

=head1 CONTACT PEOPLE

These methods interact with other users.
=cut #--------------------------------------------------------------------- =head2 post_comment( $friend_id, $message ) Post $message as a comment for the friend identified by $friend_id. The routine confirms success or failure by reading the resulting page. It returns a status string as follows: P => Passed! Verification string received. PA => Passed, requires approval. FF => Failed, you must be someone's friend to post a comment about them. FN => Failed, network error (couldn't get the page, etc). FC => Failed, CAPTCHA response requested. FI => Failed, Invalid friendID. FL => Failed, Add Comment link not found on profile page. F => Failed, verification string not found on page after posting. Warning: It is possible for the status code to return a false "Failed" if the form post is successful but the resulting page fails to load. If called in scalar context, it returns the status code. If called in list context, returns the status code and the description. EXAMPLE: use WWW::Myspace; my $myspace = new WWW::Myspace; foreach $id ( $myspace->friends_who_emailed ) { $status = $myspace->post_comment( $id, "Thanks for the message!" ) } # Get a printable status (and print it) ( $status, $desc ) = $myspace->post_comment( $id, "Thanks for being my friend!" ); print "Status of post: $desc\n"; post_comment loads $friend_id's profile page, clicks the "Add Comment" link, fills in, posts, and confirms a comment. If $friend_id is a non-true value (i.e. "0" or ''), post_comment will search for and click an "Add Comment" link on the last page loaded. This lets you do this without double-loading the profile page wasting time and bandwidth: $myspace->get_profile( $friend_id ); if ( $myspace->current_page->decoded_content =~ /something special/ ) { $myspace->post_comment( 0, "Your page is special!" ); } If called when you're not logged in, post_comment croaks to make you look stupid. See also the WWW::Myspace::Comment module that installs with the distribution. 
=cut

sub post_comment {
#    warn "post_comment disabled due to change in myspace code until method can be updated."
#    return undef;

    my ( $friend_id, $message, $captcha_response ) = @_;
    my $status = ""; # Our return status
    my ( $submitted, $link );

    $self->_die_unless_logged_in( 'post_comment' );

    # Check data.  A false but defined friend_id (0 or '') is allowed: it
    # means "use the Add Comment link on the page that is already loaded".
    croak "Must pass friend_id and message to post_comment" unless
        ( defined( $friend_id ) && ( $message ) );

    my %status_codes = (
        P   =>  'Passed! Verification string received.',
        PA  =>  'Passed, requires approval.',
        FF  =>  'Failed, you must be someone\'s friend to post a comment about them.',
        FN  =>  'Failed, network error (couldn\'t get the page, etc).',
        FC  =>  'Failed, CAPTCHA response requested.',
        FI  =>  'Failed, Invalid FriendID.',
        FL  =>  'Failed, Add Comment link not found on profile page.',
        F   =>  'Failed, verification string not found on page after posting.',
    );

    # "last TESTBLOCK" leaves with $status already set to a failure code.
    TESTBLOCK: {
        unless ( $captcha_response ) {
            # Convert newlines (\n) into socket-ready CRLF ASCII characters.
            # This also takes care of possible literal "\n"s that come
            # from command-line arguments.
            $message =~ s/(\n|\\n)/\015\012/gos;

            # Myspace bug fix:
            $message .= "\n ";

            # If we have a friendID, load the profile
            if ( $friend_id ) {
                $self->get_profile( $friend_id );
                if ( $self->error ) {
                    $status='FN';
                    last TESTBLOCK;
                }
            }

            # Submit the comment to $friend_id's page
            $link = $self->mech->find_link(
                text_regex => qr/^add\s+comment$/io
            );
            unless ( $link ) {
                $status="FL";
                last TESTBLOCK;
            }

            ( $DEBUG ) && print "Getting comment form..\n";
            $submitted = $self->submit_form( {
                page => $link->url,
                follow => 1,
                form_name => 'aspnetForm',
                fields_ref => {
                    'ctl00$cpMain$postComment$commentTextBox' => "$message",
                    '__EVENTTARGET' =>
                        'ctl00$cpMain$postComment$postcommentImageButton',
#                    '__EVENTARGUMENT' => '',
                },
                re1 => 'comment_p1',
                re2 => 'comment_p2'
            } );

            # If we posted ok, confirm the comment
            if ( $submitted ) {
                my $captcha_result="";
                my @captcha=();

                # See if there's a CAPTCHA response required, if so,
                # deal with it or fail appropriately.
                if ( $self->current_page->decoded_content =~ $CAPTCHAi ) {
                    # Remember the image URL so the "captcha" method can
                    # return it to the caller.
                    $self->captcha( "$1" );
                    #TODO: Not tested - comment captcha may be on a separate form?
                    $captcha_result = $self->_handle_captcha( $1 );
                    unless ( $captcha_result ) {
                        $status='FC';
                        last TESTBLOCK;
                    }
                    @captcha = ( 'CAPTCHAResponse' => $captcha_result );
                }

                # Otherwise, confirm it.
                ( $DEBUG ) && print "Confirming comment...\n";
                $submitted = $self->submit_form( {
                    follow => 1,
                    form_name => 'aspnetForm',
                    button => 'ctl00$cpMain$postComment$ConfirmPostButton',
                    @captcha
                } );
            }
            else {
                $self->error(
                    'First submit failed in post_comment with error: '.
                    $self->error
                );
            }
        }
        else {
            # Post the confirmation
            $submitted = $self->submit_form( '', 1, '',
                { 'CAPTCHAResponse' => $captcha_response } );
        }

        # Get the resulting page and clean it up (strip whitespace)
        my $page = $self->current_page->decoded_content;
        $page =~ s/[ \t\n\r]+/ /g;

        # Set the status code to return.  Page-level errors are checked
        # before the submit result so they are reported specifically.
        if ( $self->_apply_regex( source => $page,
                                  regex => 'not_friend_error' ) ) {
            $status="FF";
        }
        elsif ( $self->_apply_regex( source => $page,
                                     regex => 'is_invalid' ) ) {
            $status="FI";
        }
        elsif (! $submitted ) {
            $status="FN";
        }
        elsif ( $self->_apply_regex( source => $page,
                                     regex => 'comment_posted') ) {
            $status="P";
        }
        elsif ( $self->_apply_regex( source => $page,
                                     regex => 'comment_approval_msg' ) ) {
            $status = "PA";
        }
        else {
            $status="F";
        }
    }

    return (
        LIST { $status, $status_codes{$status} }
        SCALAR { $status }
    );
}

=head2 captcha

If post_comment returns "FC", the "captcha" method will return the URL
to the CAPTCHA image that contains the text that the user must enter
to post the comment.

Pseudo-code example of how you can use this in a CGI script:

    my $response = $myspace->post_comment( 12345, 'This is a message' );
    if ( $response eq 'FC' ) {
        # Get and display the image
        print '
\n'. "\n". '' . '' . '
'; } # Post the comment $myspace->post_comment( 12345, 'This is a message', $captcha_response ); (Use in a CGI script is currently problematic since you'll lose the Myspace object. I'll try to write a better example later. You could try doing a YAML Dump and Load of the $myspace object...) =cut field 'captcha'; #--------------------------------------------------------------------- # comment_friends( $message, $attr ) # Posts a comment to all of our friends. $attr is a hash reference # containing selection criteria. # Example: # $myspace->comment_friends( "Merry Christmas!", { 'ignore_dup' => 'Y' } ); # (Note: we don't handle the filtering here yet) =head2 comment_friends( $message ) =head2 comment_friends( $message, { 'ignore_dup' => 1 } ) This convenience method sends the message in $message to all of your friends. (Since you can only comment friends, it sends the comment to everyone you can). By default it will scan the user's profile page for a previous comment (by searching for your profile URL on the page, which also detects you if you're in their top 8 or otherwise linked to from their page). If called in the second form, it forgoes this duplicate checking (ignores duplicates), and posts anyway. Note that you'll probably want to use the WWW::Myspace::Comment module as if the process is interrupted (which is likely), this routine doesn't offer a way to recover. The WWW::Myspace::Comment module logs where comments have been left, scans for previous comments we've left on the user's page, and can stop after a specified number of posts to avoid triggering security measures. It can also be re-run without leaving duplicate comments. Of course, if you just want to whip off a quick comment to a few (less than 50) friends, this method's for you. EXAMPLE: A simple script to leave a comment saying "Merry Christmas" to everyone on your friends list: use WWW::Myspace; my $myspace = new WWW::Myspace; $myspace->comment_friends( "Merry Christmas!" 
);

=cut

sub comment_friends {
    my ( $message, $attr ) = @_;

    my $status = "";

    # Get friends
    my @friends = $self->get_friends;

    # Loop and post
    foreach my $friend_id ( @friends ) {
        # If we can ignore duplicates or we haven't commented them already,
        # post the comment.
        if ( ( $attr->{'ignore_dup'} ) ||
             ( ! $self->already_commented( $friend_id ) ) ) {
            $status = $self->post_comment( $friend_id, $message );
        }
    }

    return;
}

#---------------------------------------------------------------------
# already_commented( $friend_id );
# Return true if we've previously left a comment for this person.

=head2 already_commented

Returns true if there is a link to our profile on "$friend_id"'s page.
(If we've left a comment, there'll be a link).

Note that if you're friends with this person and they have another link
to your profile on their page, this will return true, even though
you may not have left a comment.

If the profile can't be loaded, returns true with error set, so that
callers don't post to a page they couldn't check.

EXAMPLE

  use WWW::Myspace;
  my $myspace = new WWW::Myspace;

  foreach $friend_id ( $myspace->get_friends ) {
      unless ( $myspace->already_commented( $friend_id ) ) {
        $myspace->post_comment(
            $friend_id,
            "Hi, I haven't commented you before!"
        )
      }
  }

already_commented croaks if called when you're not logged in.

=cut

sub already_commented {
    my ( $friend_id ) = @_;

    $self->_die_unless_logged_in( 'already_commented' );

    # Get the page.  Check for failure before touching the response, so
    # a failed load can't end in a method call on a missing response.
    my $res = $self->get_profile( $friend_id );

    # If we got an error, return a false true (but error is set)
    if ( $self->error || ! $res ) {
        $self->error( "Unable to load profile $friend_id" )
            unless $self->error;
        return 1;
    }

    my $page = $res->decoded_content;

    # If $self->my_friend_id isn't set for some reason, this'll return
    # a false "true", so set error.
    my $fr_id = $self->my_friend_id;
    if ( $fr_id ) {
        $self->error(0);
    }
    else {
        $self->error( "my_friend_id is not set!" );
    }

    # We're looking for a link to our profile.  The ID must not be followed
    # by another digit, otherwise friendID=123 would also match a link to
    # friendID=1234.  Without an ID, any profile link matches (see above).
    my $link_re = $fr_id
        ? qr/${FRIEND_REGEXP}\Q$fr_id\E(?![0-9])/
        : $FRIEND_REGEXP;

    # If the link's on their page, return true, otherwise return false.
    return ( $page =~ $link_re ) ? 1 : 0;
}

=head2 get_inbox ( %options )

Returns a reference to an array of hash references that contain data
about the messages in your Myspace message inbox. The hashes contain:

 sender (friendID)
 status (Read, Unread, Sent, Replied)
 message_id (The unique ID of the message)
 subject (The subject of the message)

The messages are returned IN ORDER with the newest first to oldest last
(that is, the same order in which they'd appear if you were looking through
your inbox).

There is currently one option:

    end_msg => $message_id  # Stop and return when
                            # the message with this
                            # messageID is reached.
                            # Does NOT return message $message_id.
    end_page => $page_no    # Stop and return after reading this page.

end_msg is primarily used if you're caching your mail into a database.
This lets you get all the mail since the last message you cached.
get_inbox does not return the message matching $message_id
(because you already have it).  If there are no new messages
before $message_id, returns an empty list.

end_page will read up to and including the page specified.
So if you pass "end_page => 1", it will read only the first page of
messages.

I'm sure reading that first line made you as dizzy as it made me typing it.
I think this says it all much more clearly:

 EXAMPLE

 # This script displays the contents of your inbox.
 use WWW::Myspace;

 $myspace = new WWW::Myspace;

 print "Getting inbox...\n";
 my $messages = $myspace->inbox;

 # Display data for each message
 foreach $message ( @{$messages} ) {
   print "Sender: " . $message->{sender} . "\n";
   print "Status: " . $message->{status} . "\n";
   print "messageID: " . $message->{message_id} . "\n";
   print "Subject: " . $message->{subject} . "\n\n";
 }

(This script is in the sample_scripts directory, named "get_inbox").
EXAMPLE 2 # Read the messages since the last one we got my $last_msg = selectrow_array( "select message_id from mydatabase order by messagedate desc limit 1" ); # Sorry for the psuedocode, but hopefully you get the idea my $messages = $myspace->get_inbox( stop_at => $last_msg ) "inbox" croaks if called when you're not logged in. =cut sub get_inbox { my ( %options ) = @_; my $page=""; my $page_no = 0; my @messages = (); $self->_die_unless_logged_in( 'inbox' ); # Go home $self->_go_home or return; # Get the first page $page = $self->follow_to( $self->mech->find_link( url_regex => qr/fuseaction=mail\.inbox/i )->url, 'Mail Center.*Inbox' ) or return; # Loop until we get an empty page or there isn't a "next" link. while ( 1 ) { $page_no++; ( $DEBUG ) && print "inbox reading page $page_no\n"; # Get the message data. push @messages, $self->_get_messages_from_page( %options ); # Stop if we got to the specified message last if ( $options{'stop_at_msg'} && ( $options{'stop_at_msg'} == $messages[-1]->{message_id} ) ); # Stop if we're on the last page last unless ( $self->_next_button ); # Stop if we've reached the last page they requested last if ( $options{'end_page'} && ( $page_no >= $options{'end_page'} ) ); # Next! $self->submit_form( { form_name => 'aspnetForm', fields_ref => { '__EVENTTARGET' => 'ctl00$ctl00$Main$Main$messageList$pagingTop', '__EVENTARGUMENT' => $page_no+1 }, no_click => 1, } ); } return \@messages; } # Return a list of message data from the current page sub _get_messages_from_page { my ( %options ) = @_; my $page = $self->current_page->decoded_content; my @messages = (); while ( $page =~ s/.*?viewprofile&friendid=([0-9]+).*?(Unread|Read|Sent|Replied).*?messageID=([^&]+)&.*?>([^<]+) $1, status => $2, message_id => $3, subject => $4 } } return @messages; } =head2 inbox Here for backwards compatibility only. Use get_inbox instead. 
(Version 0.69) =cut sub inbox { $self->get_inbox( @_ ); } =head2 read_message( message_id ) Returns a hashref containing the message identified by message_id. my $message_ref = $myspace->read_message( 123456 ); print 'From: ' . $message_ref->{'from'} . .'\n' . # Friend ID of sender 'Date: ' . $message_ref->{'date'} . .'\n' . # Date (as formatted on Myspace) 'Subject: ' . $message_ref->{'subject'} .'\n' . 'Body: ' . $message_ref->{'body'} . '\n'; # Message body Croaks if you're not logged in. =cut sub read_message { my ( $message_id ) = @_; $self->_die_unless_logged_in( 'read_message' ); my %message = (); my $res = $self->get_page( 'http://messaging.myspace.com/index.cfm?'. 'fuseaction=mail.readmessage&userID='.$self->my_friend_id. '&type=inbox&messageID='.$message_id.'&fed=True', 'read mail.*body:|Mail Center.*Inbox'); return \%message if $self->error; # If we were passed a bad message ID, we'll have the inbox again if ( $res->decoded_content !~ /read mail.*Body:/smio ) { warn "Invalid Message ID\n"; return \%message; } # Include the messageID in the hash $message{'message_id'} = $message_id; # Now we have to yank data out of a messy page. my $page = $res->decoded_content; $page =~ s/[ \t\n\r]+/ /go; # Turn multiple whitespace into single space # From: $page =~ /From:.*?friendID=([0-9]+)[^0-9]/io; $message{'from'} = $1; # Date: # $page =~ /Date:.*?> ?([^<]+) ? [^<]+ <)/o; $page =~ /Date:.*?\s+([^<]+)\s?\s*Subject:\s*<.*?\s*(.*?)\s*<\/td>/smo ) { $message{'subject'} = $1; } # Body: # $res->decoded_content =~ /.*^(.*)^


/sm; # TODO: Message body works like this: # Body:This is a great message


# In real life, there's a lot of random whitespace in there. # Myspace adds three br tags after the message. # This RE looks for those tags followed by the . We do this because # it's always possible someone will include an HTML table in the message. # What we really need to do is find the matching closing tag for the body's # tag, but I'm not really sure how to easily do that, so I did this as a # workaround. $page =~ /\s*Body:\s*<\/th>\s*\s*(.*)\s+
\s*
\s*
\s*<\/td>/smo; $message{'body'} = $1; # Clean up newlines $message{'body'} =~ s/[\n\r]/\n/go; # Gotta clean white space before and after the body $message{'body'} =~ s/^\s*//so; # Before $message{'body'} =~ s/\s*$//so; # After # And they have these BR tags at the beginning of each line... # Not any more - 8/16/07 # $message{'body'} =~ s/^[ \t]*
[ \t]*//mog; # And sometimes they put them elsewhere, so we'll convert those to newlines. $message{'body'} =~ s/
/\n/mog;

    return \%message;

}

#---------------------------------------------------------------------

=head2 reply_message( $message_id, $reply_message )

Warning: This is a new, un-tested method.  If you're reading this,
it means I had to release a new version for some reason before I
got to complete the testing and documentation of this method. It "should"
work fine. Let me know if it does or not.

Reply to message $message_id using the text in the string
$reply_message. The body of the original message is appended after the
reply text.

Returns a status code:

     P: Posted. Verified by HTTP response code and reading a regexp
        from the resulting page saying the message was sent.
    FC: Failed. A CAPTCHA response was requested.
    FF: Failed. The person's profile is set to private. You must
        be their friend to message them.
    FA: Failed. The person has set their status to "away".
    FE: Failed. The account has exceeded its daily usage.
    FN: Failed. The POST returned an unsuccessful HTTP response code.
     F: Failed. Post went through, but we didn't see the regexp on the
        resulting page (message may or may not have been sent).

Example:

    my $status = $myspace->reply_message( 1234567, "Thanks for emailing me!" );

If you're not logged in? Croaks.

=cut

sub reply_message {

    my ( $id, $reply ) = @_;
    my ( $submitted, $message, $reply_message, $page );

    $self->_die_unless_logged_in( 'reply_message' );

    # Fill in the message (this is lazy...)
    # read_message hands back a hash reference, so quote its "body"
    # element rather than concatenating the reference itself (which
    # would put "HASH(0x...)" into the reply).
    $message = $self->read_message( $id );
    my $original_body =
        ( ref $message eq 'HASH' && defined $message->{'body'} )
        ? $message->{'body'}
        : '';
    $reply_message = $reply . $original_body;

    # Convert newlines (\n) into socket-ready CRLF ASCII characters.
    # This also takes care of possible literal "\n"s that come
    # from command-line arguments.
    # (Note that \n does seem to work, but this "should" be safer, especially
    # against myspace changes and platform differences).
    $reply_message =~ s/(\n|\\n)/\015\012/gos;

    # First load the message and click "Reply" (first button - it has no
    # name so this'll break if they change the button order).
    # The URL needs the message ID we were given, not the message hash.
    $submitted = $self->submit_form( {
        page => 'http://messaging.myspace.com/index.cfm?'.
            'fuseaction=mail.readmessage&userID='.$self->my_friend_id.
            '&type=inbox&messageID='.$id.'&fed=True',
        form_no => 1,
        re1 => "Read Mail"
    } );

    # See if we can mail or if there's an error.
    if ( $submitted ) {
        $page = $self->current_page->decoded_content;
        $page =~ s/[ \t\n\r]+/ /go;
        if ( $page =~ /${MAIL_PRIVATE_ERROR}/i ) {
            return "FF";
        } elsif ( $page =~ /${MAIL_AWAY_ERROR}/i ) {
            return "FA";
        }
    } else {
        return "FN";
    }

    # Post the reply
    $submitted = $self->submit_form( '', 1, '',
        { 'ctl00$ctl00$Main$Main$sendMessageControl$bodyTextBox' => $reply_message }
    );

    # Verify and return the appropriate code.
    $page = $self->current_page->decoded_content;
    $page =~ s/[ \t\n\r]+/ /g;

    # Return the result
    if (! $submitted ) {
        return "FN";
    } elsif ( $self->_apply_regex( source => $page, regex => 'verify_message_sent') ) {
        return "P";
    } elsif ( $self->_apply_regex( source => $page, regex => 'exceed_usage' ) ) {
        return "FE";
    } elsif ( $page =~ $CAPTCHAi ) {
        return "FC";
    } else {
        return "F";
    }

#   my ( $url, $form_no, $button, $fields_ref, $regexp1, $regexp2, $base_url ) = @_;

}

#---------------------------------------------------------------------

=head2 send_message( $friend_id, $subject, $message, $add_friend_button )

=head2 send_message( %options )

Options are friend_id, subject, message, atf, skip_re.

Example:

    $status = $myspace->send_message(
        friend_id => 12345,
        subject => 'Hi there',
        message => 'This is the bestest message ever!',
        atf => 0,
        skip_re => 'i hate everyone', # Skip negative people
    );

The %options hash is the "correct" method of passing arguments as of
version 0.53. The parameter based method is here for backwards-compatibility.

send_message sends a message to the user identified by "friend_id".
If "atf" is a true value, HTML code for a "View My Profile" link will
be added at the end of the message. (This was an Add To Friends button
until Myspace started munging that code).

If "skip_re" is defined, friend_id's profile will be matched against the RE.
Whitespace will be compressed and the match will NOT be case-sensitive. So you can do this: skip_re => 'i hate everyone!* ?(
)?' And it will match: I Hate EVERYONE!!!! I hate everyone
I Hate EvEryone!!!
etc.

If "friend_id" is an untrue value (i.e. 0 or ''), send_message will look
for a Send Message button (identified by a "fuseaction=mail.message" URL
if you're curious) on the current page. This lets you do this
efficiently:

    # Send a message only if the profile has "fancy regex" on their page
    $myspace->get_profile( $friend_id );
    if ( $myspace->current_page =~ /fancy regex/ ) {
        $myspace->send_message(
            subject => "Hello",
            message => "I'm messaging you"
        );
    }

    $status = $myspace->send_message(
        friend_id => 6221,
        subject => 'Hi Tom!',
        message => 'Just saying hi!',
        atf => 0
    );
    if ( $status eq "P" ) { print "Sent!\n" } else { print "Oops\n" }

Returns a status code:

    P   =>  Passed! Verification string received.
    FF  =>  Failed, profile set to private. You must be their
            friend to message them.
    FN  =>  Failed, network error (couldn't get the page, etc).
    FA  =>  Failed, this person's status is set to "away".
    FS  =>  Failed, skipped. Profile doesn't match RE.
    FE  =>  Failed, you have exceeded your daily usage.
    FC  =>  Failed, CAPTCHA response requested.
    FI  =>  Failed, Invalid friend ID.
    FL  =>  Failed, can't find Send Message link on profile page.
    F   =>  Failed, verification string not found on page after posting.

If called in list context, returns the status code and text description.

    ( $status, $desc ) = $myspace->send_message( $friend_id, $subject, $message );
    print $desc . "\n";

See also WWW::Myspace::Message, which installs along with the
distribution.

(Croaks if called when you're not logged in).

=cut

sub send_message {

    # Backwards compatibility: a purely numeric first argument means the
    # caller used the old positional form.
    my ( %options ) = ();
    if ( defined $_[0] && $_[0] =~ /^[0-9]+$/o ) {
        my ( $friend_id, $subject, $message, $atf ) = @_;
        %options = (
            friend_id => $friend_id,
            subject => $subject,
            message => $message,
            atf => $atf
        );
    } else {
        ( %options ) = @_;
    }

    my ( $submitted, $res, $page, $status );

    $self->_die_unless_logged_in( 'send_message' );

    # Human-readable text for each status code (returned in list context).
    my %status_codes = (
        P   =>  'Passed! Verification string received.',
        FF  =>  'Failed, profile set to private. You must be their '.
                'friend to message them.',
        FN  =>  'Failed, network error (couldn\'t get the page, etc).',
        FA  =>  'Failed, this person\'s status is set to "away".',
        FS  =>  'Failed, skipped. Profile doesn\'t match RE.',
        FE  =>  'Failed, you have exceeded your daily usage.',
        FC  =>  'Failed, CAPTCHA response requested.',
        FI  =>  'Failed, Invalid FriendID.',
        FL  =>  'Failed, can\'t find Send Message link on profile page.',
        F   =>  'Failed, verification string not found on page after posting.',
    );

    # Add the button if they wanted it.
    # NOTE(review): the two literals below look like they have lost their
    # HTML link markup; they are kept exactly as found - confirm against
    # a pristine copy of this module before relying on "atf".
    if ( ( defined $options{'atf'} ) && ( $options{'atf'} ) ) {
        $options{'message'} .= '

Add as friend\n';
        $options{'message'} .= '">View My Profile\n';
    }

    TESTBLOCK: {
        # If we were given a friend ID, get the profile
        if ( $options{'friend_id'} ) {
            $res = $self->get_profile( $options{'friend_id'} );

            # Without a response there is nothing to inspect or click.
            unless ( $res ) {
                $status = 'FN';
                last TESTBLOCK;
            }

            ( $DEBUG ) && print "Got profile:\n" . $res->decoded_content . "\n";

            # Skip this profile if its (whitespace-compressed) content
            # matches the caller's skip_re, case-insensitively.
            if ( $options{'skip_re'} ) {
                $page = $res->decoded_content;
                $page =~ s/[ \t\n\r]+/ /go;
                if ( $page =~ /$options{'skip_re'}/i ) {
                    $status = 'FS';
                    last TESTBLOCK;
                }
            }
        }

        # Try to get the message form
        $res = $self->mech->find_link(
            url_abs_regex => qr/fuseaction=mail\.message/io
        );

        # No Send Message link on the current page.
        unless ( $res ) {
            $status = 'FL';
            last TESTBLOCK;
        }

        ( $DEBUG ) && print "Found Send Message link: " . $res->url . "\n";

        $res = $self->follow_to( $res->url,
            'Mail\s+Center.*Send\s+a\s+Message|'.$MAIL_PRIVATE_ERROR.'|'.
            $MAIL_AWAY_ERROR.'|'.$INVALID_ID );

        # Check for network error
        if ( $self->error ) {
            $status = 'FN';
            last TESTBLOCK;
        }

        # Check for known messages that say we can't send it.
        $page = $res->decoded_content;
        $page =~ s/[ \t\n\r]+/ /go;

        if ( $page =~ /$MAIL_PRIVATE_ERROR/i ) {
            $status = 'FF';
            last TESTBLOCK;
        } elsif ( $page =~ /$MAIL_AWAY_ERROR/i ) {
            $status = 'FA';
            last TESTBLOCK;
        } elsif ( $page =~ /$INVALID_ID/i ) {
            $status = 'FI';
            last TESTBLOCK;
        } elsif ( $page =~ $CAPTCHAi ) {
            $status = 'FC';
            last TESTBLOCK;
        }

        # Convert newlines (\n) into socket-ready CRLF ASCII characters.
        # This also takes care of possible literal "\n"s that come
        # from command-line arguments.
        # (Note that \n does seem to work, but this "should" be safer, especially
        # against myspace changes and platform differences).
        $options{'message'} =~ s/(\n|\\n)/\015\012/gso;

        # Myspace bug fix:
        $options{'message'} .= "\n ";

        # Submit the message
#        if ( $page =~ /ctl00\$ctl00\$Main\$Main\$sendMessageControl\$subjectTextBox/ ) {
            # New mail form...
            $submitted = $self->submit_form( {
                form_name => 'aspnetForm',
                fields_ref => {
                    'ctl00$ctl00$Main$Main$sendMessageControl$subjectTextBox' => "$options{'subject'}",
                    'ctl00$ctl00$Main$Main$sendMessageControl$bodyTextBox' => "$options{'message'}",
                    '__EVENTTARGET' => 'ctl00$ctl00$Main$Main$sendMessageControl$btnSend',
                    '__EVENTARGUMENT' => ''
                },
                no_click => 1,
            } );
#        } else {
#            # Old mail form...  Seriously, don't get me started...
#            $submitted = $self->submit_form( '',
#                1, "",
#                { 'subject' => "$options{'subject'}",
#                  'mailbody' => "$options{'message'}"
#                }
#            );
#        }

        $page = $self->current_page->decoded_content;
        $page =~ s/[ \t\n\r]+/ /g;

        # Return the result
        if (! $submitted ) {
            $status = "FN";
        } elsif ( $page =~ $CAPTCHAi ) {
            $status = "FC"; # They keep changing which page this appears on.
        } elsif ( $self->_apply_regex( source => $page, regex => 'verify_message_sent') ) {
            $status = "P";
        } elsif ( $self->_apply_regex( source => $page, regex => 'exceed_usage' ) ) {
            $status = "FE";
        } else {
            $status = "F";
        }
    }

    # Status code alone in scalar context, code plus description in list
    # context.
    return (
        LIST { $status, $status_codes{$status} }
        SCALAR { $status }
    );

}

=head2 delete_message( @message_ids )

Deletes the message(s) identified by @message_ids. Takes a list
of messageIDs or of hashrefs with a message_id subcomponent (such
as one gets from the "inbox" method). Croaks if called when not
logged in.

Each message is deleted with its own request.

Returns true if every deletion was submitted successfully, false if
any of them failed.

Example:

    # Delete message 12345
    $myspace->delete_message( 12345 );

    # File myspace mail where it belongs.
    $all_messages = $myspace->inbox;

    $myspace->delete_message( @{ $all_messages } );

=cut

sub delete_message {

    my ( @message_ids ) = @_;

    warn "delete_message not working most of the time due to myspace bug.\n".
        "Use at your own risk.";

    my $pass = 1;

    $self->_die_unless_logged_in( 'delete_message' );

    foreach my $message ( @message_ids ) {

        # Accept either a plain message ID or a hashref with a
        # "message_id" element, as the documentation promises.
        my $message_id = ( ref $message eq 'HASH' )
            ? $message->{'message_id'}
            : $message;

        # Get the message and click "delete"
        $self->submit_form( {
            page => 'http://messaging.myspace.com/index.cfm?'.
                'fuseaction=mail.readmessage&userID='.$self->my_friend_id.
                '&type=inbox&messageID='.$message_id.'&fed=True',
            form_name => 'aspnetForm',
            button => 'ctl00$ctl00$Main$Main$ReadMessage1$DeleteButton',
            no_click => 0,
            re1 => 'Mail\s+Center.*?Read\s+Mail'
        } ) or $pass = 0;

    }

    return $pass;

}

#---------------------------------------------------------------------

=head2 approve_friend_requests( [ "message" ] )

Looks for any new friend requests and approves them.
Returns a list of friendIDs that were approved.
If "message" is given, it will be posted as a comment to the new friends.
If called when you're not logged in, approve_friend_requests will croak.

If approve_friend_requests runs into a CAPTCHA response when posting
comments, it will set $myspace->captcha to the URL of the CAPTCHA image.
If no CAPTCHA was encountered, $myspace->captcha will be 0. So you can say:

    if ( $myspace->captcha ) { print "oh no!\n" }

approve_friend_requests will approve all friends whether or not it can
comment them as it approves first, then comments the list of approved
friends.

EXAMPLES

    # Approve any friend requests
    @friends_added = $myspace->approve_friend_requests;

    # Print the number of friends added and their friend IDs.
    print "Added " . @friends_added . " friends: @friends_added.";

    # Approve new friends and leave them a thank you comment.
    @friends_added = $myspace->approve_friend_requests(
        "Thanks for adding me!\n\n- Your new friend"
    );

Run it as a cron job. :)

Note that "\n" is properly handled if you pass it literally also (i.e.
from the command line).
That is if you write this "approve_friends" script:

    #!/usr/bin/perl -w
    # usage: approve_friends [ "message" ]

    use WWW::Myspace;
    my $myspace = new WWW::Myspace;

    $myspace->approve_friend_requests( @ARGV );

And run it as:

    approve_friends "Thanks for adding me\!\!\n\n- Me"

You'll get newlines and not "\n" in the message. There, I even gave
you your script.

=cut

sub approve_friend_requests {

    my ( $message ) = @_;

    my @guids = ();
    my @friends = ();   # Every friendID seen on an approved page
    my %friends = ();   # Not a typo: de-duplicated view of @friends

    $self->_die_unless_logged_in( 'approve_friend_requests' );

    # Go Home
    $self->_go_home;
    return if $self->error;

    # Click the friend requests link. find_link gives us nothing when the
    # link is absent, so check before asking it for a URL.
    my $requests_link = $self->mech->find_link(
        url_regex => qr/fuseaction=mail\.friendRequests/io
    );
    unless ( $requests_link ) {
        $self->error( "Friend requests link not found on home page" );
        return;
    }
    $self->follow_to( $requests_link->url, 'Friend Request Manager' );
    return if $self->error;

    # As long as there are friend requests on the page,
    # select all of them and click "Approve Selected Friends"
    while ( @guids = $self->_get_friend_requests ) {

        # Get the friendIDs from the page
        my @page_friends = $self->get_friends_on_page;

        # Check the checkboxes and submit the form.
        # NOTE(review): other callers in this file pass "button", not
        # "button_name" - confirm which key submit_form honours.
        # Stop if the post fails: the page would still list the same
        # requests and we would loop forever.
        $self->submit_form( {
            form_name => 'aspnetForm',
            button_name => 'ctl00$ctl00$Main$Main$incomingRequests$ApproveSelectedRequestsButton',
            fields_ref => {
                'ctl00$ctl00$Main$Main$incomingRequests$requestRepeater$ctl00$selectRequest'
                    => \@guids
            },
            re2 => qr/Friend Request Manager/o
        } ) or last;

        # Only count friends whose approval was actually submitted.
        push( @friends, @page_friends );

    }

    # Clean up friends (there -could- be duplicates in some circumstances)
    my $captcha = 0;
    $self->captcha( 0 ); # Reset captcha so they can check it.
    foreach my $id ( @friends ) {
        $friends{"$id"}++;

        # If we're to post a message, and this isn't a duplicate,
        # post a comment to this new friend. Stop commenting once a
        # CAPTCHA request has been seen.
        if ( ( $message ) && ( $friends{"$id"} == 1 ) && ( ! $captcha ) ) {
            if ( $self->post_comment( $id, $message ) eq "FC" ) {
                $captcha = 1;
            }
        }
    }

    # Return the list of friends
    return keys( %friends );

}

#---------------------------------------------------------------------
# _get_friend_requests()
# Returns a list of friend requests from the Friend Requests page

sub _get_friend_requests
{

    # Work on a private copy of the page; each match is cut out of it so
    # the loop ends once no request checkbox is left.
    my $page = $self->current_page->decoded_content;

    my %guids = ();

    # Get the GUID codes from it.
    while ( $page =~ s/ctl00\$ctl00\$Main\$Main\$incomingRequests\$requestRepeater\$ctl00\$selectRequest.*? value="(.*?)"//im ) {
        $guids{"$1"}++;
    }

    return keys( %guids );

}

##---------------------------------------------------------------------
## _post_friend_requests( $form )
## Post the filled in friend approval form.
#
#sub _post_friend_requests
#{
#
#   my ( $f ) = @_;
#
#   $self->submit_form( {
#       form => $f,
#       button => 'ctl00$ctl00$Main$Main$incomingRequests$ApproveSelectedRequestsButton',
#       re2 => 'Friend Request Manager',
#       'die' => 1
#   } );
#
#}

#---------------------------------------------------------------------
# send_friend_request

=head2 send_friend_request( $friend_id )

IMPORTANT: THIS METHOD'S BEHAVIOR HAS CHANGED SINCE VERSION 0.25!

Sorry, I hate to break backwards-compatibility, but to keep this
method in line with the rest, I had to. The changes are:

1) It takes only one friend, it will DIE if you give it more
   (mainly to let you know that #2 has changed so your scripts don't
   think they're succeeding when they're not).

2) It no longer returns pass/fail, it returns a status code like
   post_comment.

Send a friend request to the friend identified by $friend_id. Croaks if
not logged in.

This is the same as going to their profile page and clicking
the "add as friend" button and confirming that you want to add them.

Returns a status code and a human-readable error message:

    FF  =>  Failed, this person is already your friend.
    FN  =>  Failed, network error (couldn't get the page, etc).
FL => Failed, Add Friend error clicking link on profile page FP => Failed, you already have a pending friend request for this person FB => Failed, this person does not accept friend requests from bands. FA => Failed, this person requires an email address or last name to add them FC => Failed, CAPTCHA response requested. P => Passed! Verification string received. F => Failed, verification string not found on page after posting. After send_friend_request posts a friend request, it searches for various Regular Expressions on the resulting page and sets the status code accordingly. The "F" response is of particular interest because it means that the request went through fine, but none of the known failure messages were received, but the verification message wasn't seen either. This means it -might- have gone through, but probably not. Of course, worst case here is you try again. EXAMPLES # Send a friend request and get the response my $status = $myspace->send_friend_request( 12345 ); # Send a friend request and print the result my ( $status, $desc ) = $myspace->send_friend_request( 12345 ); print "Received code $status: $desc\n"; # Send a friend request and check for some status responses. my $status = $myspace->send_friend_request( 12345 ); if ( $status =~ /^P/ ) { print "Friend request sent\n"; } else { if ( $status eq 'FF' ) { print "This person is already your friend\n"; } elsif ( $status eq 'FC' ) { print "Received CAPTCHA image request\n"; } } # Send a bunch of friend requests my @posted = (); my @failed = (); foreach my $friend ( @friends ) { print "Posting to $friend: "; my $status = $myspace->send_friend_request( $friend ) if ( $status =~ /^P/ ) { print "Succeeded\n"; push ( @posted, $friend ); } else { print "Failed with code $status\n"; push ( @failed, $friend ); } # Stop if we got a CAPTCHA request. last if $status eq 'FC'; } # Do what you want with @posted and @failed. 
Also see the WWW::Myspace::FriendAdder module, which adds multiple
friends and lets you enter CAPTCHA codes.

=cut

sub send_friend_request {

    # We had to break backwards compatibility, so enforce it.
    # (Double-quoted so the "\n"s are real newlines in the message.)
    if ( @_ > 1 ) {
        die "send_friend_request has been changed. Must use ".
            "send_friend_requests to send to multiple friends.\n".
            "Also now returns status code instead of true/false.\n".
            "perldoc WWW::Myspace for info.";
    }

    my ( $friend_id ) = @_;

    $self->_die_unless_logged_in( 'send_friend_request' );

    # Human-readable text for each status code (returned in list context).
    my %status_codes = (
        FF  =>  'Failed, this person is already your friend.',
        FN  =>  'Failed, network error (couldn\'t get the page, etc).',
        FL  =>  'Failed, Add Friend error clicking link on profile page',
        FP  =>  'Failed, you already have a pending friend request for this person',
        FB  =>  'Failed, this person does not accept friend requests from bands.',
        FA  =>  'Failed, this person requires an email address or last name to add them',
        FC  =>  'Failed, CAPTCHA response requested.',
        FE  =>  'Failed, user has exceeded their daily usage.',
        P   =>  'Passed! Verification string received.',
        F   =>  'Failed, verification string not found on page after posting.',
    );

    my $return_code = undef;
    my ($page, $res);
    my $captcha_result = "";

    TESTBLOCK: {

        # Go to their profile page
        unless ( $self->get_profile( $friend_id ) ) {
            $return_code = 'FN';
            last TESTBLOCK;
        }

        # Get the form
        unless ( $self->follow_link(
                    url_regex => qr/fuseaction=invite\.addfriend_verify/io
                 ) ) {
            $return_code = 'FL';
            last TESTBLOCK;
        }

        # Strip the page for comparisons
        $page = $self->current_page->decoded_content;
        $page =~ s/[ \t\n\r]+/ /go;

        # Check for "doesn't accept band"
        if ( $page =~ /does not accept add requests from bands/io ) {
            $return_code = 'FB';
        }

        # Check for "last name or email" required
        elsif ( $page =~ /only accepts add requests from people he\/she knows/o ) {
            $return_code = 'FA';
        }

        # Check for CAPTCHA
        #elsif ( $page =~ /CAPTCHA/o ) {
        elsif ( $page =~ $CAPTCHAi ) {
            $captcha_result = $self->_handle_captcha( $1 );
            $return_code = 'FC' unless ( $captcha_result );
        }

        # Check for "already your friend"
        elsif ( $page =~ /already your friend/io ) {
            $return_code = 'FF';
        }

        # Check for pending friend request
        elsif ( $page =~ /pending friend request/io ) {
            $return_code = 'FP';
        }

        # Check for "exceeded daily usage" message
        elsif ( $self->_apply_regex( source => $page, regex => 'exceed_usage' ) ) {
            $return_code = 'FE';
        }

        # Now see if we have a button to click.
        # MUST BE LAST.
        # (This probably could return a different code, but it means we don't
        # have a button and we don't know why).
        # XXX You may want to loop this entire statement, because currently:
        # - get_page gets a page, checking for any known error messages.
        # - this if statement checks for known errors we might receive
        # - This final statement makes sure we have a button to click so
        #   we don't bomb in "submit_form".
        # - BUT, if we get an error page get_page doesn't know (i.e. they
        #   change an error message or something), we probably
        #   want to retry this page.
        # You might want to change this whole section to:
        #   do { $res = $self->get_page ... ;
        #        $attempts++; } until ( ( $attempts > 20 ) ||
        #                               ( $page =~ /<button regex>/io ) );
        #
        # NOTE(review): the head of this test was missing from the copy
        # of the source this block was restored from; only the trailing
        # "]*>/io" of the pattern survived. The pattern below is rebuilt
        # from that tail and the warning text - confirm it against the
        # real submit-button markup before relying on it.
        elsif ( $page !~ /<input type="submit" value="Add to Friends"[^>]*>/io ) {
            $return_code = 'F';
            warn "No Add to Friends button on form!\n";
        }

        # If we got a return code above, go return it.
        last TESTBLOCK if ( $return_code );

        # Post the add request form
        if ( $captcha_result ) {
            $res = $self->submit_form( '', 1, '',
                { 'CAPTCHAResponse' => $captcha_result } );
        } else {
            $res = $self->submit_form( { form_no => 1 } );
        }

        # Check response
        unless ( $res ) {
            $return_code = 'FN';
            last TESTBLOCK;
        }

        # Unless we already have a return code (in which case we shouldn't be here)
        # check for REs on the page to see what we got.
        $page = $self->current_page->decoded_content;
        $page =~ s/[ \t\n\r]+/ /go;

        # Check for success
        if ( $page =~ /An email has been sent to the user/io ) {
            $return_code = 'P';
            last TESTBLOCK;
        }

    }

    # If we still don't have a return code, something went wrong
    unless ( $return_code ) {
        warn "No return code\n";
        $return_code = 'F';
    }

    # Status code alone in scalar context, code plus description in list
    # context.
    return (
        LIST { $return_code, $status_codes{$return_code} }
        SCALAR { $return_code }
    );

}

=head2 send_friend_requests( @friend_ids )

Send friend requests to multiple friends. Stops if it hits a
CAPTCHA request. Doesn't currently give any indication of
which requests succeeded or failed. Use the code example above
for that. Croaks if you're not logged in.

=cut

sub send_friend_requests {

    $self->_die_unless_logged_in( 'send_friend_requests' );

    # Give up at the first CAPTCHA request; later requests would only
    # hit the same wall.
    foreach my $id ( @_ ) {
        last if $self->send_friend_request( $id ) eq 'FC';
    }

}

=head2 add_to_friends

Convenience method - same as send_friend_request. This method's here
because the button on Myspace's site that the method emulates
is usually labeled "Add to Friends".

=cut

sub add_to_friends {

    $self->send_friend_request( @_ );

}

=head2 add_as_friend

Convenience method - same as send_friend_request. This method's here
Solely for backwards compatibility. Use add_to_friends or
send_friend_request in new code.
=cut

sub add_as_friend {

    $self->send_friend_request( @_ );

}

#---------------------------------------------------------------------
# delete_friend

=head2 delete_friend( @friend_ids )

Deletes the list of friend_ids passed from your list of friends.

    $myspace->delete_friend( 12345, 151133 );

Returns true if it posted ok, false if it didn't. Croaks if you're
not logged in.

Currently disabled: the method warns and returns undef without doing
anything.

=cut

sub delete_friend {

    warn "Myspace page changed - delete_friend method disabled until it can be re-written";
    return undef;

    # Everything below is unreachable until the method is re-written; it
    # is kept as it was for reference.
    # NOTE(review): the $form string pieces below are empty/whitespace
    # only - the form markup appears to be missing from this copy.

    my ( @del_friends ) = @_;
    my ( $form, $tree, $f, $res, $id );
#   my $pass=1;

    $self->_die_unless_logged_in( 'delete_friend' );

    # Get our home page.
    $self->_go_home;
    return 0 if $self->error;

    # Get the edit friends page
    $self->follow_to( $self->mech->find_link(
                url_regex => qr/fuseaction=user\.editfriends/i
            )->url
        );
    return 0 if $self->error;

    # Select the edit form and get the hash field
    $self->mech->form_name( 'friendsDelete' );
    my $hash_value = $self->mech->value( 'hash' );
    my $mytoken = $self->mech->value( 'Mytoken' );

    # Create our delete form
    $form = '

';
    $form .= '';
    $form .= '';

    foreach $id ( @del_friends ) {
        $form .= '';
    }

    $form .= ''.
        '
';

    # Turn it into an HTML::Form object
    $f = HTML::Form->parse( $form, 'http://collect.myspace.com/' );

    # Check the checkboxes
    foreach my $input ( $f->find_input( 'delFriendID' ) ) {
        $input->check;
    }

    # Submit the form
    my $attempt = 0;
    my $max_attempts = 25;
    my $request = $f->click( 'deleteAll' );
    $request->header( 'Referer' => $self->current_page->request->uri );
    do {
        $res = $self->mech->request( $request );
        $attempt++;
        $self->_traceme("Delete friend submit attempt $attempt",$res);
    } until ( ( $self->_page_ok( $res ) ) || ( $attempt > $max_attempts ) );

    # I felt guilty adding a variable even for readability so I removed $pass :)
    #unless ( $attempt <= $max_attempts) {
    #   $pass=0;
    #}

    $self->{current_page} = $res;

    return ($attempt <= $max_attempts);

}

=head2 send_event_invitation( $event_id, [ @friend_ids ] )

Send an event invitation to each friend in @friend_ids. You need to
add the event in Myspace first, then run a script that calls this
method feeding it the event ID, which you can get from the URL of the
page that lets you invite friends.

If no friend IDs are passed, send_event_invitation calls the get_friends
method and sends to all of your friends.

The method returns a reference to 2 arrays, "passed", and "failed".
Because it will probably take a long time to run, it also prints a
running report of the friends it's inviting with "Passed" or "Failed":

    Inviting 12345: Passed
    Inviting 12346: Failed

Known issue: If you already have people in your invitation list and
this method attempts to add those friends again, it will cause
substantial delays (up to a minute or two per friend ID). This is
because submit_form will receive an error message and will retry
the post 5 times for each friend.

Example:

    my ( $passed, $failed ) =
        $myspace->send_event_invitation( $event_id, @friend_ids );
    die $myspace->error if $myspace->error;

    print "Sent to:\n";
    foreach $id ( @{ $passed } ) { print $id . "\n"; }

    print "Failed to send to:\n";
    foreach $id ( @{ $failed } ) { print $id . "\n"; }

See also the send_event_invitations sample script in the sample_scripts
directory included with this distribution.

=cut

sub send_event_invitation {

    my ( $event_id, @friend_ids ) = @_;

    $self->_die_unless_logged_in( 'send_event_invitation' );

    # Default to all our friends
    unless ( @friend_ids ) {
        @friend_ids = $self->get_friends;
    }

    # Get the page. If that fails, report every requested friend as failed.
    my $res = $self->get_page(
        "http://events.myspace.com/index.cfm?fuseaction=events.invitees&eventID=".
        $event_id
    );
    return( [], \@friend_ids ) if $self->error;

    # For each friendID, fill in the form and submit it. Hey, this is
    # their idea, not mine...
    my @passed = ();
    my @failed = ();
    foreach my $id ( @friend_ids ) {
        print "Inviting $id: ";
        if ( $self->submit_form( {
                page => $res,
                form_name => 'createEvent',
                fields_ref => { 'hiddenFriends', $id }
             } ) ) {
            push( @passed, $id );
            print "Passed\n";
        } else {
            push( @failed, $id );
            print "Failed\n";
        }
    }

    return ( \@passed, \@failed );

}

=head2 send_group_invitation( $group_id, [ @friend_ids ] )

Send a group invitation to each friend in @friend_ids. You need to
add the group in Myspace first, then run a script that calls this
method feeding it the group ID, which you can get from the URL of the
group's page.

If no friend IDs are passed, send_group_invitation calls the get_friends
method and sends to all of your friends.

The method returns a reference to 2 arrays, "passed", and "failed".
Because it will probably take a long time to run, it also prints a
running report of the friends it's inviting with "Passed" or "Failed":

    Inviting 12345: Passed
    Inviting 12346: Failed

You're only allowed to send 25 invitations at a time (because
Myspace users are unpopular I guess?), so we pause for 25-30
seconds after each group of 25 to allow for clicking time so
we don't make the server mad.

Example:

    my ( $passed, $failed ) =
        $myspace->send_group_invitation( $group_id, @friend_ids );
    die $myspace->error if $myspace->error;

    print "Sent to:\n";
    foreach $id ( @{ $passed } ) { print $id . "\n"; }

    print "Failed to send to:\n";
    foreach $id ( @{ $failed } ) { print $id . "\n"; }

See also the send_group_invitations sample script in the sample_scripts
directory included with this distribution.

Croaks if called when not logged in.

=cut

sub send_group_invitation {

    my ( $group_id, @friend_ids ) = @_;

    $self->_die_unless_logged_in( 'send_group_invitation' );

    # Default to all our friends
    unless ( @friend_ids ) {
        @friend_ids = $self->get_friends;
    }

    # Get the page if we don't already have it.
    my $res;
    if ( $self->{_group_info}->{$group_id} ) {
        $res = $self->{_group_info}->{$group_id}->{invite_page};
    } else {
        $res = $self->get_page( 'http://groups.myspace.com/index.cfm?'.
            'fuseaction=groups.groupInvite&groupID='.
            $group_id );
        return( [], \@friend_ids ) if $self->error;

        # Store res in case they're looping for us.
        $self->{_group_info}->{$group_id}->{invite_page} = $res;
    }

    # For each friendID, fill in the form and submit it. Hey, this is
    # their idea, not mine...
    # We can only send 25 at a time, so pause like a user clicking the next
    # batch of friends to invite, then continue.
    my @passed = ();
    my @failed = ();
    my $post_count = 0;
    foreach my $id ( @friend_ids ) {

        # Pause once a full batch of 25 has gone out, i.e. before the
        # 26th, 51st, ... invitation (not before the 25th).
        sleep ( int( rand( 5 ) ) + 25 )
            if ( $post_count && ( ( $post_count % 25 ) == 0 ) );
        $post_count++;

        print "Inviting $id: ";
        if ( $self->submit_form( {
                page => $res,
                form_name => 'inviteForm',
                fields_ref => { 'hiddenFriends', $id }
             } ) ) {
            push( @passed, $id );
            print "Passed\n";
        } else {
            push( @failed, $id );
            print "Failed\n";
        }
    }

    return ( \@passed, \@failed );

}

=head2 post_bulletin( %options )

Post a bulletin to your friends.

    use WWW::Myspace;

    my $myspace = new WWW::Myspace;

    $myspace->post_bulletin(
        subject => $subject,
        message => $message
    );

"body" is accepted as an alternative to "message". If the "testing"
option is true, the bulletin is filled in but the final confirmation
is not submitted.

Returns true on success. On failure returns false and sets
$myspace->error.

Croaks if called when not logged in.

=cut

sub post_bulletin {

    my %options = @_;

    $self->_die_unless_logged_in( 'post_bulletin' );

    # Myspace calls the message the "body", so we'll take that too.
    if ( ( ! $options{'message'} ) && $options{'body'} ) {
        $options{'message'} = $options{'body'};
    }

    # Go home
    $self->_go_home;
    return if $self->error;
#   warn "Got home page" . "\n" if $options{'testing'};

    # Click "post bulletin"
    my $link = $self->follow_link(
        url_regex => $self->_regex( 'bulletin_url' )
    );

    unless ( $link ) {
        $self->error("Post Bulletin link not found on home page");
        return;
    }
#   warn "Found Post Bulletin link: ".$link->url . "\n" if $options{'testing'};

    # eee eee eee ooo ooo ooo !!!
    # Sorry, that's myspace programmer speak. I'll translate:
    # Instead of posting a simple form, the Post button calls a Javascript
    # routine that takes the values we entered into the main form, puts
    # them into a hidden form, sets the action of that form, and posts it.
    my $action = '';
    unless ( $action = $self->_apply_regex( regex => 'bulletin_post_action' ) ) {
        $self->error("Can't find action URL on first bulletin form page");
        return;
    }

#   print $self->current_page->decoded_content."\n\n".$action."\n";

    # Fill in and submit the form (see note below re: form number)
    my $submitted = $self->submit_form( {
#       page => $link->url,
#       follow => 1,
        form_no => 2,
        fields_ref => {
            'ctl00$cpMain$Subject_Textbox' => $options{'subject'},
            'ctl00$cpMain$Body_Textbox' => $options{'message'},
            subject => $options{'subject'},  # Seriously, don't even ask...
            body => $options{'message'},
            mode => 1,
        },
        no_click => 1,
        action => $action,
        re1 => 'bulletin_p1',
        re2 => 'bulletin_p2',
    } );

    return unless $submitted;

    # Now for the confirmation page...
    # So on this page, we have the bulletin ASP form, a separate form for
    # the Post button, and a secret little bulletinForm form.  The Post button
    # calls javascript that sets the bulletinForm's action URL and posts it.
    # Note that "bulletinForm" is identified by ID, not name, so we just specify
    # form#3 (4th form on the page). Sorry, did I mention one of those forms
    # is just a tag, embedded in another form?  So it's form 2, not 3...
#   warn "Submitting Confirmation screen";

    # Get the action
    $action = '';
    unless ( $action = $self->_apply_regex( regex => 'bulletin_confirm_action' ) ) {
        $self->error("Can't find action URL on bulletin confirmation page");
        return;
    }

    # We skip this if we're testing.
    return 1 if $options{'testing'};

    $submitted = $self->submit_form( {
        form_no => 2,
        action => $action,
        no_click => 1,
    } );

    # See if we submitted ok.
    if ( $submitted && $self->_apply_regex( regex => 'bulletin_posted' ) ) {
        return 1;
    } else {
        $self->error("Bulletin Posted verification not found - bulletin post failed ".
            "or confirmation page has changed");
        warn $self->current_page->decoded_content."\n";
        return;
    }

}

=head2 post_blog( %options )

Post a blog entry.

    $myspace->post_blog(
        subject => $subject,
        body => $body
    ) or die $myspace->error;

You can also use "message" instead of "body".

Currently only Subject and Message fields are supported. Mood,
Category, Music, etc will be left at their default settings.

Returns undef and sets $myspace->error if there's an error.

Croaks if called when not logged in, or if no subject or body is given.

=cut

sub post_blog {

    my ( %options ) = @_;

    # They can pass "message" or "body".
    if ( $options{message} ) { $options{body} = $options{message} }

    # Check for requirements.
    croak "No body passed to post_blog" unless $options{body};
    croak "No subject passed to post_blog" unless $options{subject};

    $self->_die_unless_logged_in( 'post_blog' );

    # Get the blog editor page directly. Going via links tries to load the
    # advanced editor, which doesn't help much.
    ( $DEBUG ) && warn "Getting blog editor page\n";
    $self->get_page(
        'http://blog.myspace.com/index.cfm?fuseaction=blog.create&editor=false',
        'Go To Advanced Editor'
    ) or return undef;

    # Get Mytoken. Capture straight from this match so a failed match
    # can't leave us with $1 from some earlier, unrelated regex.
    my ( $token ) =
        $self->current_page->decoded_content =~ /Mytoken=([A-Za-z0-9\-]+)/;
    $token = '' unless defined $token;

    # Fill in and post the blog
    ( $DEBUG ) && warn "Submitting initial blog form\n";
    $self->submit_form( {
        form_no => 1,
        fields_ref => {
            subject => $options{subject},
            body => $options{body},
        },
        # They use JavaScript to reset the action of the form...
        action => 'http://blog.myspace.com/index.cfm?fuseaction=blog.previewBlog&Mytoken='.
            $token,
        no_click => 1,
        re2 => 'Confirm Blog Posting'
    } ) or return undef;

    # Post the confirmation, unless we're in test mode.
    ( $DEBUG ) && warn "Posting blog confirmation\n";
    unless ( $options{testing} ) {
        $self->submit_form( {
            form_no => 1,
            action => 'http://blog.myspace.com/index.cfm?fuseaction=blog.processCreate',
            no_click => 1,
        } ) or return undef;
    }

    ( $DEBUG ) && warn "Returning Successful\n";
    return 1;

}

#---------------------------------------------------------------------
# get_friend_name( $friend_id )
# Return the first name of $friend_id, if we have it.

#sub get_friend_name {
#
#   my $self = shift;
#
#   my ( $friend_id ) = @_;
#
#   # Just select and return :)
#   my $first_mame = $self->{dbh}->selectrow_arrayref("select first_name from friends where friendid=${friend_id}");
#
#   return $first_name;
#
#}

#---------------------------------------------------------------------

sub ____CORE_INTERNAL_METHODS____ {}

=head1 CORE INTERNAL METHODS

These are methods used internally to maintain or handle basic
stuff (page retrieval, error handling, cache file handling, etc)
that you probably won't need to use (and probably shouldn't use unless
you're submitting a code patch :).

=head2 trace_func

You may pass this a code reference. If you do, it will be called
on EACH successful HTML page retrieved by this module.
The arguments passed to this code reference are: $trace_func->($where, $page)
where $where is a descriptive but curt string explaining where this page
was gotten and $page is a reference to the actual HTML.

Clever Perl programmers can use caller() (perldoc -f caller) to find out
where in the code that this page was accessed.

=cut

field trace_func => undef;

# _traceme( $where, $page )
# Passes $where and $page to the trace_func callback. Does nothing unless
# trace_func currently holds a code reference.
sub _traceme {
    my ( $where, $page ) = @_;

    my $t = $self->trace_func();
    return unless ( defined($t) && ref($t) eq "CODE" );

    $t->( $where, $page );
}

=head2 get_page( $url, [ $regexp ] )

get_page returns a reference to a HTTP::Response object that contains
the web page specified by $url. If it can't get the page, returns undef and
sets $myspace->error.

Use this method if you need to get a page that's not available
via some other method. You could include the URL to a picture
page for example then search that page for friendIDs using
get_friends_on_page.

get_page will try up to max_get_attempts times until it gets the page.
It checks for invalid HTTP response codes, and known Myspace error pages.
If called with the optional regexp, it will consider the page an error
unless the page content matches the regexp. This is designed to get past
network problems and such.

EXAMPLE

    The following displays the HTML source of MySpace.com's home page.
    my $res=$myspace->get_page( "http://www.myspace.com/" );

    print $res->decoded_content;

=cut

sub get_page {

    my ( $url, $regexp, $follow ) = @_;

    # Reset error
    $self->error( 0 );

    ( $DEBUG ) && print "Getting URL: $url\n";

    # Try to get the page up to max_get_attempts times.
    my $attempt = 0;
    my $max_attempts = $self->max_get_attempts;
    my $res;
    my %headers = ();

    # A Referer can only be sent when there is a previous page (with its
    # request) to refer from; otherwise just GET the page directly.
    my $previous = $self->{current_page};
    if ( $follow && $previous && $previous->request ) {
        %headers = ( 'Referer' => $previous->request->uri );
    }

    do {

        # Try to get the page
#        unless ( $res = $self->_read_cache( $url ) )
            $res = $self->mech->get("$url", %headers);
#        }
        $attempt++;
        ( $DEBUG ) && print "    - Attempt No: $attempt\n";
        $self->_traceme("Attempt $attempt",$res);

        # Pause 1-3 seconds between attempts when acting "human".
        sleep ( int( rand( 3 ) ) + 1 ) if $self->human;

    } until ( ( $self->_page_ok( $res, $regexp ) ) ||
              ( $attempt >= $max_attempts ) );

    # We both set "current_page" and return the value.
#    $self->_cache_page( $url, $res ) unless $self->error;
    $self->{current_page} = $res;

    # Pause 5-6 seconds after the page is loaded when acting "human".
    sleep ( int( rand( 2 ) ) + 5 ) if $self->human;

    if ( $self->error ) {
        return undef;
    } else {
        return ( $res );
    }

}

=head2 follow_to( $url, $regexp )

Exactly the same as get_page, but sets the Referer header
so it looks like you're clicking the link on the current
page instead of just GETting it directly. Use this if you're
stepping through pages.

=cut

sub follow_to {

    my ( $url, $regexp ) = @_;

    $self->get_page( $url, $regexp, 1 );

}

=head2 follow_link

This is like a robust version of WWW::Mechanize's "follow_link"
method. It calls "find_link" with your arguments (and as such takes
the same arguments). It adds the "re" argument, which is passed to
get_page to verify we in fact got the page. Returns an HTTP::Response
object if it succeeds, sets $self->error and returns undef if it fails.

    $self->_go_home;
    $self->follow_link( text_regex => qr/inbox/i, re => 'Mail Center' )
        or die $self->error;

There are a lot of options, so perldoc WWW::Mechanize and search for
$mech->find_link to see them all.

=cut

sub follow_link {

    my ( %options ) = @_;
    my $res;

    # Take out options that are just for us
    my $re = '';
    if ( $options{re} ) { $re = $options{re}; delete $options{re}; }

    # Find the link
    my $link = $self->mech->find_link( %options );

    # Follow it
    if ( $link ) {
        $res = $self->get_page( $link->url, $re, 1 );
        return $res;
    } else {
        $self->error('Link not found on page');
        return undef;
    }

}

=head2 _cache_page( $url, $res )

Stores $res in a cache.

=cut

sub _cache_page {

    my ( $url, $res ) = @_;

    $self->{page_cache}->{$url} = $res;

    $self->_clean_cache;

}

=head2 _read_cache( $url )

Check the cache for this page.

=cut

sub _read_cache {

    my ( $url ) = @_;

    if ( ( $self->{page_cache}->{$url} ) &&
         ( $self->{page_cache}->{$url}->is_fresh ) ) {
        return $self->{page_cache}->{$url};
    } else {
        return "";
    }

}

=head2 _clean_cache

Cleans any non-"fresh" page from the cache.

=cut

sub _clean_cache {

    my $cache = $self->{'page_cache'} || {};

    foreach my $url ( keys( %{ $cache } ) ) {
        # The key is only the URL string; freshness has to be asked of
        # the response object stored under that key.
        my $cached = $cache->{ $url };
        unless ( $cached && $cached->is_fresh ) {
            delete $cache->{ $url };
        }
    }

}

#---------------------------------------------------------------------
# _page_ok( $response, $regexp )
# Takes a UserAgent response object and checks to see if the
# page was successfully retrieved, and checks the content against
# known error messages (listed at the top of this file).
# If passed a regexp, it will return true ONLY if the page content
# matches the regexp (instead of checking the known errors).
# It will delay 2 seconds if it fails so you can retry immediately.
# Called by get_page and submit_form.
# Sets the internal error method to 0 if there's no error, or
# to a printable error message if there is an error.
#
# $regexp can be:
# - a key that, if passed to _regexp will return the regexp to use
# - a quoted RE
# - an RE in string form.
#
# _page_ok will pass $regexp to _regex.  If a value is returned, $regex
# will be replaced with the value.
# If $re is a string, it is converted into an RE and compared to
# the page content.
#
# Examples:
# $self->_page_ok( $res, 'you must be logged-in to do that\!.*<\/html>' )
# $self->_page_ok( $res, qr/you must be logged-in to do that\!.*<\/html>/ismo )
# $self->_page_ok( $res, 'logged_in' )

sub _page_ok {
    my ( $res, $regexp ) = @_;

    # Reset error
    $self->error(0);

    # Check for errors
    my $page_ok = 1;
    my $page;

    # If we think we're logged in, check for the "You must be logged-in"
    # error page.
    if ( ( $self->logged_in ) && ( ! $self->_check_login( $res ) ) ) {
        $self->error( "Not logged in" );
        $page_ok=0;
    }
    # If the page load is "successful", check for other problems.
    elsif ( $res->is_success ) {

        # Page loaded, but make sure it isn't an error page.
        $page = $res->decoded_content; # Get the content
        $page =~ s/[ \t\n\r]+/ /go; # Strip whitespace

        # If they gave us a RE with which to verify the page, look for it.
        if ( $regexp ) {
            # See what format it's in and convert to RE if necessary
            $regexp = $self->_regex( $regexp ) if ( $self->_regex( $regexp ) );

            # A compiled qr// stringifies starting with "(?"; anything
            # else is treated as a pattern string.
            if ( $regexp !~ /^\(\?/ ) { $regexp = qr/$regexp/i }

            # Page must match the regexp
            unless ( $page =~ $regexp ) {
                $page_ok = 0;
                $self->error("Page doesn't match verification pattern: $regexp");
#                warn "Page doesn't match verification pattern.\n";
            }

        # Otherwise, look for our known temporary errors.
        } else {
            foreach my $error_regexp ( @ERROR_REGEXPS ) {
                if ( $page =~ $error_regexp ) {
                    $page_ok = 0;
                    $self->error( "Got error page." );
#                    warn "Got error page.\n";
                    last;
                }
            }
        }

    } else {

        $self->error("Error getting page: \n" .
            " " . $res->status_line);
        $page_ok = 0;

        warn "Error getting page: \n" .
            " " . $res->status_line . "\n";

    }

    # Give the site a moment before the caller retries.
    sleep 2 unless ( $page_ok );

    return $page_ok;

}

=head2 _check_login

Checks for "You must be logged in to do that".  If found, tries to log
in again and returns 0, otherwise returns 1.

=cut

sub _check_login {
    my ( $res ) = @_;

    # Check the current page by default
    unless ( $res ) { $res = $self->current_page }

    # Check for the "proper" error response, or just look for the
    # error message on the page.
    # is_error is only a true/false test, so the numeric status has to be
    # read with code().
    if ( ( $res->code == 403 ) ||
         ( $res->decoded_content =~ $self->_regex('not_logged_in') ) ) {
        if ( $res->is_error ) {
            warn "Error: " . $res->status_line . "\n"
        } else {
            warn "Got \"not logged in\" page\n";
        }

        # If we already logged in, try to log us back in.
        if ( $self->logged_in ) { $self->site_login }

        # Return 0 so they'll try again.
        return 0;
    } else {
        return 1;
    }

}

#---------------------------------------------------------------------
# submit_form( $url, $form_no, $button, $fields_ref, [ $regexp1 ],
#     [ $regexp2 ] )
# Fill in and submit a form on the specified web page.
# $url is the URL of the page OR a reference to a HTTP::Response object.
# $form_no is the number of the form (starting at 0). i.e. if there
# are 2 forms on the page and you want to submit to the 2nd one, set
# $form_no to "1").
# $button is the name of the button of the form to press.
# $fields_ref is a reference to a hash that contains field names
# and values you want to fill in on the form.
# submit_form returns 1 if it succeeded, 0 if it fails.

=head2 submit_form( $url, $form_no, $button, $fields_ref, [ $regexp1 ], [ $regexp2 ] )

This format is being deprecated.  Please use the format below if you use
this method (which you shouldn't need unless you're writing more methods).
Be aware that I might make this method private at some point.

=head2 submit_form( $options_hashref )

 Valid options:
 $myspace->submit_form( {
    page => "http://some.url.org/formpage.html",
    follow => 1, # 0 or 1
    form_no => 1,
    form_name => "myform",  # Use this OR form_no OR form
    form => $form, # HTML::Form object with a ready-to-post form.
                   # (page, form_no, form_name, fields_ref and action will
                   # be ignored).
    button => "mybutton",
    no_click => 0,  # 0 or 1.
    fields_ref => { field => 'value', field2 => 'value' },
    re1 => 'something unique.?about this[ \t\n]+page',
    re2 => 'something unique about the submitted page',
    action => 'http://some.url.org/newpostpage.cgi', # Only needed in weird occasions
 } );

This powerful little method reads the web page specified by "page",
finds the form specified by "form_no" or "form_name", fills in the values
specified in "fields_ref", and clicks the button named "button".

You may or may not need this method - it's used internally by
any method that needs to fill in and post a form. I made it
public just in case you need to fill in and post a form that's not
handled by another method (in which case, see CONTRIBUTING below :).

"page" can either be a text string that is a URL or a reference to an
HTTP::Response object that contains the source of the page
that contains the form. If it is an empty string or not specified,
the current page ( $myspace->current_page ) is used.

"follow" indicates whether or not we're supposedly following a link
to the URL supplied in "page". If "page" isn't a URL, "follow" is
ignored. This causes "submit_form" to use the "follow_to" method
instead of "get_page" when getting the URL. This makes it look like
we clicked a link to get to this page instead of just going straight
to it.

"form_no" is used to numerically identify the form on the page. It's a
simple counter starting from 0.  If there are 3 forms on the page and you
want to fill in and submit the second form, set "form_no => 1".
For the first form, use "form_no => 0".

"form_name" is used to identify the form by name.  In actuality,
submit_form simply uses "form_name" to iterate through the forms
and sets "form_no" for you.

"form" can be used if you have a customized form you want to submit.
Pass an HTML::Form object and set "button", "no_click", and "re2"
as desired, and you can use submit_form's tenacious submission routine
with your own values.

"button" is the name of the button to submit.
This will frequently be "submit", but if they've named the button
something clever like "Submit22" (as MySpace did in their login form),
then you may have to use that.  If no button is specified (either by
button => '' or by not specifying button at all), the first button on
the form is clicked.

If "no_click" is set to 1, the form will be submitted without
clicking any button.   This is used to simulate the JavaScript form submits
Myspace does on the browse pages.

"fields_ref" is a reference to a hash that contains field names
and values you want to fill in on the form.
For checkboxes with no "value" attribute, specify a value of "on" to
check it, "off" to uncheck it.

"re1" is an optional Regular Expression that will be used to make
sure the proper form page has been loaded. The page content will
be matched to the RE, and will be treated as an error page and retried
until it matches. See get_page for more info.

"re2" is an optional RE that will be used to make sure that the
post was successful. USE THIS CAREFULLY! If your RE breaks, you could
end up repeatedly posting a form. This is used by post_comments to make
sure that the Verify Comment page is actually shown.

"action" is the post action for the form, as in:
This is here because Myspace likes to do weird things like reset
form actions with Javascript then post them without clicking form buttons.

=cut

# Flow: resolve the options (hashref or legacy positional arguments), obtain
# the HTML::Form (supplied directly, or parsed from the given/current page
# and filled in), build the request, then post it up to max_post_attempts
# times until _page_ok accepts the response.
# Returns a true value on success and a false value (with $self->error set)
# on failure.
sub submit_form {

    my ( $url, $form_no, $button, $fields_ref, $regexp1, $regexp2,
         $base_url ) = @_;

    # Initialize our variables
    my $res = "";
    my $options;
#    $base_url = $BASE_URL unless $base_url;
#    $form_no++; # For backwards compatibility.

    # Parse the options
    # Unless they passed a hashref of options, set using the
    # positional parameters.
    if ( ref $url eq "HASH" ) {
        $options = $url;
    } else {
        $options = { 'url' => $url,
            'form_no' => $form_no,
            'button' => $button,
            'fields_ref' => $fields_ref,
            're1' => $regexp1,
            're2' => $regexp2,
            'base' => $base_url,
            'page' => $url,
        };
    }

    # If they gave us a form, use it.  Otherwise, get it and fill it in.
    my $f = "";
    if ( $options->{'form'} ) {
        $f = $options->{'form'};
    } else {
        # Get the page
        if ( ref( $options->{'page'} ) eq "HTTP::Response" ) {
            # They gave us a page already
            $res = $options->{'page'};
        } elsif ( ! $options->{'page'} ) {
            $res = $self->current_page;
        } else {
            # Get the page
            ( $DEBUG ) && print "Getting $options->{page}\n";
            if ( $options->{'follow'} ) {
                $res = $self->follow_to( $options->{'page'}, $options->{'re1'} );
            } else {
                $res = $self->get_page( $options->{'page'}, $options->{'re1'} );
            }
            # If we couldn't get the page, return failure.
            return 0 if $self->error;
        }

        # Without a page there is nothing to parse a form from.
        unless ( $res ) {
            $self->error( "No page to read the form from in submit_form!" );
            return 0;
        }

        # Select the form they wanted, or return failure if we can't.
        my @forms = HTML::Form->parse( $res, $options->{'base'} );

        # The chosen index is kept in a local so that form 0 is a valid
        # answer and the caller's options hash is left untouched.
        my $index = $options->{'form_no'} || 0;

        if ( $options->{'form_no'} ) {
            unless ( @forms > $options->{'form_no'} ) {
                $self->error( "Form " . $options->{form_no} .
                    " not on page in submit_form!" );
                return 0;
            }
        }

        if ( $options->{'form_name'} ) {
            my $found;
            foreach my $candidate ( 0 .. $#forms ) {
                my $name = $forms[ $candidate ]->attr( 'name' );
                next unless ( defined $name &&
                              $name eq $options->{'form_name'} );
                $found = $candidate;
                last;
            }

            if ( defined $found ) {
                $index = $found;
            } elsif ( ! $options->{'form_no'} ) {
                # As before, a caller-supplied form_no still acts as the
                # fallback when the name isn't found.
                $self->error( "Form " . $options->{form_name} .
                    " not on page in submit_form!" );
                return 0;
            }
        }

        $f = $forms[ $index ];

        # Covers pages with no forms at all when form 0 was wanted.
        unless ( $f ) {
            $self->error( "Form " . $index . " not on page in submit_form!" );
            return 0;
        }

        # Set the action if they gave us one
        if ( $options->{'action'} ) { $f->action( $options->{'action'} ) }

        # Fill in the fields
        ( $DEBUG ) && print "Filling in form number " . $index . ".\n";
        ( $DEBUG ) && print $f->dump;

        # Loop through the fields in the form and set them.
        foreach my $field ( keys %{ $options->{'fields_ref'} || {} } ) {
            # If the field "exists" on the form, just fill it in,
            # otherwise, add it as a hidden field.
            my $input = $f->find_input( $field );
            if ( $input ) {
                if ( $input->readonly ) { $input->readonly(0) }
                $f->param( $field, $options->{'fields_ref'}->{ $field } );
            } else {
                $f = $self->_add_to_form(
                        $f, $field, $options->{'fields_ref'}->{ $field }
                    );
            }
        }
    }

    # Debugging hook: dump the prepared form and stop.
    if ( $options->{'die'} ) { print $f->dump; die }

    # Submit the form.  Try up to $max_attempts times.
    my $attempt = 0;
    my $max_attempts = $self->max_post_attempts;
    my $trying_again = 0;

    # Make our request based on our options.  Building the request can die
    # (e.g. when the named button isn't on the form), so it is trapped and
    # reported as a normal failure.
    my $request = undef;
    eval {
        if ( $options->{'button'} ) {
            $request = $f->click( $options->{'button'} );
        } elsif ( $options->{'no_click'} ) {
            # We use make_request because Myspace likes submitting forms
            # that have buttons by using Javascript. make_request submits
            # the form without clicking anything, whereas "click" clicks
            # the first button, which can break things.
            $request = $f->make_request;
        } else {
            # Just click the first button
            $request = $f->click;
        }
    };
    if ( $@ || ! $request ) {
        $self->error( $@ || "Couldn't build form request in submit_form!" );
        return 0;
    }

    # Look like we came from the page we're currently on, if there is one.
    my $current = $self->current_page;
    if ( $current && $current->request ) {
        $request->header( 'Referer' => $current->request->uri );
    }

    do
    {
        # If we're trying again, mention it.
        warn $self->error . "\n" if $trying_again;

        eval { $res = $self->mech->request( $request ); };

        # If it died (it will if there's no button), just return failure.
        if ( $@ ) {
            $self->error( $@ );
            return 0;
        }

        $attempt++;
        $trying_again = 1;
        $self->_traceme("Submit form attempt $attempt",$res);

    } until ( ( $self->_page_ok( $res, $options->{'re2'} ) ) ||
              ( $attempt >= $max_attempts ) );

    # Return the result
    $self->{current_page} = $res;

    return ( ! $self->error );

}

=head2 _add_to_form

Internal method to add a hidden field to a form. HTML::Form thinks we
don't want to change hidden fields, and if a hidden field has no value,
it won't even create an input object for it.  If that's way over your
head don't worry, it just means we're fixing things with this method,
and submit_form will call this method for you if you pass it a field that
doesn't show up on the form.

Returns a form object that is the old form with the new field in it.

    # Add field $fieldname to form $form (a HTML::Form object) and
    # set its value to $value.
    $self->_add_to_form( $form, $fieldname, $value )

=cut

sub _add_to_form {

    my ( $f, $field, $value ) = @_;

    $f->push_input( 'hidden', { name => $field, value => $value } );

    return $f;
}

#---------------------------------------------------------------------
# get_friends_on_page( $page );
# This routine takes the SOURCE CODE of the page and returns
# a list of friendIDs for which there are profile links on the page.
# Notes:
# - Our friend ID will be one of those returned, so we check for it.
# - We use the hash method because there are multiple links for each user
# (hence duplicate friendIDs will be returned). (One link for the name,
# one for their image).  This is pretty safe against changes to the page.
# - We filter out 6221, Tom's ID...

=head2 get_friends_on_page( $friends_page, $exclude );

This routine takes the SOURCE CODE of an HTML page and returns
a list of friendIDs for which there are profile links on the page.
This routine is used internally by "get_friends" to scan each of the user's
"View my friends" pages.

Notes:
 - It does not return the logged_in user's friendID.
 - We filter out 6221, Tom's ID.
 - friendIDs are returned in the order in which they appear on the page
   (note that this is new in 0.62 - in previous versions they were
   returned in an undetermined order)

If $friends_page is not specified or is '', the current page will be used.

$exclude is the number of a single friendID to exclude. This is used by
get_friends to exclude the friendID of the profile whose friends you're
getting since Myspace displays a link to that person's profile on every
page of his friend list, which would show up in the list returned
by this method.

EXAMPLE:

List the friendIDs mentioned on Tom's profile (i.e. his top 8,
people who left comments, etc):

    use WWW::Myspace;
    my $myspace = new WWW::Myspace;

    $res = $myspace->get_profile( 6221 );

    @friends = $myspace->get_friends_on_page( $res->decoded_content );
    print "These people have left comments or have links on Tom's page:\n";
    foreach $id ( @friends ) {
        print "$id\n";
    }

=cut

sub get_friends_on_page {

    my ( $page, $exclude ) = @_;

    # Default to current page
    unless ( $page ) { $page = $self->current_page->decoded_content }

    my @friend_ids = ();

    # Walk the profile links left to right.  $FRIEND_REGEXP carries one
    # capture group of its own, so the friendID is the second capture.
    # Scanning with /g visits the same links, in the same order, as
    # repeatedly cutting the matched prefix off the page, without
    # re-copying the page for every link.
    while ( $page =~ /${FRIEND_REGEXP}([0-9]+)/gi ) {
        my $friend_id = $2;

        unless ( ( ( $self->logged_in ) &&
                   ( $friend_id == $self->my_friend_id ) ) ||
                 ( $friend_id == 6221 ) ||
                 ( ( $exclude ) && ( $friend_id == $exclude ) ) ||
                 # Duplicate check: only against the ID added last
                 ( @friend_ids &&
                   ( $friend_id == $friend_ids[$#friend_ids] ) )
               ) {
            push( @friend_ids, $friend_id );
        }
    }

    return ( @friend_ids );

}

=head2 remove_cache

Remove the login cache file.
Call this after creating the object if you don't
want the login data stored:

    my $myspace = new WWW::Myspace( qw( myaccount mypassword ) );
    $myspace->remove_cache;

=cut

sub remove_cache {

    my $cache_file_path = catfile( $self->cache_dir, $self->cache_file );
    unlink $cache_file_path;

}

#---------------------------------------------------------------------
# make_cache_dir

=head2 make_cache_dir

Creates the cache directory in cache_dir. Only creates the
top-level directory, croaks if it can't create it.

    $myspace->cache_dir("/path/to/dir");
    $myspace->make_cache_dir;

This function mainly exists for the internal login method to use,
and for related sub-modules that store their cache files by
default in WWW::Myspace's cache directory.

=cut

sub make_cache_dir {

    # Make the cache directory if it doesn't exist.
    unless ( -d $self->cache_dir ) {
        # Report the system error too, so the caller can see why the
        # directory could not be created.
        mkdir $self->cache_dir or
            croak "Can't create cache directory ". $self->cache_dir .
                ": $!";
    }

}

#---------------------------------------------------------------------
# _die_unless_logged_in
# Croaks, naming $method, when the object is not logged in.

sub _die_unless_logged_in {

    my ( $method ) = @_;

    unless ( $self->logged_in ) {
        croak "$method called when not logged in\n";
    }

}

#---------------------------------------------------------------------
# _fix_textareas( $tree )
# Takes an HTML::Element node and traverses it, fixing any
# textarea elements so they have a content element.
# Bug workaround - HTTP::Request::Form will die if a textarea
# field has no content (because the parser doesn't add a
# "_content" element). So, we add one.
# The empty parens keep Spiffy from adding "my $self = shift;", so this
# is a plain function that takes the node as its first argument.

sub _fix_textareas() {

    my $x = $_[0];

    # If this is a textarea, push an empty string as the
    # content if it doesn't have any.
    if ( $x->tag eq "textarea" ) {
        $x->{_content} = [] unless defined $x->content;
    }

    # Recursively traverse the tree on our search.
    foreach my $c ($x->content_list) {
        _fix_textareas($c) if ref $c; # ignore text nodes
    }
}

#---------------------------------------------------------------------
# _get_acct()
# Get and store the login and password.
We check the user's preference # file for defaults, then prompt them. sub _get_acct { # Initialize my %prefs = (); my $ref = ""; my ( $pref, $value, $res ); my $cache_filepath = catfile( $self->cache_dir, $self->cache_file); # Read what we got last time. if ( open ( PREFS, "< ", $cache_filepath ) ) { while () { chomp; ( $pref, $value ) = split( ":" ); $prefs{"$pref"} = $value; } close PREFS; } # Prompt them for current values unless ( defined $prefs{"email"} ) { $prefs{"email"} = "" } print "Email [" . $prefs{"email"} . "]: "; $res = ; chomp $res; if ( $res ) { $prefs{"email"} = $res; } unless ( defined $prefs{"password"} ) { $prefs{"password"} = "" } print "Password [". $prefs{"password"} . "]: "; $res = ; chomp $res; if ( $res ) { $prefs{"password"} = $res; } # Make the cache directory if it doesn't exist. $self->make_cache_dir; # Store the new values. open ( PREFS, ">", $cache_filepath ) or croak $!; print PREFS "email:" . $prefs{"email"} . "\n" . "password:" . $prefs{"password"} . "\n"; close PREFS; # Store the account info. $self->{account_name}=$prefs{"email"}; $self->{password}=$prefs{"password"}; } #--------------------------------------------------------------------- # _get_friend_id( $homepage ) # This internal method stores our friend ID. We get this from the # "View Profile" link on our home page (the page we see when we # click the "Home" link in the top nav bar) sub _get_friend_id { my ( $homepage ) = @_; # Search the code for the link. This is why we like Perl. 
:) my $page_source = $homepage->decoded_content; $page_source =~ /index\.cfm\?fuseaction=user\.viewprofile\&(amp;)friendid=([0-9]+)/io; my $friend_id=$2; ( $DEBUG ) && print "Got friend ID: $friend_id\n"; # Store it $self->{my_friend_id} = $friend_id; if ( $friend_id ) { $self->error(0) } else { $self->error("Couldn't get friendID from home page") } } #--------------------------------------------------------------------- # _get_friend_page( $page, %attr_ref ) # Examples: # $self->_get_friend_page( 1, 'group', 100011592 ); # Gets the friends from page 1 (the second page) of the myspace # group with ID 100011592. # # $self->_get_friend_page( 1 ) # Get the the friends from page 1 of the logged in user's friend pages. # # $self->_get_friend_page( 1, 'inbox' ); # Gets the friends from page 1 of the logged in user's mail inbox. # # Return the content of the friend page. $page is the page number. # $id sub _get_friend_page { my ( $page, $source, $id ) = @_; my ( $url, $res, $success ); my $verify_re = ''; $source = '' unless defined $source; my $follow = 1; # Add referer header unless first page # Set the URL string for the right set of pages if ( $source eq "group" ) { $url = "http://groups.myspace.com/index.cfm?fuseaction=". "groups.viewMembers&groupID=${id}&page=${page}"; $follow = 0 if ( $page == 0 ); } else { # Make sure we got the friend page, and that we got the whole page. $verify_re = "View All Friends.*(Previous|Next).*<\/html>"; ( $DEBUG ) && print "Loading friend page $page\n"; # Unless they specified a profile to get friends from, # use our own. unless ( $source eq 'profile' ) { $id = $self->my_friend_id; } if ( $page == 1 ) { # First page $url = "http://home.myspace.com/index.cfm?". "fuseaction=user.viewfriends&". "friendID=" . $id; $follow = 0; } else { # Subsequent pages $url = "http://home.myspace.com/index.cfm?". "fuseaction=user.viewfriends&". "friendID=" . $id . "&" . "friendCount=" . $self->{_friend_count} . "&" . "userName=" . $self->{_user_name} . 
"&" . "page=" . $page . "&" . "prevPage=" . $self->{_last_friend_page} . "&" . "PREVPageFirstONERETURENED=" . $self->{_low_friend_id}."&". "PREVPageLASTONERETURENED=" . $self->{_high_friend_id}; } } # Get the page ( $DEBUG ) && print " Getting URL: $url\n"; $res = $self->get_page( $url, $verify_re, $follow ); if ( $res->decoded_content =~ /This\s+profile\s+is\s+set\s+to\s+private.\s+This\s+user\s+must\s+add\s+\s*you\s+as\s+a\s+friend\s+to\s+see\s+his\/her\s+profile./o ) { # good lord $self->error("User profile is set to private."); } # Save info if we need to unless ( $self->error ) { $self->$save_friend_info if ( ( ( $source eq '' ) || ( $source eq 'profile' ) ) && ( $page == 1 ) ); } return $res; } #--------------------------------------------------------------------- # save_friend_info # We need to grab some info off the View Friends page to feed back # to subsequent pages. my sub save_friend_info { # Get and store the friend count and user name # Friend count $self->current_page->decoded_content =~ /name="friendCount"\s+value="([0-9]+)"/io; $self->{_friend_count} = $1; warn "Didn't get friend count" unless ( $self->{_friend_count} ); # User name $self->current_page->decoded_content =~ /name="userName"\s+value="([^"]*)"/io; $self->{_user_name} = $1; warn "Didn't get user_name" unless ( $self->{_user_name} ); # Number of pages $self->current_page->decoded_content =~ /of( |\s)+{_friend_pages} ); # warn "friend_pages: " . $self->{_friend_pages}; # warn "Stored friend count " . $self->{_friend_count} . ", ". # "user name " . $self->{_user_name} . ".\n"; } =head2 _next_button Takes the source code of a page, or nothing. If nothing is passed, uses $self->current_page->decoded_content. Returns true if there is a next button on the page. 
This is so we can say:

 last unless ( $self->_next_button( $page_source ) );

or:

 while ( $self->_next_button ) { do stuff }

or

 while ( $self->_next_button ) { do stuff and click next }

One of these days I'm going write a "stuff" subroutine so I can actually type
that.

EXAMPLES

=cut

sub _next_button {

    my ( $content ) = @_;

    unless ( $content ) {
        $content = $self->current_page->decoded_content;
    }

    # NOTE(review): the entity references in this pattern (&nbsp;, &gt;,
    # &rsaquo;) had been decoded to plain characters in this copy of the
    # file; they are restored here so the pattern matches the raw page
    # source.  Confirm against the released module.
    $content =~ /">\s*Next\s*((<\/a>)?(\s|&nbsp;)+(\&gt;|>)|&rsaquo;\s*<\/a>)/io;

}

=head2 _previous_button

As you might guess, returns true if there's a "Previous" link on the page.
This is used to sanity-check functions like get_friends. If there isn't
a "Next" button, this method can be used to make sure there is a "Previous"
button.

 # Exit the loop if we're on the last page
 last unless (
   $self->_next_button( $page_source ) &&
   $self->_previous_button( $page_source )
 );

=cut

sub _previous_button {

    my ( $content ) = @_;

    unless ( $content ) {
        $content = $self->current_page->decoded_content;
    }

    # NOTE(review): "&lt;", the "<a [^>]+>" tag and "&lsaquo;" had been
    # stripped or decoded in this copy of the file, leaving a pattern that
    # could not match a link; they are restored here.  Confirm against the
    # released module.
    $content =~ /(&lt;\s*<a [^>]+>|\s*\&lsaquo;)\s*Previous\s*<\/a>/io;

}

# Simple method to count the keys in a hash
# (the count is what a caller gets in scalar context; in list context
# the keys themselves come back)
my sub count_keys {

    my ( $hashref ) = @_;

    return keys( %{$hashref} );

}

#---------------------------------------------------------------------
# _format_html( $text )
# Simple translator from text to HTML - changes newlines
# to "<br>\n".
# NOTE(review): the "<br>" had been stripped from this copy of the file
# (leaving a substitution of a newline with two newlines); restored here.

sub _format_html {

    my ( $text ) = @_;

    $text =~ s/\n/<br>\n/gs;

    return $text;

}

=head2 _go_home

Internal method to go to the home page.  Checks to see if we're already
there.  If not, tries to click the Home button on the page.  If there
isn't one, loads the page explicitly.

=cut

sub _go_home {

    # If we're not logged in, go to the home page
    unless ( $self->logged_in ) {
        $self->get_page( $BASE_URL ) or return;
        return 1;
    }

    # Are we there?
    if ( $self->mech->uri =~ /[\?&;]fuseaction=user([&;]|$)/io ) {
#        warn "I think I'm on the homepage\n";
#        warn $self->mech->uri . "\n";
        return 1;
    }

#    # No, try to click home
#    # Broken by myspace on 10/10/07 - Home page link set by Javascript.
#    my $home_link = "";
#
#    if ( $home_link = $self->mech->find_link(
#                        url_regex => qr/fuseaction=user([&;]|$|")/io
#                      )
#       ) {
#        warn "_go_home going to " . $home_link->url . "\n";
#        $self->follow_to( $home_link->url ) or return;
#        return 1;
#    }

    # Still here?  Load the page explicitly
    $self->get_page( $HOME_PAGE ) or return undef;

#    warn "I think I loaded $HOME_PAGE\n";

    return 1;

}

# _validate_page_request( [ $friend_id | friend_id => $friend_id | page => $page ],
#     [ no_validation => 1 ]);
#
# Internal method (obviously) that handles validation for methods that get
# information from a profile page.
#
# Instead of parsing a friendID and calling get_profile, you can
# just do:
#    my ( $page ) = $self->_validate_page_request( @_ );
#
# Then apply your regex to the page or do whatever else you need to do to it.
#
# Arguments are parsed as follows:
# no args: returns $self->current_page
# friend_id: calls get_profile (get_page if no_validation is specified as a true value)
#     and returns the resulting HTTP::Response object
# page: Returns the page
#
# if no_validation is set to a true value (use 1 just in case this changes in
# the future), get_profile will be told not to check for the page validation
# regex.  This is currently used by is_invalid to check for invalid profiles.
#
# You can put these docs in your method.
# Change "MY_METHOD" to the name of your
# method:
#
# =head2 C<MY_METHOD( [ friend_id => $friend_id | page => $page ] )>
# If passed no arguments, MY_METHOD parses the current page.  If passed a friend_id,
# it calls get_profile to retrieve the friend's profile page. If passed
# a page (an HTTP::Response object), it parses $page->decoded_content.

sub _validate_page_request {

    my %args = ( );

    # accept one lone parameter as an argument if it's a digit -- treat it as
    # a friend_id to keep it in line with the rest of the app
    if ( scalar @_ == 1 ) {

        my $friend_id = shift;

        if ( $friend_id && $friend_id !~ /[^0-9]/ ) {
            $args{'friend_id'} = $friend_id;
        }
        else {
            croak "if passing one parameter, please pass a valid friend_id";
        }
    }
    elsif ( scalar @_ == 0 ) {
        $args{'page'} = $self->current_page;
    }
    else {
        %args = @_;
    }

    my $page = undef;

    # A supplied page wins.  Otherwise, if they gave a friend_id, we load
    # the profile and look at it.
    if ( exists $args{'page'} && defined $args{'page'}) {
        $page = $args{'page'};
    }
    elsif ( exists $args{'friend_id'} ) {
        # Get the profile page
        # Set the no_validation argument to a definite value so we can pass it
        # through to get_profile.
        $args{'no_validation'}=0 unless $args{'no_validation'};
        my $res = $self->get_profile( $args{'friend_id'}, $args{'no_validation'} );

        # $page stays undef when get_profile reported an error.
        $page = $res unless ( $self->error );
    }
    else {
        # croak, like the other argument check above, so the error points
        # at the calling code.
        croak "You must provide either a friend_id or a response object";
    }

    return $page;

}

# _regex( $regex_key )
#
# When passed a key string, _regex returns the matching regular expression defined
# in the "regex" hash.
#
# Example:
#
# if ( $source =~ $self->_regex('is_invalid') ) {
#     print "Page matches invalid regex\n";
# }
#
#
# Note that you probably won't need to use this much since you'll be using
# _apply_regex instead. But should you need to directly match an RE that for
# some reason can't be handled in _apply_regex, use this method to keep matching
# centralized for future mods and internationalization.
sub _regex {

    my $requested = shift;

    return $regex{$requested} if ( exists $regex{$requested} );

    # Unknown key: return nothing explicitly (undef in scalar context)
    # instead of leaking the value of the failed "exists" test.
    return;

}

# _apply_regex( page => $res_object,
#               source => $page_text,
#               regex => $regex_reference
#   );
#
# _apply_regex provides a centralized source for matching regular expressions on
# pages against the centralized "regex" hash. It returns a true value if the
# page or source contains the regex. If the RE contains parentheses and $1 is
# true, returns $1; otherwise returns 1. Returns nothing (undef in scalar
# context) if the key is not in the "regex" hash or nothing matched.
#
# page: An HTTP::Response object (optional)
# source: A string containing text (i.e. the HTML source of a page) against
#     which the regex should be matched (optional)
# regex: A string that must match the keys to the appropriate regex.
#
# If neither page nor source are specified, _apply_regex will apply the regex to
# $self->current_page->decoded_content (that is, to the current page).
#
# Example:
#
# my $private = $self->_apply_regex(
#     page => $page,
#     regex => 'is_private',
# );
#
# if ( $private ) { return 1 } else { return 0 }
#
#
#
# Example 2:
#
# my $source = $self->current_page->decoded_content;
#
# if ( $self->_apply_regex(
#         source => $source,
#         regex => 'is_invalid'
#      )
#    ) { print "Source matches invalid regex\n"; }
#
#
# Note that technically you could include both "page" and "source" arguments.
# "page" would be tested first and if it didn't match then "source" would be
# tested. This isn't necessarily supported, so it might change in the future.
sub _apply_regex {

    my %args = @_;

    # If they didn't specify a page or source, default to current page.
    unless ( $args{'page'} || $args{'source'} ) {
        $args{'page'} = $self->current_page;
    }

    # Test the regex against the supplied page or source
    if ( exists $regex{$args{'regex'}} ) {

        if ( $args{'page'} &&
             ( $args{'page'}->decoded_content =~ $regex{$args{'regex'}} ) ) {
            if ( $1 ) { return $1 } else { return 1 };
        }

        if ( $args{'source'} &&
             ( $args{'source'} =~ $regex{$args{'regex'}} ) ) {
            if ( $1 ) { return $1 } else { return 1 };
        }

    }

    # Unknown regex key or no match: explicit false return rather than
    # whatever the last evaluated condition happened to be.
    return;

}

# _use_captcha_killer( $captcha_url, $upload_filename )
#
# Uploads the CAPTCHA image stored in $upload_filename (originally fetched
# from $captcha_url) to the captchakiller.com API using
# $self->captcha_killer_api_key, then polls for the result.
#
# Returns the solved CAPTCHA text, an empty string if no result was obtained
# while polling, or nothing if the upload failed or its reply was not
# recognized.
sub _use_captcha_killer {

    my $api_key = $self->captcha_killer_api_key;
    my ( $captcha_url, $upload_filename ) = @_;

    my $ua = LWP::UserAgent->new;
    $ua->default_headers->push_header('CAPTCHA-Client' => "WWW-Myspace-$VERSION");
    # Let the user agent follow redirects on POST as well.
    push @{ $ua->requests_redirectable }, "POST";

    # Step 1: upload the CAPTCHA and get an ID for it.
    my $response = $ua->post(
        "http://www.captchakiller.com/api.php",
        Content_Type => 'form-data',
        Content => [
            api_key => $api_key,
            method => "upload_captcha",
            captcha_url => $captcha_url,
            expire => ( $self->captcha_tries * 10 ),
            file => [ $upload_filename ]
        ]
    );

    my $captcha_id = "";
    if ( $response->is_success ) {
        my $upload_reply = $response->decoded_content;
        print $upload_reply;
        if ( $upload_reply =~ /SUCCESS: captcha_id=([\w\-]+)/o ) {
            $captcha_id = $1;
            print "GOT CAPTCHA ID: $captcha_id\n";
        } else {
            return; # Can't recognize CAPTCHA
        }
    } else {
        return; # can't upload CAPTCHA?
    }

    # Step 2: poll for the result.
    # NOTE(review): with "<" this loop makes captcha_tries - 1 attempts;
    # confirm whether "<=" was intended. Left unchanged here.
    my $captcha_result = "";
    for ( my $cnt = 1; $cnt < $self->captcha_tries; $cnt++ ) {
        print "ATTEMPT $cnt\n";
        my $poll = $ua->post(
            "http://www.captchakiller.com/api.php",
            Content => [
                api_key => $api_key,
                method => "get_result",
                captcha_id => $captcha_id
            ]
        );

        if ( $poll->is_success ) {
            my $poll_reply = $poll->decoded_content;
            print $poll_reply;

            last if ( $poll_reply =~ /^(ERROR|FAILURE)/o );

            if ( $poll_reply =~ /^SUCCESS: captcha_result=\"(.*)\"$/o ) {
                $captcha_result = $1;
                last;
            }

            # A WAIT reply (or anything unrecognized) falls through to the
            # sleep below. Previously WAIT used "next", which skipped the
            # sleep and re-polled the service immediately.
        }

        sleep 2;
    }

    return $captcha_result;

}

# _handle_captcha( $url )
#
# Downloads the CAPTCHA image at $url into a per-process file in
# $self->cache_dir (up to 5 attempts), passes it to _use_captcha_killer, and
# removes the file afterwards.
#
# Returns the solution from _use_captcha_killer, an empty string if the image
# could not be saved, or nothing if no captcha_killer_api_key is set.
sub _handle_captcha {

    return if ( $self->captcha_killer_api_key eq "" ); # Not handling CAPTCHAs

    my $url = shift;
    print "GOT CAPTCHA URL: $url\n";

    # $$ (the process ID) keeps concurrent processes from sharing a file name.
    my $file = catfile( $self->cache_dir, "captcha$$" );
    print "SAVING INTO FILE: $file\n";

    for ( my $i = 0; $i < 5; $i++ ) {
        $self->mech->get( $url, ':content_file' => $file );
        last if ( -f $file );
        print "FILE TROUBLE: ", Dumper( $file );
    }
    return "" if ( ! -f $file );

    my $solution = $self->_use_captcha_killer( $url, $file );
    unlink ( $file );

    return $solution;

}

sub ____IN_PROGRESS____ {}

=head1 IN PROGRESS

Methods that aren't quite working yet.

=cut

1;

__END__

=head1 AUTHOR

Grant Grueninger, C<< >>
(Bug reports sent to this address will probably be lost -
see "BUGS" below to report bugs)

Thanks to:

Tom Kerswill (http://tomkerswill.co.uk) for the friend_url method, which
also inspired the friend_user_name method.

Olaf Alders (http://www.wundersolutions.com) for the human-readable status
codes in send_friend request, for the excellent sample code which provides a
workaround for CAPTCHA responses, and for the friends_from_profile idea.

=head1 KNOWN ISSUES

=over 4

=item -

One of the modules upon which WWW::Myspace depends generates the
following warnings when logging in:

  Day too big - 2932896 > 24855
  Sec too big - 2932896 > 11647
  Day too big - 2932896 > 24855
  Sec too big - 2932896 > 11647

These are harmless but annoying.
See the "date.patch" file included at the root level of the distribution if you want to fix them. =item - Some myspace error pages are not accounted for, such as their new Server Application error page. If you know enough about web development to identify an error page that would return a successful HTTP response code (i.e. returns 200 OK), but then displays an error message, please keep an eye out for such pages. If you get such an error message page, PLEASE EMAIL ME (see BUGS below) the page content so I can account for it. =item - If the text used to verify that the profile page has been loaded changes, get_profile and post_comments will report that the page hasn't been loaded when in fact it has. =item - A user has reported that the module fails to log in with human=>0. We recommend always leaving human=>1 (the default). =item - Your account location must be set to United States for the module to work. It will work with other English-speaking locations, but some methods (such as last_login) will fail if your location causes dates to be displayed in a manner other than month/day/year. =back =head1 TODO Have 'approve_friends' method check GUIDS after first submit to make sure the current page of GUIDS doesn't contain any duplicates. This is to prevent a possible infinite loop that could occur if the submission of the friend requests fails, and also to signal a warning if myspace changes in a way that breaks the method. Add checks to all methods to self-diagnose to detect changes in myspace site that break this module. get_friends needs to throw an error, or at least set error, if it can't return the full list of friends (i.e. if either of the "warn" statements is triggered) get_friends needs to check the number of pages and try to get all of them. Currently if a next button isn't on a page for any reason, the method will think it's retrieved all the friends. Add tests for get_comments. Add Internationalization (i18n) support.
Centralize all regular expressions into _regex and _apply_regex methods. =head1 CONTRIBUTING If you would like to contribute to this module, you can post patches by following the simple 4-step process below. If you end up posting several patches and your code shows a good understanding of the module, we will probably ask you if you'd like to be added as a developer on the project. There are many methods that could be added to this module (profile editing, for example). If you find yourself using the "submit_form" method, it probably means you should write whatever you're editing into a method and post it on RT. See the TODO section above for starters, and be sure to read the next section about how to submit patches for features/fixes. =head1 HOW TO SUBMIT A PATCH To submit a patch for a new feature or a bug fix, please observe the following. Doing so will allow us to implement your patch quickly. Not doing so may delay its implementation or prevent us from implementing your patch at all. - Check out the newest development version from SVN. The command to use is here: http://sourceforge.net/svn/?group_id=163042 (Or see http://sourceforge.net/projects/www-myspace) - Make your changes to that version. * - Create a unified or context diff of the changed file(s): svn diff filename > filename.diff (i.e. svn diff Myspace.pm > Myspace.pm.diff) - Email the output (filename.diff) with comments regarding what the patch implements/fixes to C, or go to the CPAN RT web site (see below) and submit it there. We will apply your patch and run the tests on it. * You can use the checked-out version in your scripts by one of several methods: # Somewhere in your script: use lib '/path/to/svn/checkout/lib'; # Top of your script: #!/usr/bin/perl -w -I/path/to/svn/checkout/lib # Command line: perl -I'/path/to/svn/checkout/lib' =head1 BUGS Please report any bugs or feature requests, or send any patches, to C, or through the web interface at L.
We will be notified, and then you'll automatically be notified of progress on your bug as we make changes. IF YOU USE A MAIL SERVICE (or program) WITH JUNK MAIL FILTERING, especially HOTMAIL or YAHOO, add the bug reporting email address above to your address book so that you can receive status updates. Bug reports are nice, patches are nicer (see "HOW TO SUBMIT A PATCH" above). =head1 SUPPORT You can find documentation for this module with the perldoc command. perldoc WWW::Myspace You can also look for information at: =over 4 =item * AnnoCPAN: Annotated CPAN documentation L =item * CPAN Ratings L =item * RT: CPAN's request tracker L =item * Search CPAN L =back =head1 COPYRIGHT & LICENSE Copyright 2005-2006 Grant Grueninger, all rights reserved. This program is free software; you can redistribute it and/or modify it under the same terms as Perl itself. =cut