Class WWW::Mechanize::Page
In: lib/www/mechanize/monkey_patch.rb
lib/www/mechanize/page/base.rb
lib/www/mechanize/page/frame.rb
lib/www/mechanize/page/link.rb
lib/www/mechanize/page/meta.rb
lib/www/mechanize/page.rb
Parent: Object
Mechanize\n[lib/www/mechanize.rb\nlib/www/mechanize/chain.rb\nlib/www/mechanize/chain/auth_headers.rb\nlib/www/mechanize/chain/body_decoding_handler.rb\nlib/www/mechanize/chain/connection_resolver.rb\nlib/www/mechanize/chain/custom_headers.rb\nlib/www/mechanize/chain/header_resolver.rb\nlib/www/mechanize/chain/parameter_resolver.rb\nlib/www/mechanize/chain/pre_connect_hook.rb\nlib/www/mechanize/chain/request_resolver.rb\nlib/www/mechanize/chain/response_body_parser.rb\nlib/www/mechanize/chain/response_header_handler.rb\nlib/www/mechanize/chain/response_reader.rb\nlib/www/mechanize/chain/ssl_resolver.rb\nlib/www/mechanize/chain/uri_resolver.rb\nlib/www/mechanize/content_type_error.rb\nlib/www/mechanize/cookie.rb\nlib/www/mechanize/cookie_jar.rb\nlib/www/mechanize/file.rb\nlib/www/mechanize/file_response.rb\nlib/www/mechanize/file_saver.rb\nlib/www/mechanize/form.rb\nlib/www/mechanize/form/button.rb\nlib/www/mechanize/form/check_box.rb\nlib/www/mechanize/form/field.rb\nlib/www/mechanize/form/file_upload.rb\nlib/www/mechanize/form/image_button.rb\nlib/www/mechanize/form/multi_select_list.rb\nlib/www/mechanize/form/option.rb\nlib/www/mechanize/form/radio_button.rb\nlib/www/mechanize/form/select_list.rb\nlib/www/mechanize/headers.rb\nlib/www/mechanize/history.rb\nlib/www/mechanize/monkey_patch.rb\nlib/www/mechanize/page.rb\nlib/www/mechanize/page/base.rb\nlib/www/mechanize/page/frame.rb\nlib/www/mechanize/page/link.rb\nlib/www/mechanize/page/meta.rb\nlib/www/mechanize/pluggable_parsers.rb\nlib/www/mechanize/redirect_limit_reached_error.rb\nlib/www/mechanize/redirect_not_get_or_head_error.rb\nlib/www/mechanize/response_code_error.rb\nlib/www/mechanize/unsupported_scheme_error.rb\nlib/www/mechanize/util.rb] lib/www/mechanize.rb Handler WWW dot/m_52_0.png

Synopsis

This class encapsulates an HTML page. If Mechanize finds a content type of ‘text/html’, this class will be instantiated and returned.

Example

 require 'rubygems'
 require 'mechanize'

 agent = WWW::Mechanize.new
 agent.get('http://google.com/').class  #=> WWW::Mechanize::Page

Methods

bases   content_type   encoding   encoding=   forms   frames   html_body   iframes   links   meta   new   parser   root   title  

Classes and Modules

Class WWW::Mechanize::Page::Base
Class WWW::Mechanize::Page::Frame
Class WWW::Mechanize::Page::Link
Class WWW::Mechanize::Page::Meta

External Aliases

pretty_inspect -> inspect

Attributes

mech  [RW] 

Public Class methods

[Source]

    # File lib/www/mechanize/page.rb, line 25
25:       def initialize(uri=nil, response=nil, body=nil, code=nil, mech=nil)
26:         @encoding = nil
27: 
28:         method = response.respond_to?(:each_header) ? :each_header : :each
29:         response.send(method) do |header,v|
30:           next unless v =~ /charset/i
31:           encoding = v.split('=').last.strip
32:           @encoding = encoding unless encoding == 'none'
33:         end
34: 
35:         # Force the encoding to be 8BIT so we can perform regular expressions.
36:         # We'll set it to the detected encoding later
37:         body.force_encoding('ASCII-8BIT') if defined?(Encoding) && body
38: 
39:         @encoding ||= Util.detect_charset(body)
40: 
41:         super(uri, response, body, code)
42:         @mech           ||= mech
43: 
44:         @encoding = nil if html_body =~ /<meta[^>]*charset[^>]*>/i
45: 
46:         raise Mechanize::ContentTypeError.new(response['content-type']) unless
47:            response['content-type'] =~ /^(text\/html)|(application\/xhtml\+xml)/i
48:         @parser = @links = @forms = @meta = @bases = @frames = @iframes = nil
49:       end

Public Instance methods

[Source]

     # File lib/www/mechanize/page.rb, line 151
151:       def bases
152:         @bases ||=
153:           search('base').map { |node| Base.new(node, @mech, self) }
154:       end

Get the content type

[Source]

    # File lib/www/mechanize/page.rb, line 86
86:       def content_type
87:         response['content-type']
88:       end

[Source]

    # File lib/www/mechanize/page.rb, line 66
66:       def encoding
67:         parser.respond_to?(:encoding) ? parser.encoding : nil
68:       end

[Source]

    # File lib/www/mechanize/page.rb, line 57
57:       def encoding=(encoding)
58:         @encoding = encoding
59: 
60:         if @parser && @parser.encoding.downcase != encoding.downcase
61:           # lazy reinitialize the parser with the new encoding
62:           @parser = nil
63:         end
64:       end

[Source]

     # File lib/www/mechanize/page.rb, line 129
129:       def forms
130:         @forms ||= search('form').map do |html_form|
131:           form = Form.new(html_form, @mech, self)
132:           form.action ||= @uri.to_s
133:           form
134:         end
135:       end

[Source]

     # File lib/www/mechanize/page.rb, line 156
156:       def frames
157:         @frames ||=
158:           search('frame').map { |node| Frame.new(node, @mech, self) }
159:       end

[Source]

     # File lib/www/mechanize/page.rb, line 161
161:       def iframes
162:         @iframes ||= 
163:           search('iframe').map { |node| Frame.new(node, @mech, self) }
164:       end

[Source]

     # File lib/www/mechanize/page.rb, line 121
121:       def links
122:         @links ||= %w{ a area }.map do |tag|
123:           search(tag).map do |node|
124:             Link.new(node, @mech, self)
125:           end
126:         end.flatten
127:       end

[Source]

     # File lib/www/mechanize/page.rb, line 137
137:       def meta
138:         @meta ||= search('meta').map do |node|
139:           next unless node['http-equiv'] && node['content']
140:           (equiv, content) = node['http-equiv'], node['content']
141:           if equiv && equiv.downcase == 'refresh'
142:             Meta.parse(content, uri) do |delay, href|
143:               node['delay'] = delay
144:               node['href'] = href
145:               Meta.new(node, @mech, self)
146:             end
147:           end
148:         end.compact
149:       end

[Source]

    # File lib/www/mechanize/page.rb, line 70
70:       def parser
71:         return @parser if @parser
72: 
73:         if body && response
74:           if mech.html_parser == Nokogiri::HTML
75:             @parser = mech.html_parser.parse(html_body, nil, @encoding)
76:           else
77:             @parser = mech.html_parser.parse(html_body)
78:           end
79:         end
80: 
81:         @parser
82:       end
root()

Alias for parser

[Source]

    # File lib/www/mechanize/page.rb, line 51
51:       def title
52:         @title ||= if parser && search('title').inner_text.length > 0
53:           search('title').inner_text
54:         end
55:       end

Private Instance methods

[Source]

     # File lib/www/mechanize/page.rb, line 168
168:       def html_body
169:         if body
170:           body.length > 0 ? body : '<html></html>'
171:         else
172:           ''
173:         end
174:       end

[Validate]