summaryrefslogtreecommitdiff
path: root/spec/rubyspec/library/uri/extract_spec.rb
blob: 7b660851b6d1e063ea7af9ed41064b84d40d011a (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
require File.expand_path('../../../spec_helper', __FILE__)
require 'uri'

# Examples covering URI.extract: called with a string (and optionally a list
# of schemes and/or a block), it picks URI-looking substrings out of the text.
describe "URI.extract" do
  # Sample text containing six example URIs, one each for the ftp, gopher,
  # http, mailto, news and telnet schemes. Shared by the multi-URI examples.
  sample_text = "1.3. Example URI

       The following examples illustrate URI that are in common use.

       ftp://ftp.is.co.za/rfc/rfc1808.txt
          -- ftp scheme for File Transfer Protocol services

       gopher://spinaltap.micro.umn.edu/00/Weather/California/Los%20Angeles
          -- gopher scheme for Gopher and Gopher+ Protocol services

       http://www.math.uio.no/faq/compression-faq/part1.html
          -- http scheme for Hypertext Transfer Protocol services

       mailto:mduerst@ifi.unizh.ch
          -- mailto scheme for electronic mail addresses

       news:comp.infosystems.www.servers.unix
          -- news scheme for USENET news groups and articles

       telnet://melvyl.ucop.edu/
          -- telnet scheme for interactive services via the TELNET Protocol
    "

  it "behaves according to its documentation" do
    text = "text here http://foo.example.org/bla and here mailto:test@example.com and here also."
    expected = %w[http://foo.example.org/bla mailto:test@example.com]

    URI.extract(text).should == expected
  end

  it "treats contiguous URIs as a single URI" do
    # Two URIs with no separator between them come back as one match.
    joined = "http://example.jphttp://example.jp"

    URI.extract(joined).should == [joined]
  end

  it "treats pretty much anything with a colon as a URI" do
    # "From:" is matched, and the trailing "]" stays attached to the mailto match.
    header = "From: XXX [mailto:xxx@xxx.xxx.xxx]"

    URI.extract(header).should == ["From:", "mailto:xxx@xxx.xxx.xxx]"]
  end

  it "wraps a URI string in an array" do
    uri = "http://github.com/brixen/rubyspec/tree/master"

    URI.extract(uri).should == [uri]
  end

  it "pulls a variety of protocol URIs from a string" do
    URI.extract("this is a string, it has http://rubini.us/ in it").should == ["http://rubini.us/"]

    # Each of these inputs consists of exactly one URI, so the result is the
    # input wrapped in an array. The last scheme is not a registered one.
    lone_uris = %w[
      mailto:spambait@example.com
      ftp://ruby-lang.org/
      https://mail.google.com
      anything://example.com/
    ]
    lone_uris.each do |uri|
      URI.extract(uri).should == [uri]
    end
  end

  it "pulls all URIs within a string in order into an array when a block is not given" do
    expected = %w[
      ftp://ftp.is.co.za/rfc/rfc1808.txt
      gopher://spinaltap.micro.umn.edu/00/Weather/California/Los%20Angeles
      http://www.math.uio.no/faq/compression-faq/part1.html
      mailto:mduerst@ifi.unizh.ch
      news:comp.infosystems.www.servers.unix
      telnet://melvyl.ucop.edu/
    ]

    URI.extract(sample_text).should == expected
  end

  it "yields each URI in the given string in order to a block, if given, and returns nil" do
    text = "text here http://foo.example.org/bla and here mailto:test@example.com and here also."
    # Consumed front-to-back as the block is called; must be empty afterwards.
    expected_queue = ["http://foo.example.org/bla", "mailto:test@example.com"]

    returned = URI.extract(text) { |uri| uri.should == expected_queue.shift }

    returned.should == nil
    expected_queue.should == []
  end

  it "allows the user to specify a list of acceptable protocols of URIs to scan for" do
    schemes = %w[http ftp mailto]
    # Results follow the order of appearance in the text, not the order of the scheme list.
    expected = %w[
      ftp://ftp.is.co.za/rfc/rfc1808.txt
      http://www.math.uio.no/faq/compression-faq/part1.html
      mailto:mduerst@ifi.unizh.ch
    ]

    URI.extract(sample_text, schemes).should == expected
  end
end