aboutsummaryrefslogtreecommitdiffstats
path: root/test/lua/unit/url.lua
blob: a593ac15385c41d44868d79d39ce3d82a65f7d80 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
-- URL parser tests

context("URL check functions", function()
  local mpool = require("rspamd_mempool")
  local ffi = require("ffi")
  
  ffi.cdef[[
  struct rspamd_url {
  char *string;
  int protocol;

  int ip_family;

  char *user;
  char *password;
  char *host;
  char *port;
  char *data;
  char *query;
  char *fragment;
  char *post;
  char *surbl;

  struct rspamd_url *phished_url;

  unsigned int protocollen;
  unsigned int userlen;
  unsigned int passwordlen;
  unsigned int hostlen;
  unsigned int portlen;
  unsigned int datalen;
  unsigned int querylen;
  unsigned int fragmentlen;
  unsigned int surbllen;

  /* Flags */
  int ipv6;  /* URI contains IPv6 host */
  int form;  /* URI originated from form */
  int is_phished; /* URI maybe phishing */
  };
  struct rspamd_config;
  struct rspamd_url* rspamd_url_get_next (void *pool,
    const char *start, char const **pos);
  void * rspamd_mempool_new (unsigned long size);
  void rspamd_url_init (const char *tld_file);
  ]]
  
  test("Extract urls from text", function()
    local pool = ffi.C.rspamd_mempool_new(4096)
    local cases = {
      {"test.com text", {"test.com", nil}},
      {"mailto:A.User@example.com text", {"example.com", "A.User"}},
      {"http://Тест.Рф:18 text", {"тест.рф", nil}},
      {"http://user:password@тест2.РФ:18 text", {"тест2.рф", "user"}},
    }
    
    ffi.C.rspamd_url_init(nil)
    
    for _,c in ipairs(cases) do
      local res = ffi.C.rspamd_url_get_next(pool, c[1], nil)
      
      assert_not_nil(res, "cannot parse " .. c[1])
      assert_equal(c[2][1], ffi.string(res.host, res.hostlen))
      
      if c[2][2] then
        assert_equal(c[2][2], ffi.string(res.user, res.userlen))
      end
    end
  end)
end)