



Copyright 2009 Dominic Sayers 

This source file is subject to the Common Public Attribution License Version 1.0 (CPAL) license. 
The license terms are available on the world-wide web from the Open Source Initiative (opensource.org, license identifier CPAL-1.0).
/**
 * Check whether a string is a syntactically valid email address.
 *
 * The address is split at its LAST at-sign into a "local part" and a
 * "domain part". The local part is checked for length, dot placement and
 * unescaped excluded characters. The domain part is checked either as a
 * bracketed address literal (IPv4, IPv6, or IPv6 with a trailing IPv4
 * address, per RFC5321 section 4.1.3) or as a host name (letters, digits
 * and hyphens only, at least two labels, no trailing dot, TLD not
 * all-numeric).
 *
 * @param string $email    The address to validate.
 * @param bool   $checkDNS When true and checkdnsrr() is available, a
 *                         host-name domain must also resolve to an A or
 *                         MX record. Address literals are never looked up.
 *
 * @return bool True when every check passes, false otherwise.
 */
function is_email ($email, $checkDNS = false) {
    //    Contemporary email addresses consist of a "local part" separated from
    //    a "domain part" (a fully-qualified domain name) by an at-sign ("@").
    $index = strrpos($email, '@');

    if ($index === false)       return false;    //    No at-sign
    if ($index === 0)           return false;    //    No local part
    if ($index > 64)            return false;    //    Local part too long

    $localPart    = substr($email, 0, $index);
    $domain       = substr($email, $index + 1);
    $domainLength = strlen($domain);

    if ($domainLength === 0)    return false;    //    No domain part
    if ($domainLength > 255)    return false;    //    Domain part too long

    //    Let's check the local part for RFC compliance...
    //    Period (".") may...appear, but may not be used to start or end the
    //    local part, nor may two or more consecutive periods appear.
    if (preg_match('/^\\.|\\.\\.|\\.$/', $localPart) > 0) {
        return false;    //    Dots in wrong place
    }

    //    Any ASCII graphic (printing) character other than the
    //    at-sign ("@"), backslash, double quote, comma, or square brackets may
    //    appear without quoting.  If any of that list of excluded characters
    //    are to appear, they must be quoted
    if (preg_match('/^"(?:.)*"$/', $localPart) > 0) {
        //    Local part is a quoted string
        if (preg_match('/(?:.)+[^\\\\]"(?:.)+/', $localPart) > 0) {
            return false;    //    Unescaped quote character inside quoted string
        }
    } else {
        if (preg_match('/[ @\\[\\]\\\\",]/', $localPart) > 0) {
            //    Check all excluded characters are escaped. Both statements
            //    belong inside this branch: $stripped only exists when an
            //    excluded character was actually found.
            $stripped = preg_replace('/\\\\[ @\\[\\]\\\\",]/', '', $localPart);
            if (preg_match('/[ @\\[\\]\\\\",]/', $stripped) > 0) {
                return false;    //    Unquoted excluded characters
            }
        }
    }

    //    Now let's check the domain part...

    //    The domain name can also be replaced by an IP address in square brackets
    if (preg_match('/^\\[(.)+]$/', $domain) === 1) {
        //    It's an address-literal
        $addressLiteral = substr($domain, 1, $domainLength - 2);
        $matchesIP      = array();

        //    Extract IPv4 part from the end of the address-literal (if there is one)
        if (preg_match('/\\b(?:(?:25[0-5]|2[0-4][0-9]|[01]?[0-9][0-9]?)\\.){3}(?:25[0-5]|2[0-4][0-9]|[01]?[0-9][0-9]?)$/', $addressLiteral, $matchesIP) > 0) {
            $index = strrpos($addressLiteral, $matchesIP[0]);

            if ($index === 0) {
                //    Nothing there except a valid IPv4 address, so...
                return true;
            }

            //    Assume it's an attempt at a mixed address (IPv6 + IPv4)
            if ($addressLiteral[$index - 1] !== ':')          return false;    //    Character preceding IPv4 address must be ':'
            if (substr($addressLiteral, 0, 5) !== 'IPv6:')    return false;    //    RFC5321 section 4.1.3

            //    Keep only the IPv6 groups that precede the IPv4 tail; when the
            //    tail directly follows "IPv6:::" the IPv6 portion is just "::".
            $IPv6     = substr($addressLiteral, 5, ($index === 7) ? 2 : $index - 6);
            $groupMax = 6;
        } else {
            //    It must be an attempt at pure IPv6
            if (substr($addressLiteral, 0, 5) !== 'IPv6:')    return false;    //    RFC5321 section 4.1.3
            $IPv6     = substr($addressLiteral, 5);
            $groupMax = 8;
        }

        //    Each match is one group; anything that is not a well-formed group
        //    is captured character-by-character in sub-pattern 1.
        $groupCount = preg_match_all('/^[0-9a-fA-F]{0,4}|\\:[0-9a-fA-F]{0,4}|(.)/', $IPv6, $matchesIP);
        $index      = strpos($IPv6, '::');

        if ($index === false) {
            //    We need exactly the right number of groups
            if ($groupCount !== $groupMax)                    return false;    //    RFC5321 section 4.1.3
        } else {
            if ($index !== strrpos($IPv6, '::'))              return false;    //    More than one '::'
            $groupMax = ($index === 0 || $index === (strlen($IPv6) - 2)) ? $groupMax : $groupMax - 1;
            if ($groupCount > $groupMax)                      return false;    //    Too many IPv6 groups in address
        }

        //    Check for unmatched characters: sorting descending brings any
        //    non-empty capture to the front of the list.
        array_multisort($matchesIP[1], SORT_DESC);
        if ($matchesIP[1][0] !== '')                          return false;    //    Illegal characters in address

        //    It's a valid IPv6 address, so...
        return true;
    }

    //    It's a domain name...

    //    The syntax of a legal Internet host name was specified in RFC-952
    //    One aspect of host name syntax is hereby changed: the
    //    restriction on the first character is relaxed to allow either a
    //    letter or a digit.
    //    NB RFC 1123 updates RFC 1035, but this is not currently apparent from reading RFC 1035.
    //    Most common applications, including email and the Web, will generally not permit...escaped strings
    //    Characters outside the set of alphabetic characters, digits, and hyphen MUST NOT appear in domain name
    //    labels for SMTP clients or servers
    //    RFC5321 precludes the use of a trailing dot in a domain name for SMTP purposes
    $matches = array();
    preg_match_all('/(?:[0-9a-zA-Z][0-9a-zA-Z-]{0,61}[0-9a-zA-Z]|[a-zA-Z])(?:\\.|$)|(.)/', $domain, $matches);
    $level = count($matches[0]);

    if ($level === 1)                                         return false;    //    Mail host can't be a TLD

    $TLD = $matches[0][$level - 1];
    if (substr($TLD, strlen($TLD) - 1, 1) === '.')            return false;    //    TLD can't end in a dot
    if (preg_match('/^[0-9]+$/', $TLD) > 0)                   return false;    //    TLD can't be all-numeric

    //    Check for unmatched characters
    array_multisort($matches[1], SORT_DESC);
    if ($matches[1][0] !== '')                                return false;    //    Illegal characters in domain, or label longer than 63 characters

    //    Check DNS?
    if ($checkDNS && function_exists('checkdnsrr')) {
        if (!(checkdnsrr($domain, 'A') || checkdnsrr($domain, 'MX'))) {
            return false;    //    Domain doesn't actually exist
        }
    }

    //    Eliminate all other factors, and the one which remains must be the truth.
    //        (Sherlock Holmes, The Sign of Four)
    return true;
}

/**
 * Run is_email() on one address and describe the outcome as an HTML line.
 *
 * An empty $reason means the address is expected to be valid; a non-empty
 * $reason means it is expected to be rejected, and the text is appended to
 * the report. A result that differs from the expectation is flagged in bold.
 *
 * @param string $email  The address to validate.
 * @param string $reason Why the address should be invalid, or '' if it
 *                       should be valid.
 *
 * @return string One line of HTML ending in "<br />" and a newline.
 */
function unitTest ($email, $reason = '') {
    $expected   = ($reason === '');
    $valid      = is_email($email);
    $not        = ($valid) ? '' : ' not';
    $unexpected = ($valid !== $expected) ? ' <b>This was unexpected!</b>' : '';
    $reasonText = ($reason === '') ? "" : " Reason: $reason";

    return "The address <i>$email</i> is$not valid.$unexpected$reasonText<br />\n";
}

//    Email validator test cases (Dominic Sayers, January 2009)
//
//    Each call prints one HTML line. A second argument marks the address as
//    expected-invalid and gives the reason; without it the address is expected
//    to be valid.
//
//    NOTE(review): many literals below are empty or look truncated (for example
//    '' listed as a valid address, or '[]' as an address literal). The
//    addresses appear to have been stripped before this file was saved, so
//    those cases will be reported as unexpected - confirm against the
//    upstream test suite before relying on them.

//    Valid addresses
echo unitTest('');
echo unitTest('');
echo unitTest('"first last"');
echo unitTest('"first\\"last"');    //    Not totally sure whether this is valid or not
echo unitTest('first\\');
echo unitTest('"first@last"');
echo unitTest('first\\\\');    //    Note that \ is escaped even in single-quote strings, so this is testing "first\\last"
//    NOTE(review): this literal was cut off mid-string in the saved file. It is
//    completed here to a 255-character domain (the longest is_email() accepts),
//    mirroring the 256-character invalid case further down - confirm.
echo unitTest('first.last@' . str_repeat('x23456789.', 25) . 'x2345');
echo unitTest('first.last@[]');
echo unitTest('first.last@[IPv6:::]');
echo unitTest('first.last@[IPv6:1111:2222:3333::4444:]');
echo unitTest('first.last@[IPv6:1111:2222:3333:4444:5555:6666:]');
echo unitTest('first.last@[IPv6:::1111:2222:3333:4444:5555:6666]');
echo unitTest('first.last@[IPv6:1111:2222:3333::4444:5555:6666]');
echo unitTest('first.last@[IPv6:1111:2222:3333:4444:5555:6666::]');
echo unitTest('first.last@[IPv6:1111:2222:3333:4444:5555:6666:7777:8888]');
echo unitTest('');
echo unitTest('');
echo unitTest('');

//    Invalid addresses
echo unitTest('first.last', "No @");
echo unitTest('', "No local part");
echo unitTest('', "Local part more than 64 characters");
echo unitTest('', "Local part starts with a dot");
echo unitTest('', "Local part ends with a dot");
echo unitTest('', "Local part has consecutive dots");
echo unitTest('"first"last"', "Local part contains unescaped excluded characters");
echo unitTest('first\\\\', "Local part contains unescaped excluded characters");
echo unitTest('first.last@', "No domain");
//    256-character domain, built without the stray line break that had crept
//    into the middle of the literal.
echo unitTest('first.last@' . str_repeat('x23456789.', 25) . 'x23456', "Domain exceeds 255 chars");
echo unitTest('first.last@[.]', "Only char that can precede IPv4 address is ':'");
echo unitTest('first.last@[]', "Can't be interpreted as IPv4 so IPv6 tag is missing");
echo unitTest('first.last@[::]', "IPv6 tag is missing");
echo unitTest('first.last@[IPv5:::]', "IPv6 tag is wrong");
echo unitTest('first.last@[IPv6:1111:2222:3333::4444:5555:]', "Too many IPv6 groups (4 max)");
echo unitTest('first.last@[IPv6:1111:2222:3333:4444:5555:]', "Not enough IPv6 groups");
echo unitTest('first.last@[IPv6:1111:2222:3333:4444:5555:6666:7777:]', "Too many IPv6 groups (6 max)");
echo unitTest('first.last@[IPv6:1111:2222:3333:4444:5555:6666:7777]', "Not enough IPv6 groups");
echo unitTest('first.last@[IPv6:1111:2222:3333:4444:5555:6666:7777:8888:9999]', "Too many IPv6 groups (8 max)");
echo unitTest('first.last@[IPv6:1111:2222::3333::4444:5555:6666]', "Too many '::' (can be none or one)");
echo unitTest('first.last@[IPv6:1111:2222:3333::4444:5555:6666:7777]', "Too many IPv6 groups (6 max)");
echo unitTest('first.last@[IPv6:1111:2222:333x::4444:5555]', "x is not valid in an IPv6 address");
echo unitTest('first.last@[IPv6:1111:2222:33333::4444:5555]', "33333 is not a valid group in an IPv6 address");
echo unitTest('first.last@example.123', "TLD can't be all digits");
echo unitTest('first.last@com', "Mail host must be second- or lower level");
echo unitTest('', "Label can't begin with a hyphen");
echo unitTest('', "Label can't end with a hyphen");
echo unitTest('', "Label can't be longer than 63 octets");

//    Test cases from RFC3696 (February 2004)
echo unitTest('Abc\\');
echo unitTest('Fred\\');
echo unitTest('Joe.\\\\');
echo unitTest('"Abc@def"');
echo unitTest('"Fred Bloggs"');
echo unitTest('');
echo unitTest('customer/');
echo unitTest('$');
echo unitTest('!def!');
echo unitTest('');

//    Test cases from Doug Lovell (LinuxJournal, June 2007)
echo unitTest("");
echo unitTest("abc\\");
echo unitTest("abc\\\\");
echo unitTest("Fred\\");
echo unitTest("Joe.\\\\");
echo unitTest("\"Abc@def\"");
echo unitTest("\"Fred Bloggs\"");
echo unitTest("customer/");
echo unitTest("\$");
echo unitTest("!def!");
echo unitTest("");
echo unitTest("");
echo unitTest("");
echo unitTest("Doug\\ \\\"Ace\\\"\\");
echo unitTest("\"Doug \\\"Ace\\\" L.\"");
echo unitTest("", "Doug Lovell says this should fail");
echo unitTest("abc\\\\", "Doug Lovell says this should fail");
echo unitTest("abc\\", "Doug Lovell says this should fail");
echo unitTest("", "Doug Lovell says this should fail");
echo unitTest("doug@", "Doug Lovell says this should fail");
echo unitTest("\"", "Doug Lovell says this should fail");
echo unitTest("ote\"", "Doug Lovell says this should fail");
echo unitTest("", "Doug Lovell says this should fail");
echo unitTest("", "Doug Lovell says this should fail");
echo unitTest("", "Doug Lovell says this should fail");
echo unitTest("\"Doug \"Ace\" L.\"", "Doug Lovell says this should fail");
echo unitTest("Doug\\ \\\"Ace\\\"\\ L\\", "Doug Lovell says this should fail");
echo unitTest("hello", "Doug Lovell says this should fail");
echo unitTest("", "Doug Lovell says this should fail");


php RFC兼容的电子邮件地址验证的更多相关文章

  1. PHP正则表达式 验证电子邮件地址

    我们最经常遇到的验证,就是电子邮件地址验证.网站上常见.各种网页脚本也都常用“正则表达式”(regular expression)对我们输入的电子邮件地址进行验证,判断是否合法.有的还能分解出用户名和 ...

  2. C++11标准 STL正则表达式 验证电子邮件地址

    转自: 我们最经常遇到的验证,就是电子邮件地址验证.网站上常见.各种网页 ...

  3. shell(sed/gawk)脚本(计算目录文件/验证电话号码/解析电子邮件地址)

    1.计算目录文件 #!/bin/bash mypath=`echo $PATH | sed 's/:/ /g'`#注意` ` 和 ‘ ’ count= for directory in $mypath ...

  4. 验证-- email类型输入框(电子邮件地址)--multiple

    如果需要一个用来填写电子邮件地址的输入框,可以使用email类型.这样浏览器可以帮我们验证格式是否正确,而不需要自己写验证规则.原文:HTML5新控件 - email类型输入框(电子邮件地址) 1,只 ...

  5. [Swift]LeetCode929. 独特的电子邮件地址 | Unique Email Addresses

    Every email consists of a local name and a domain name, separated by the @ sign. For example, in ali ...

  6. 【LeetCode】Unique Email Addresses(独特的电子邮件地址)

    这道题是LeetCode里的第929道题. 题目要求: 每封电子邮件都由一个本地名称和一个域名组成,以 @ 符号分隔. 例如,在 alice@leetcode.com中, alice 是本地名称,而  ...

  7. 【leecode】独特的电子邮件地址

    每封电子邮件都由一个本地名称和一个域名组成,以 @ 符号分隔. 例如,在 alice@leetcode.com中, alice 是本地名称,而 leetcode.com 是域名. 除了小写字母,这些电 ...

  8. leetCode 929 独特的电子邮件地址

    题目: 每封电子邮件都由一个本地名称和一个域名组成,以 @ 符号分隔. 例如,在 alice@leetcode.com中, alice 是本地名称,而 leetcode.com 是域名. 除了小写字母 ...

  9. Leetcode929.Unique Email Addresses独特的电子邮件地址

    每封电子邮件都由一个本地名称和一个域名组成,以 @ 符号分隔. 例如,在 alice@leetcode.com中, alice 是本地名称,而 leetcode.com 是域名. 除了小写字母,这些电 ...


  1. js将秒数换算成时分秒

    转载自: <script language="javascr ...

  2. invalid comparison: java.util.ArrayList and java.lang.String——bug解决办法

    今天碰到个问题,解决了很久才搞定,来记录下,希望可以帮助到大家 贴错误源码: 这是一个根据list集合的查找数据的 sql,在接收list的时候加了判断 list != ‘ ’ “”,引起了集合与St ...

  3. pipe_wait问题_转

    转自:调用Process.waitfor导致的进程挂起 最近遇到pipe_wait问题,父进程调用子进程时,子进程阻塞,cat /proc/$child/wchan输出pipe_wait,进程阻塞在p ...

  4. wget命令 -c断点续传

    wget -O 下载文件在指定位置并进行重命名 -O file       - ...

  5. flask 邮箱配置 先进入邮箱设置 POP3/SMTP/IMAP 下面代码来自知乎 https://www.z ...

  6. 成功抓取csdn阅读量过万博文 var commentscount = 1; 嵌套的评论算一条,这个可能有 ...

  7. 第一百五十节,封装库--JavaScript,表单验证--密码验证

    封装库--JavaScript,表单验证--密码验证 效果图 html <div id="reg"> <h2 class="tuo">& ...

  8. 第一百四十五节,JavaScript,同步动画

    JavaScript,同步动画 将上一节的,移动透明动画,修改成可以支持同步动画,也就是可以给这个动画方法多个动画任务,让它同时完成 原理: 向方法里添加一个属性,这个属性是一个对象,同步动画属性,属 ...

  9. hdu 5078

    Osu! Time Limit: 2000/1000 MS (Java/Others)    Memory Limit: 262144/262144 K (Java/Others) Total Sub ...

  10. sudo -E的意思

    1.sudo -E -E选项在man page中的解释是: -E The -E (preserve environment) option indicates to the security poli ...