xref: /dokuwiki/inc/mail.php (revision ba36e50e218d376617ba001263d7fa7728717209)
1ed7b5f09Sandi<?php
/**
 * Mail functions
 *
 * @license    GPL 2 (http://www.gnu.org/licenses/gpl.html)
 * @author     Andreas Gohr <andi@splitbrain.org>
 */
844f669e9Sandi
// Fall back to the directory above this file as the DokuWiki root when the
// including script has not defined DOKU_INC itself.
if(!defined('DOKU_INC')){
  define('DOKU_INC', realpath(dirname(__FILE__).'/../').'/');
}
require_once(DOKU_INC.'inc/utf8.php');

// End of line for mail header lines - RFC822 says CRLF but postfix (and other
// MTAs?) think different. Can be overridden by defining it before this file
// is loaded.
if(!defined('MAILHEADER_EOL')){
  define('MAILHEADER_EOL', "\n");
}
// Enable to have non-ASCII subjects and recipient names deaccented/stripped
// instead of being sent as UTF-8 encoded-words.
#define('MAILHEADER_ASCIIONLY',1);
1644f669e9Sandi
/**
 * UTF-8 autoencoding replacement for PHPs mail function
 *
 * Email address fields (To, From, Cc, Bcc) can contain a text part and an
 * address like this: 'Andreas Gohr <andi@splitbrain.org>' - the text part is
 * encoded automatically. You can separate receivers by commas.
 *
 * A non-ASCII subject is sent as an RFC 2047 "Q" encoded-word, the body is
 * always sent quoted-printable encoded and declared as UTF-8 text/plain.
 *
 * @param string $to      Receiver of the mail (multiple separated by commas)
 * @param string $subject Mailsubject
 * @param string $body    Messagebody
 * @param string $from    Sender address
 * @param string $cc      CarbonCopy receiver (multiple separated by commas)
 * @param string $bcc     BlindCarbonCopy receiver (multiple separated by commas)
 * @param string $headers Additional Headers (separated by MAILHEADER_EOL),
 *                        appended unchanged after the generated headers
 * @param string $params  Additional Sendmail params (passed to mail())
 * @return bool           the return value of mail(); warnings raised by mail()
 *                        are suppressed
 *
 * @author Andreas Gohr <andi@splitbrain.org>
 * @see    mail()
 */
function mail_send($to, $subject, $body, $from='', $cc='', $bcc='', $headers=null, $params=null){
  if(defined('MAILHEADER_ASCIIONLY')){
    $subject = utf8_deaccent($subject);
    $subject = utf8_strip($subject);
  }

  if(!utf8_isASCII($subject)) {
    $encoded = mail_quotedprintable_encode($subject,0);
    // Inside an RFC 2047 encoded-word '?' terminates the word and '_' stands
    // for a space, so literal ones have to be hex-escaped first. Afterwards
    // spaces (not allowed in an encoded-word) get the '_' shorthand. The
    // replacements are applied in array order, so the '_' produced for spaces
    // is not escaped again.
    $encoded = str_replace(array('?','_',' '), array('=3F','=5F','_'), $encoded);
    $subject = '=?UTF-8?Q?'.$encoded.'?=';
  }

  // No named recipients for To: in Windows (see FS#652)
  $usenames = (strtoupper(substr(PHP_OS, 0, 3)) !== 'WIN');
  $to = mail_encode_address($to,'',$usenames);

  // mail_encode_address() returns complete, EOL-terminated header lines (or
  // null when no usable address was given), so they can simply be concatenated
  $header  = '';
  $header .= mail_encode_address($from,'From');
  $header .= mail_encode_address($cc,'Cc');
  $header .= mail_encode_address($bcc,'Bcc');
  $header .= 'MIME-Version: 1.0'.MAILHEADER_EOL;
  $header .= 'Content-Type: text/plain; charset=UTF-8'.MAILHEADER_EOL;
  $header .= 'Content-Transfer-Encoding: quoted-printable'.MAILHEADER_EOL;
  $header .= $headers;
  $header  = trim($header);

  $body = mail_quotedprintable_encode($body);

  // only hand the fifth argument to mail() when params were actually given
  if($params == null){
    return @mail($to,$subject,$body,$header);
  }else{
    return @mail($to,$subject,$body,$header,$params);
  }
}
7144f669e9Sandi
/**
 * Encodes an email address header
 *
 * Takes a comma separated list of recipients, each either a bare address or
 * 'Some Name <address>'. Non-ASCII names are encoded as RFC 2047 "Q"
 * encoded-words (or deaccented and stripped first when MAILHEADER_ASCIIONLY
 * is defined). Addresses may not contain Non-ASCII data! Empty entries are
 * skipped silently; non-ASCII or invalid addresses are reported through
 * msg() and skipped.
 *
 * Example:
 *   mail_encode_address("föö <foo@bar.com>, me@somewhere.com","TBcc");
 *
 * @param string  $string Multiple addresses separated by commas
 * @param string  $header Name of the header (To,Bcc,Cc,...)
 * @param boolean $names  Allow named Recipients?
 * @return string|null    the encoded address list; when $header is given it
 *                        is a complete 'Header: ...' line terminated by
 *                        MAILHEADER_EOL. null if no usable address was found
 */
function mail_encode_address($string,$header='',$names=true){
  $headers = '';
  $parts = explode(',',$string);
  foreach ($parts as $part){
    $part = trim($part);

    // start every recipient without a name, otherwise a bare address would
    // inherit the name of the recipient parsed before it
    $text = '';

    // parse address
    if(preg_match('#(.*?)<(.*?)>#',$part,$matches)){
      $text = trim($matches[1]);
      $addr = $matches[2];
    }else{
      $addr = $part;
    }

    // skip empty ones
    if(empty($addr)){
      continue;
    }

    // FIXME: is there a way to encode the localpart of a emailaddress?
    if(!utf8_isASCII($addr)){
      msg(htmlspecialchars("E-Mail address <$addr> is not ASCII"),-1);
      continue;
    }

    if(!mail_isvalid($addr)){
      msg(htmlspecialchars("E-Mail address <$addr> is not valid"),-1);
      continue;
    }

    // text was given
    if(!empty($text) && $names){
      // add address quotes
      $addr = "<$addr>";

      if(defined('MAILHEADER_ASCIIONLY')){
        $text = utf8_deaccent($text);
        $text = utf8_strip($text);
      }

      if(!utf8_isASCII($text)){
        $encoded = mail_quotedprintable_encode($text,0);
        // '?' and '_' are special inside an RFC 2047 encoded-word and spaces
        // are not allowed there: escape the former, use '_' for the latter
        // (replacements run in array order, so the new '_' stay untouched)
        $encoded = str_replace(array('?','_',' '), array('=3F','=5F','_'), $encoded);
        $text = '=?UTF-8?Q?'.$encoded.'?=';
      }
    }else{
      // names not wanted (or none given): send the bare address only
      $text = '';
    }

    // add to header comma separated and in new line to avoid too long headers
    if($headers != '') $headers .= ','.MAILHEADER_EOL.' ';
    // note: with an empty name the entry is a space followed by the address
    $headers .= $text.' '.$addr;
  }

  if(empty($headers)) return null;

  //if headername was given add it and close correctly
  if($header) $headers = $header.': '.$headers.MAILHEADER_EOL;

  return $headers;
}
14544f669e9Sandi
// patterns for use in email detection and validation
// NOTE: there is an unquoted '/' in RFC2822_ATEXT, it must remain unquoted to be used in the parser
//       the pattern uses non-capturing groups as captured groups aren't allowed in the parser
//       select pattern delimiters with care!
if (!defined('RFC2822_ATEXT')) define('RFC2822_ATEXT',"0-9A-Za-z!#$%&'*+/=?^_`{|}~-");
// local part: dot separated runs of atext; domain: one or more labels followed
// by an alphabetic top level domain of 2 to 63 characters (63 being the
// maximum length of a DNS label)
if (!defined('PREG_PATTERN_VALID_EMAIL')) define('PREG_PATTERN_VALID_EMAIL', '['.RFC2822_ATEXT.']+(?:\.['.RFC2822_ATEXT.']+)*@(?:[0-9A-Za-z][0-9A-Za-z-]*\.)+[A-Za-z]{2,63}');

/**
 * Uses a regular expression to check if a given mail address is valid
 *
 * May not be completely RFC conform!
 * @link    http://www.faqs.org/rfcs/rfc2822.html    (paras 3.4.1 & 3.2.4)
 *
 * @author  Chris Smith <chris@jalakai.co.uk>
 *
 * @param   string $email the address to check
 * @return  bool          true if address is valid
 */
function mail_isvalid($email){
  // The D modifier makes '$' match at the very end only. Without it an
  // address followed by a newline would be accepted and could later be used
  // to smuggle extra lines into a mail header.
  return preg_match('<^'.PREG_PATTERN_VALID_EMAIL.'$>D', $email) === 1;
}
16844f669e9Sandi
/**
 * Callback for mail_quotedprintable_encode()
 *
 * @param  array $match preg match, $match[0] is the single byte to encode
 * @return string       the byte as quoted-printable escape (=XX, upper case hex)
 */
function _mail_quotedprintable_hex($match){
  return sprintf('=%02X', ord($match[0]));
}

/**
 * Quoted printable encoding
 *
 * The text is split at line breaks (CRLF, CR or LF), every line is encoded on
 * its own and the lines are joined again with MAILHEADER_EOL. Bytes outside
 * the printable ASCII range and '=' are replaced by =XX escapes.
 *
 * @author umu <umuAThrz.tu-chemnitz.de>
 * @link   http://www.php.net/manual/en/function.imap-8bit.php#61216
 *
 * @param  string $sText              the text to encode
 * @param  int    $maxlen             maximum length of an encoded line before
 *                                    a soft line break is inserted, 0 disables
 *                                    soft line breaks
 * @param  bool   $bEmulate_imap_8bit behave like imap_8bit(): encode tabs
 *                                    everywhere and leave a space or tab at
 *                                    the very end of the text unencoded
 * @return string                     the encoded text
 */
function mail_quotedprintable_encode($sText,$maxlen=74,$bEmulate_imap_8bit=true) {
  // split text into lines
  $aLines = preg_split("/(?:\r\n|\r|\n)/", $sText);
  $iLastLine = count($aLines) - 1;

  // imap_8bit encodes x09 everywhere, not only at lineends,
  // for EBCDIC safeness encode !"#$@[\]^`{|}~,
  // for complete safeness encode every character :)
  if ($bEmulate_imap_8bit) {
    $sRegExp = '/[^\x20\x21-\x3C\x3E-\x7E]/';
  } else {
    $sRegExp = '/[^\x09\x20\x21-\x3C\x3E-\x7E]/';
  }

  for ($i=0; $i<=$iLastLine; $i++) {
    $sLine = $aLines[$i];
    if (strlen($sLine)===0) continue; // do nothing, if empty

    // a callback is used instead of the /e modifier, which PHP 7 removed
    $sLine = preg_replace_callback($sRegExp, '_mail_quotedprintable_hex', $sLine);

    // encode x09,x20 at lineends
    // imap_8bit does not encode x20 at the very end of a text, so the last
    // line is left alone when emulating it (RFC2045 would want it encoded)
    if (!($bEmulate_imap_8bit && ($i==$iLastLine))) {
      $iLastChar = ord($sLine[strlen($sLine)-1]);
      if ($iLastChar==0x09) {
        $sLine = substr($sLine,0,-1).'=09';
      } elseif ($iLastChar==0x20) {
        $sLine = substr($sLine,0,-1).'=20';
      }
    }

    // imap_8bit encodes x20 before chr(13), too
    // although IMHO not requested by RFC2045, why not do it safer :)
    if ($bEmulate_imap_8bit) {
      $sLine = str_replace(' =0D','=20=0D',$sLine);
    }

    // finally split into softlines no longer than $maxlen chars:
    // each chunk is up to $maxlen-2 arbitrary chars plus up to two chars that
    // are not '=', so a chunk never ends in the middle of an =XX escape.
    // for even more safeness one could encode x09,x20
    // at the very first character of the line
    // and after soft linebreaks, as well,
    // but this wouldn't be caught by such an easy RegExp
    if($maxlen){
      // never let the quantifier drop below 1, that would be an invalid regexp
      $iChunk = max(1, $maxlen - 2);
      preg_match_all('/.{1,'.$iChunk.'}([^=]{0,2})?/', $sLine, $aMatch);
      $sLine = implode('='.MAILHEADER_EOL, $aMatch[0]); // add soft crlf's
    }

    $aLines[$i] = $sLine;
  }

  // join lines into text
  return implode(MAILHEADER_EOL,$aLines);
}
23444f669e9Sandi
235340756e4Sandi
//Setup VIM: ex: et ts=2 enc=utf-8 :
237